codebyzeb committed on
Commit
7205efc
·
verified ·
1 Parent(s): 7f0fc5f

Training in progress, step 20000

Browse files
Files changed (5) hide show
  1. config.json +1 -1
  2. model.safetensors +2 -2
  3. tokenizer.json +109 -25
  4. training_args.bin +1 -1
  5. vocab.json +1 -1
config.json CHANGED
@@ -27,5 +27,5 @@
27
  "torch_dtype": "float32",
28
  "transformers_version": "4.44.2",
29
  "use_cache": true,
30
- "vocab_size": 31
31
  }
 
27
  "torch_dtype": "float32",
28
  "transformers_version": "4.44.2",
29
  "use_cache": true,
30
+ "vocab_size": 115
31
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4a555fb95a12d45a694e96ce59d9cf43d69a3e5476b5d3b277ab7f23d8c179c5
3
- size 19257664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42c3ecb6fd8d551111138ba77f01ed049a5b5cb50d1924211d6773c7e249584c
3
+ size 19343680
tokenizer.json CHANGED
@@ -51,7 +51,7 @@
51
  ]
52
  },
53
  "pre_tokenizer": {
54
- "type": "Whitespace"
55
  },
56
  "post_processor": {
57
  "type": "TemplateProcessing",
@@ -115,33 +115,117 @@
115
  "PAD": 1,
116
  "WORD_BOUNDARY": 2,
117
  "UTT_BOUNDARY": 3,
118
- "a": 4,
119
- "i": 5,
120
- "ɾ": 6,
121
- "": 7,
122
  "n": 8,
123
- "k": 9,
124
- "ɲ": 10,
125
- "": 11,
126
- "m": 12,
127
- "s": 13,
128
- "u": 14,
129
  "p": 15,
130
- "d": 16,
131
- "l": 17,
132
- "t": 18,
133
- "β": 19,
134
- "ɡ": 20,
135
  "w": 21,
136
- "ʝ": 22,
137
- "f": 23,
138
- "x": 24,
139
- "j": 25,
140
- "r": 26,
141
- "t̠ʃ": 27,
142
- "ʃ": 28,
143
- "tl": 29,
144
- "ts": 30
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
145
  },
146
  "unk_token": "UNK"
147
  }
 
51
  ]
52
  },
53
  "pre_tokenizer": {
54
+ "type": "WhitespaceSplit"
55
  },
56
  "post_processor": {
57
  "type": "TemplateProcessing",
 
115
  "PAD": 1,
116
  "WORD_BOUNDARY": 2,
117
  "UTT_BOUNDARY": 3,
118
+ "a˧˥": 4,
119
+ "u˧˥": 5,
120
+ "": 6,
121
+ "au": 7,
122
  "n": 8,
123
+ "a˥˩": 9,
124
+ "ʃ̺": 10,
125
+ "ɻ̩˥˩": 11,
126
+ "ə˧˥": 12,
127
+ "m": 13,
128
+ "ɤ": 14,
129
  "p": 15,
130
+ "j": 16,
131
+ "e˧˥": 17,
132
+ "": 18,
133
+ "k": 19,
134
+ "ɤ˥˩": 20,
135
  "w": 21,
136
+ "": 22,
137
+ "t̠ʃ̺ʰ": 23,
138
+ "ə˥": 24,
139
+ "ŋ": 25,
140
+ "t": 26,
141
+ "ʊ˥": 27,
142
+ "ɕ": 28,
143
+ "i": 29,
144
+ "a": 30,
145
+ "l": 31,
146
+ "au˧˩˧": 32,
147
+ "x": 33,
148
+ "u˧˩˧": 34,
149
+ "i˥": 35,
150
+ "ei˧˩˧": 36,
151
+ "pʰ": 37,
152
+ "i˧˥": 38,
153
+ "ai˧˥": 39,
154
+ "ou˧˩˧": 40,
155
+ "ɤ˧˥": 41,
156
+ "o˧˩˧": 42,
157
+ "tɕ": 43,
158
+ "au˥˩": 44,
159
+ "ts": 45,
160
+ "ə˧˩˧": 46,
161
+ "ɤ˥": 47,
162
+ "ei˧˥": 48,
163
+ "ʊ˧˥": 49,
164
+ "i˧˩˧": 50,
165
+ "t̠ʃ̺": 51,
166
+ "ɻ̩˧˩˧": 52,
167
+ "ei˥˩": 53,
168
+ "s": 54,
169
+ "u˥˩": 55,
170
+ "ɹ̪̩": 56,
171
+ "ai˥": 57,
172
+ "u˥": 58,
173
+ "tɕʰ": 59,
174
+ "a˧˩˧": 60,
175
+ "ai˥˩": 61,
176
+ "ɛ˥˩": 62,
177
+ "f": 63,
178
+ "i˥˩": 64,
179
+ "y˥˩": 65,
180
+ "au˧˥": 66,
181
+ "ɻ": 67,
182
+ "ou˥˩": 68,
183
+ "e˥": 69,
184
+ "tʰ": 70,
185
+ "ɹ̪̩˥˩": 71,
186
+ "ɛ˧˥": 72,
187
+ "au˥": 73,
188
+ "ou˧˥": 74,
189
+ "e˧˩˧": 75,
190
+ "ɛ˥": 76,
191
+ "ɻ̩˥": 77,
192
+ "ɥ": 78,
193
+ "ɹ̪̩˧˩˧": 79,
194
+ "ai˧˩˧": 80,
195
+ "ou˥": 81,
196
+ "o˥˩": 82,
197
+ "ɛ˧˩˧": 83,
198
+ "ʊ˧˩˧": 84,
199
+ "ɔ˥": 85,
200
+ "tsʰ": 86,
201
+ "ei": 87,
202
+ "ə˥˩": 88,
203
+ "o": 89,
204
+ "ʊ˥˩": 90,
205
+ "ou": 91,
206
+ "ɤ˧˩˧": 92,
207
+ "o˧˥": 93,
208
+ "ei˥": 94,
209
+ "e˥˩": 95,
210
+ "ɚ˧˩˧": 96,
211
+ "y˥": 97,
212
+ "ɚ˥˩": 98,
213
+ "y˧˥": 99,
214
+ "ɻ̩": 100,
215
+ "y˧˩˧": 101,
216
+ "ɹ̪̩˥": 102,
217
+ "ɻ̩˧˥": 103,
218
+ "u": 104,
219
+ "ə": 105,
220
+ "ai": 106,
221
+ "ʊ": 107,
222
+ "e": 108,
223
+ "ɚ˧˥": 109,
224
+ "ɔ˥˩": 110,
225
+ "ɹ̪̩˧˥": 111,
226
+ "ɛ": 112,
227
+ "y": 113,
228
+ "m˧˥": 114
229
  },
230
  "unk_token": "UNK"
231
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:82b3efe1c353bf704a32a56d3e2d90a521ee074a5be0597867a8e435f00dc496
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:084e0397b40c5e56e7d3df631100c29dc2e74d25bb673e1905a6ce4ebdfd3f52
3
  size 5368
vocab.json CHANGED
@@ -1 +1 @@
1
- {"UNK":0,"PAD":1,"WORD_BOUNDARY":2,"UTT_BOUNDARY":3,"a":4,"i":5,"ɾ":6,"":7,"n":8,"k":9,"ɲ":10,"":11,"m":12,"s":13,"u":14,"p":15,"d":16,"l":17,"t":18,"β":19,"ɡ":20,"w":21,"ʝ":22,"f":23,"x":24,"j":25,"r":26,"t̠ʃ":27,"ʃ":28,"tl":29,"ts":30}
 
1
+ {"UNK":0,"PAD":1,"WORD_BOUNDARY":2,"UTT_BOUNDARY":3,"a˧˥":4,"u˧˥":5,"":6,"au":7,"n":8,"a˥˩":9,"ʃ̺":10,"ɻ̩˥˩":11,"ə˧˥":12,"m":13,"ɤ":14,"p":15,"j":16,"e˧˥":17,"":18,"k":19,"ɤ˥˩":20,"w":21,"":22,"t̠ʃ̺ʰ":23,"ə˥":24,"ŋ":25,"t":26,"ʊ˥":27,"ɕ":28,"i":29,"a":30,"l":31,"au˧˩˧":32,"x":33,"u˧˩˧":34,"i˥":35,"ei˧˩˧":36,"pʰ":37,"i˧˥":38,"ai˧˥":39,"ou˧˩˧":40,"ɤ˧˥":41,"o˧˩˧":42,"tɕ":43,"au˥˩":44,"ts":45,"ə˧˩˧":46,"ɤ˥":47,"ei˧˥":48,"ʊ˧˥":49,"i˧˩˧":50,"t̠ʃ̺":51,"ɻ̩˧˩˧":52,"ei˥˩":53,"s":54,"u˥˩":55,"ɹ̪̩":56,"ai˥":57,"u˥":58,"tɕʰ":59,"a˧˩˧":60,"ai˥˩":61,"ɛ˥˩":62,"f":63,"i˥˩":64,"y˥˩":65,"au˧˥":66,"ɻ":67,"ou˥˩":68,"e˥":69,"tʰ":70,"ɹ̪̩˥˩":71,"ɛ˧˥":72,"au˥":73,"ou˧˥":74,"e˧˩˧":75,"ɛ˥":76,"ɻ̩˥":77,"ɥ":78,"ɹ̪̩˧˩˧":79,"ai˧˩˧":80,"ou˥":81,"o˥˩":82,"ɛ˧˩˧":83,"ʊ˧˩˧":84,"ɔ˥":85,"tsʰ":86,"ei":87,"ə˥˩":88,"o":89,"ʊ˥˩":90,"ou":91,"ɤ˧˩˧":92,"o˧˥":93,"ei˥":94,"e˥˩":95,"ɚ˧˩˧":96,"y˥":97,"ɚ˥˩":98,"y˧˥":99,"ɻ̩":100,"y˧˩˧":101,"ɹ̪̩˥":102,"ɻ̩˧˥":103,"u":104,"ə":105,"ai":106,"ʊ":107,"e":108,"ɚ˧˥":109,"ɔ˥˩":110,"ɹ̪̩˧˥":111,"ɛ":112,"y":113,"m˧˥":114}