KoichiYasuoka committed on
Commit
d154ac6
1 Parent(s): 370ef3b

model improved

Browse files
Files changed (5) hide show
  1. README.md +1 -1
  2. config.json +236 -230
  3. pytorch_model.bin +2 -2
  4. supar.model +2 -2
  5. tokenizer.json +0 -0
README.md CHANGED
@@ -17,7 +17,7 @@ widget:
17
 
18
  ## Model Description
19
 
20
- This is a DeBERTa(V2) model pre-trained on Ainu texts (both カタカナ and romanized) for POS-tagging and dependency-parsing, derived from [deberta-base-ainu](https://huggingface.co/KoichiYasuoka/deberta-base-ainu). Every word is tagged by [UPOS](https://universaldependencies.org/u/pos/) (Universal Part-Of-Speech).
21
 
22
  ## How to Use
23
 
 
17
 
18
  ## Model Description
19
 
20
+ This is a DeBERTa(V2) model pre-trained on Ainu texts (in カタカナ, Roman, and Кириллица) for POS-tagging and dependency-parsing, derived from [deberta-base-ainu](https://huggingface.co/KoichiYasuoka/deberta-base-ainu). Every word is tagged by [UPOS](https://universaldependencies.org/u/pos/) (Universal Part-Of-Speech).
21
 
22
  ## How to Use
23
 
config.json CHANGED
@@ -89,121 +89,120 @@
89
  "77": "B-VERT|\u4ed6\u52d5\u8a5e|_",
90
  "78": "CCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
91
  "79": "CCONJ|\u63a5\u7d9a\u8a5e|_",
92
- "80": "DET|\u81ea\u52d5\u8a5e|_",
93
- "81": "DET|\u9023\u4f53\u8a5e|_",
94
- "82": "DET|\u9023\u4f53\u8a5e|_+NOUN|\u540d\u8a5e|_",
95
- "83": "DET|\u9023\u4f53\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_",
96
- "84": "I-ADP|\u526f\u52a9\u8a5e|_",
97
- "85": "I-ADP|\u5f8c\u7f6e\u526f\u8a5e|_",
98
- "86": "I-ADP|\u683c\u52a9\u8a5e|_",
99
- "87": "I-ADP|\u683c\u52a9\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
100
- "88": "I-ADV|\u526f\u8a5e|_",
101
- "89": "I-ADV|\u9593\u6295\u8a5e|_",
102
- "90": "I-AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_",
103
- "91": "I-AUX|\u52a9\u52d5\u8a5e|_",
104
- "92": "I-AUX|\u52a9\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
105
- "93": "I-AUX|\u52a9\u52d5\u8a5e|_+PART|\u7d42\u52a9\u8a5e|_",
106
- "94": "I-CCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
107
- "95": "I-CCONJ|\u63a5\u7d9a\u8a5e|_",
108
- "96": "I-DET|\u526f\u8a5e|_",
109
- "97": "I-DET|\u9023\u4f53\u8a5e|_",
110
- "98": "I-DET|\u9023\u4f53\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
111
- "99": "I-INFR.EV|\u5f62\u5f0f\u540d\u8a5e|_",
112
- "100": "I-INTJ|\u9593\u6295\u8a5e|_",
113
- "101": "I-NOUN|\u4eba\u79f0\u63a5\u8f9e|_",
114
- "102": "I-NOUN|\u4ee3\u540d\u8a5e|_",
115
- "103": "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
116
- "104": "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_",
117
- "105": "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_+NOUN|\u540d\u8a5e|_",
118
- "106": "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_",
119
- "107": "I-NOUN|\u540d\u8a5e|_",
120
- "108": "I-NOUN|\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_",
121
- "109": "I-NOUN|\u540d\u8a5e|_+ADV|\u526f\u8a5e|_",
122
- "110": "I-NOUN|\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
123
- "111": "I-NOUN|\u540d\u8a5e|_+NOUN|\u540d\u8a5e|_",
124
- "112": "I-NOUN|\u540d\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
125
- "113": "I-NOUN|\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_",
126
- "114": "I-NOUN|\u56fa\u6709\u540d\u8a5e|_",
127
- "115": "I-NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
128
- "116": "I-NUM|\u6570\u8a5e|_",
129
- "117": "I-NUM|\u6570\u8a5e|_+NOUN|\u540d\u8a5e|_",
130
- "118": "I-PART|[\u7d42\u52a9\u8a5e]|_",
131
- "119": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_",
132
- "120": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_",
133
- "121": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
134
- "122": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
135
- "123": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u4ed6\u52d5\u8a5e|_",
136
- "124": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u81ea\u52d5\u8a5e|_",
137
- "125": "I-PART|\u52a9\u52d5\u8a5e|_",
138
- "126": "I-PART|\u63a5\u5c3e\u8f9e|_",
139
- "127": "I-PART|\u63a5\u7d9a\u52a9\u8a5e|_",
140
- "128": "I-PART|\u63a5\u982d\u8f9e|_",
141
- "129": "I-PART|\u7d42\u52a9\u8a5e|_",
142
- "130": "I-PART|\u81ea\u52d5\u8a5e|_",
143
- "131": "I-PART|\uff08\u7d42\u52a9\u8a5e\uff09|_",
144
- "132": "I-PRON|\u4ee3\u540d\u8a5e|_",
145
- "133": "I-PROPN|\u56fa\u6709\u540d\u8a5e|_",
146
- "134": "I-PUNCT|\u8a18\u53f7|_",
147
- "135": "I-SCONJ|[\u63a5\u7d9a\u52a9\u8a5e]|_",
148
- "136": "I-SCONJ|\u4ed6\u52d5\u8a5e|_",
149
- "137": "I-SCONJ|\u526f\u8a5e|_",
150
- "138": "I-SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_",
151
- "139": "I-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
152
- "140": "I-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+ADV|\u526f\u8a5e|_",
153
- "141": "I-SCONJ|\u63a5\u7d9a\u8a5e|_",
154
- "142": "I-SCONJ|\u683c\u52a9\u8a5e|_",
155
- "143": "I-SCONJ|\u7d42\u52a9\u8a5e|_",
156
- "144": "I-VERB|[\u81ea\u52d5\u8a5e]|_",
157
- "145": "I-VERB|\u4ed6\u52d5\u8a5e|_",
158
- "146": "I-VERB|\u4ed6\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
159
- "147": "I-VERB|\u5b8c\u5168\u52d5\u8a5e|_",
160
- "148": "I-VERB|\u683c\u52a9\u8a5e|_",
161
- "149": "I-VERB|\u81ea\u52d5\u8a5e|_",
162
- "150": "I-VERB|\u81ea\u52d5\u8a5e|_+PART|\u4eba\u79f0\u63a5\u8f9e|_",
163
- "151": "I-VERB|\u81ea\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
164
- "152": "I-VERT|\u4ed6\u52d5\u8a5e|_",
165
- "153": "INTJ|\u9593\u6295\u8a5e|_",
166
- "154": "NOUN|\u4ee3\u540d\u8a5e|_",
167
- "155": "NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
168
- "156": "NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_",
169
- "157": "NOUN|\u540d\u8a5e|_",
170
- "158": "NOUN|\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_",
171
- "159": "NOUN|\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
172
- "160": "NOUN|\u540d\u8a5e|_+PART|\u4eba\u79f0\u63a5\u8f9e|_",
173
- "161": "NOUN|\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_",
174
- "162": "NOUN|\u56fa\u6709\u540d\u8a5e|_",
175
- "163": "NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
176
- "164": "NUM|\u6570\u8a5e|_",
177
- "165": "PART|[\u7d42\u52a9\u8a5e]|_",
178
- "166": "PART|\u4eba\u79f0\u63a5\u8f9e|_",
179
- "167": "PART|\u4eba\u79f0\u63a5\u8f9e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
180
- "168": "PART|\u4eba\u79f0\u63a5\u8f9e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
181
- "169": "PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u4ed6\u52d5\u8a5e|_",
182
- "170": "PART|\u63a5\u5c3e\u8f9e|_",
183
- "171": "PART|\u63a5\u7d9a\u52a9\u8a5e|_",
184
- "172": "PART|\u63a5\u982d\u8f9e|_",
185
- "173": "PART|\u7d42\u52a9\u8a5e|_",
186
- "174": "PART|\u81ea\u52d5\u8a5e|_",
187
- "175": "PROPN|\u56fa\u6709\u540d\u8a5e|_",
188
- "176": "PUNCT|\u8a18\u53f7|_",
189
- "177": "SCONJ|[\u63a5\u7d9a\u52a9\u8a5e]|_",
190
- "178": "SCONJ|\u4ed6\u52d5\u8a5e|_",
191
- "179": "SCONJ|\u526f\u8a5e|_",
192
- "180": "SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_",
193
- "181": "SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
194
- "182": "SCONJ|\u63a5\u7d9a\u8a5e|_",
195
- "183": "SCONJ|\u683c\u52a9\u8a5e|_",
196
- "184": "SCONJ|\u7d42\u52a9\u8a5e|_",
197
- "185": "SYM",
198
- "186": "VERB|\u4ed6\u52d5\u8a5e|_",
199
- "187": "VERB|\u4ed6\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
200
- "188": "VERB|\u4ed6\u52d5\u8a5e|_+PART|\u63a5\u5c3e\u8f9e|_",
201
- "189": "VERB|\u5b8c\u5168\u52d5\u8a5e|_",
202
- "190": "VERB|\u81ea\u52d5\u8a5e|_",
203
- "191": "VERB|\u81ea\u52d5\u8a5e|_+AUX|\u52a9\u52d5\u8a5e|_",
204
- "192": "VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u540d\u8a5e|_",
205
- "193": "VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
206
- "194": "VERB|\u81ea\u52d5\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_"
207
  },
208
  "initializer_range": 0.02,
209
  "intermediate_size": 3072,
@@ -288,121 +287,120 @@
288
  "B-VERT|\u4ed6\u52d5\u8a5e|_": 77,
289
  "CCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 78,
290
  "CCONJ|\u63a5\u7d9a\u8a5e|_": 79,
291
- "DET|\u81ea\u52d5\u8a5e|_": 80,
292
- "DET|\u9023\u4f53\u8a5e|_": 81,
293
- "DET|\u9023\u4f53\u8a5e|_+NOUN|\u540d\u8a5e|_": 82,
294
- "DET|\u9023\u4f53\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_": 83,
295
- "I-ADP|\u526f\u52a9\u8a5e|_": 84,
296
- "I-ADP|\u5f8c\u7f6e\u526f\u8a5e|_": 85,
297
- "I-ADP|\u683c\u52a9\u8a5e|_": 86,
298
- "I-ADP|\u683c\u52a9\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 87,
299
- "I-ADV|\u526f\u8a5e|_": 88,
300
- "I-ADV|\u9593\u6295\u8a5e|_": 89,
301
- "I-AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_": 90,
302
- "I-AUX|\u52a9\u52d5\u8a5e|_": 91,
303
- "I-AUX|\u52a9\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 92,
304
- "I-AUX|\u52a9\u52d5\u8a5e|_+PART|\u7d42\u52a9\u8a5e|_": 93,
305
- "I-CCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 94,
306
- "I-CCONJ|\u63a5\u7d9a\u8a5e|_": 95,
307
- "I-DET|\u526f\u8a5e|_": 96,
308
- "I-DET|\u9023\u4f53\u8a5e|_": 97,
309
- "I-DET|\u9023\u4f53\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 98,
310
- "I-INFR.EV|\u5f62\u5f0f\u540d\u8a5e|_": 99,
311
- "I-INTJ|\u9593\u6295\u8a5e|_": 100,
312
- "I-NOUN|\u4eba\u79f0\u63a5\u8f9e|_": 101,
313
- "I-NOUN|\u4ee3\u540d\u8a5e|_": 102,
314
- "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 103,
315
- "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_": 104,
316
- "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_+NOUN|\u540d\u8a5e|_": 105,
317
- "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_": 106,
318
- "I-NOUN|\u540d\u8a5e|_": 107,
319
- "I-NOUN|\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_": 108,
320
- "I-NOUN|\u540d\u8a5e|_+ADV|\u526f\u8a5e|_": 109,
321
- "I-NOUN|\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 110,
322
- "I-NOUN|\u540d\u8a5e|_+NOUN|\u540d\u8a5e|_": 111,
323
- "I-NOUN|\u540d\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 112,
324
- "I-NOUN|\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_": 113,
325
- "I-NOUN|\u56fa\u6709\u540d\u8a5e|_": 114,
326
- "I-NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 115,
327
- "I-NUM|\u6570\u8a5e|_": 116,
328
- "I-NUM|\u6570\u8a5e|_+NOUN|\u540d\u8a5e|_": 117,
329
- "I-PART|[\u7d42\u52a9\u8a5e]|_": 118,
330
- "I-PART|\u4eba\u79f0\u63a5\u8f9e|_": 119,
331
- "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_": 120,
332
- "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 121,
333
- "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 122,
334
- "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u4ed6\u52d5\u8a5e|_": 123,
335
- "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u81ea\u52d5\u8a5e|_": 124,
336
- "I-PART|\u52a9\u52d5\u8a5e|_": 125,
337
- "I-PART|\u63a5\u5c3e\u8f9e|_": 126,
338
- "I-PART|\u63a5\u7d9a\u52a9\u8a5e|_": 127,
339
- "I-PART|\u63a5\u982d\u8f9e|_": 128,
340
- "I-PART|\u7d42\u52a9\u8a5e|_": 129,
341
- "I-PART|\u81ea\u52d5\u8a5e|_": 130,
342
- "I-PART|\uff08\u7d42\u52a9\u8a5e\uff09|_": 131,
343
- "I-PRON|\u4ee3\u540d\u8a5e|_": 132,
344
- "I-PROPN|\u56fa\u6709\u540d\u8a5e|_": 133,
345
- "I-PUNCT|\u8a18\u53f7|_": 134,
346
- "I-SCONJ|[\u63a5\u7d9a\u52a9\u8a5e]|_": 135,
347
- "I-SCONJ|\u4ed6\u52d5\u8a5e|_": 136,
348
- "I-SCONJ|\u526f\u8a5e|_": 137,
349
- "I-SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_": 138,
350
- "I-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 139,
351
- "I-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+ADV|\u526f\u8a5e|_": 140,
352
- "I-SCONJ|\u63a5\u7d9a\u8a5e|_": 141,
353
- "I-SCONJ|\u683c\u52a9\u8a5e|_": 142,
354
- "I-SCONJ|\u7d42\u52a9\u8a5e|_": 143,
355
- "I-VERB|[\u81ea\u52d5\u8a5e]|_": 144,
356
- "I-VERB|\u4ed6\u52d5\u8a5e|_": 145,
357
- "I-VERB|\u4ed6\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 146,
358
- "I-VERB|\u5b8c\u5168\u52d5\u8a5e|_": 147,
359
- "I-VERB|\u683c\u52a9\u8a5e|_": 148,
360
- "I-VERB|\u81ea\u52d5\u8a5e|_": 149,
361
- "I-VERB|\u81ea\u52d5\u8a5e|_+PART|\u4eba\u79f0\u63a5\u8f9e|_": 150,
362
- "I-VERB|\u81ea\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 151,
363
- "I-VERT|\u4ed6\u52d5\u8a5e|_": 152,
364
- "INTJ|\u9593\u6295\u8a5e|_": 153,
365
- "NOUN|\u4ee3\u540d\u8a5e|_": 154,
366
- "NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 155,
367
- "NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_": 156,
368
- "NOUN|\u540d\u8a5e|_": 157,
369
- "NOUN|\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_": 158,
370
- "NOUN|\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 159,
371
- "NOUN|\u540d\u8a5e|_+PART|\u4eba\u79f0\u63a5\u8f9e|_": 160,
372
- "NOUN|\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_": 161,
373
- "NOUN|\u56fa\u6709\u540d\u8a5e|_": 162,
374
- "NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 163,
375
- "NUM|\u6570\u8a5e|_": 164,
376
- "PART|[\u7d42\u52a9\u8a5e]|_": 165,
377
- "PART|\u4eba\u79f0\u63a5\u8f9e|_": 166,
378
- "PART|\u4eba\u79f0\u63a5\u8f9e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 167,
379
- "PART|\u4eba\u79f0\u63a5\u8f9e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 168,
380
- "PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u4ed6\u52d5\u8a5e|_": 169,
381
- "PART|\u63a5\u5c3e\u8f9e|_": 170,
382
- "PART|\u63a5\u7d9a\u52a9\u8a5e|_": 171,
383
- "PART|\u63a5\u982d\u8f9e|_": 172,
384
- "PART|\u7d42\u52a9\u8a5e|_": 173,
385
- "PART|\u81ea\u52d5\u8a5e|_": 174,
386
- "PROPN|\u56fa\u6709\u540d\u8a5e|_": 175,
387
- "PUNCT|\u8a18\u53f7|_": 176,
388
- "SCONJ|[\u63a5\u7d9a\u52a9\u8a5e]|_": 177,
389
- "SCONJ|\u4ed6\u52d5\u8a5e|_": 178,
390
- "SCONJ|\u526f\u8a5e|_": 179,
391
- "SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_": 180,
392
- "SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 181,
393
- "SCONJ|\u63a5\u7d9a\u8a5e|_": 182,
394
- "SCONJ|\u683c\u52a9\u8a5e|_": 183,
395
- "SCONJ|\u7d42\u52a9\u8a5e|_": 184,
396
- "SYM": 185,
397
- "VERB|\u4ed6\u52d5\u8a5e|_": 186,
398
- "VERB|\u4ed6\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 187,
399
- "VERB|\u4ed6\u52d5\u8a5e|_+PART|\u63a5\u5c3e\u8f9e|_": 188,
400
- "VERB|\u5b8c\u5168\u52d5\u8a5e|_": 189,
401
- "VERB|\u81ea\u52d5\u8a5e|_": 190,
402
- "VERB|\u81ea\u52d5\u8a5e|_+AUX|\u52a9\u52d5\u8a5e|_": 191,
403
- "VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u540d\u8a5e|_": 192,
404
- "VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 193,
405
- "VERB|\u81ea\u52d5\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_": 194
406
  },
407
  "layer_norm_eps": 1e-07,
408
  "max_position_embeddings": 512,
@@ -570,6 +568,10 @@
570
  "Kunnei",
571
  "wano"
572
  ],
 
 
 
 
573
  "cheppone": [
574
  "cheppo",
575
  "ne"
@@ -586,6 +588,10 @@
586
  ]
587
  },
588
  "NOUN|\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": {
 
 
 
 
589
  "Petetoko": [
590
  "Pet",
591
  "etoko"
 
89
  "77": "B-VERT|\u4ed6\u52d5\u8a5e|_",
90
  "78": "CCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
91
  "79": "CCONJ|\u63a5\u7d9a\u8a5e|_",
92
+ "80": "DET|\u9023\u4f53\u8a5e|_",
93
+ "81": "DET|\u9023\u4f53\u8a5e|_+NOUN|\u540d\u8a5e|_",
94
+ "82": "DET|\u9023\u4f53\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_",
95
+ "83": "I-ADP|\u526f\u52a9\u8a5e|_",
96
+ "84": "I-ADP|\u5f8c\u7f6e\u526f\u8a5e|_",
97
+ "85": "I-ADP|\u683c\u52a9\u8a5e|_",
98
+ "86": "I-ADP|\u683c\u52a9\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
99
+ "87": "I-ADV|\u526f\u8a5e|_",
100
+ "88": "I-ADV|\u9593\u6295\u8a5e|_",
101
+ "89": "I-AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_",
102
+ "90": "I-AUX|\u52a9\u52d5\u8a5e|_",
103
+ "91": "I-AUX|\u52a9\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
104
+ "92": "I-AUX|\u52a9\u52d5\u8a5e|_+PART|\u7d42\u52a9\u8a5e|_",
105
+ "93": "I-CCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
106
+ "94": "I-CCONJ|\u63a5\u7d9a\u8a5e|_",
107
+ "95": "I-DET|\u526f\u8a5e|_",
108
+ "96": "I-DET|\u9023\u4f53\u8a5e|_",
109
+ "97": "I-DET|\u9023\u4f53\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
110
+ "98": "I-INFR.EV|\u5f62\u5f0f\u540d\u8a5e|_",
111
+ "99": "I-INTJ|\u9593\u6295\u8a5e|_",
112
+ "100": "I-NOUN|\u4eba\u79f0\u63a5\u8f9e|_",
113
+ "101": "I-NOUN|\u4ee3\u540d\u8a5e|_",
114
+ "102": "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
115
+ "103": "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_",
116
+ "104": "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_+NOUN|\u540d\u8a5e|_",
117
+ "105": "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_",
118
+ "106": "I-NOUN|\u540d\u8a5e|_",
119
+ "107": "I-NOUN|\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_",
120
+ "108": "I-NOUN|\u540d\u8a5e|_+ADV|\u526f\u8a5e|_",
121
+ "109": "I-NOUN|\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
122
+ "110": "I-NOUN|\u540d\u8a5e|_+NOUN|\u540d\u8a5e|_",
123
+ "111": "I-NOUN|\u540d\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
124
+ "112": "I-NOUN|\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_",
125
+ "113": "I-NOUN|\u56fa\u6709\u540d\u8a5e|_",
126
+ "114": "I-NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
127
+ "115": "I-NUM|\u6570\u8a5e|_",
128
+ "116": "I-NUM|\u6570\u8a5e|_+NOUN|\u540d\u8a5e|_",
129
+ "117": "I-PART|[\u7d42\u52a9\u8a5e]|_",
130
+ "118": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_",
131
+ "119": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_",
132
+ "120": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
133
+ "121": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
134
+ "122": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u4ed6\u52d5\u8a5e|_",
135
+ "123": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u81ea\u52d5\u8a5e|_",
136
+ "124": "I-PART|\u52a9\u52d5\u8a5e|_",
137
+ "125": "I-PART|\u63a5\u5c3e\u8f9e|_",
138
+ "126": "I-PART|\u63a5\u7d9a\u52a9\u8a5e|_",
139
+ "127": "I-PART|\u63a5\u982d\u8f9e|_",
140
+ "128": "I-PART|\u7d42\u52a9\u8a5e|_",
141
+ "129": "I-PART|\u81ea\u52d5\u8a5e|_",
142
+ "130": "I-PART|\uff08\u7d42\u52a9\u8a5e\uff09|_",
143
+ "131": "I-PRON|\u4ee3\u540d\u8a5e|_",
144
+ "132": "I-PROPN|\u56fa\u6709\u540d\u8a5e|_",
145
+ "133": "I-PUNCT|\u8a18\u53f7|_",
146
+ "134": "I-SCONJ|[\u63a5\u7d9a\u52a9\u8a5e]|_",
147
+ "135": "I-SCONJ|\u4ed6\u52d5\u8a5e|_",
148
+ "136": "I-SCONJ|\u526f\u8a5e|_",
149
+ "137": "I-SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_",
150
+ "138": "I-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
151
+ "139": "I-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+ADV|\u526f\u8a5e|_",
152
+ "140": "I-SCONJ|\u63a5\u7d9a\u8a5e|_",
153
+ "141": "I-SCONJ|\u683c\u52a9\u8a5e|_",
154
+ "142": "I-SCONJ|\u7d42\u52a9\u8a5e|_",
155
+ "143": "I-VERB|[\u81ea\u52d5\u8a5e]|_",
156
+ "144": "I-VERB|\u4ed6\u52d5\u8a5e|_",
157
+ "145": "I-VERB|\u4ed6\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
158
+ "146": "I-VERB|\u5b8c\u5168\u52d5\u8a5e|_",
159
+ "147": "I-VERB|\u683c\u52a9\u8a5e|_",
160
+ "148": "I-VERB|\u81ea\u52d5\u8a5e|_",
161
+ "149": "I-VERB|\u81ea\u52d5\u8a5e|_+PART|\u4eba\u79f0\u63a5\u8f9e|_",
162
+ "150": "I-VERB|\u81ea\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
163
+ "151": "I-VERT|\u4ed6\u52d5\u8a5e|_",
164
+ "152": "INTJ|\u9593\u6295\u8a5e|_",
165
+ "153": "NOUN|\u4ee3\u540d\u8a5e|_",
166
+ "154": "NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
167
+ "155": "NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_",
168
+ "156": "NOUN|\u540d\u8a5e|_",
169
+ "157": "NOUN|\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_",
170
+ "158": "NOUN|\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
171
+ "159": "NOUN|\u540d\u8a5e|_+PART|\u4eba\u79f0\u63a5\u8f9e|_",
172
+ "160": "NOUN|\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_",
173
+ "161": "NOUN|\u56fa\u6709\u540d\u8a5e|_",
174
+ "162": "NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
175
+ "163": "NUM|\u6570\u8a5e|_",
176
+ "164": "PART|[\u7d42\u52a9\u8a5e]|_",
177
+ "165": "PART|\u4eba\u79f0\u63a5\u8f9e|_",
178
+ "166": "PART|\u4eba\u79f0\u63a5\u8f9e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
179
+ "167": "PART|\u4eba\u79f0\u63a5\u8f9e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
180
+ "168": "PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u4ed6\u52d5\u8a5e|_",
181
+ "169": "PART|\u63a5\u5c3e\u8f9e|_",
182
+ "170": "PART|\u63a5\u7d9a\u52a9\u8a5e|_",
183
+ "171": "PART|\u63a5\u982d\u8f9e|_",
184
+ "172": "PART|\u7d42\u52a9\u8a5e|_",
185
+ "173": "PART|\u81ea\u52d5\u8a5e|_",
186
+ "174": "PROPN|\u56fa\u6709\u540d\u8a5e|_",
187
+ "175": "PUNCT|\u8a18\u53f7|_",
188
+ "176": "SCONJ|[\u63a5\u7d9a\u52a9\u8a5e]|_",
189
+ "177": "SCONJ|\u4ed6\u52d5\u8a5e|_",
190
+ "178": "SCONJ|\u526f\u8a5e|_",
191
+ "179": "SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_",
192
+ "180": "SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
193
+ "181": "SCONJ|\u63a5\u7d9a\u8a5e|_",
194
+ "182": "SCONJ|\u683c\u52a9\u8a5e|_",
195
+ "183": "SCONJ|\u7d42\u52a9\u8a5e|_",
196
+ "184": "SYM",
197
+ "185": "VERB|\u4ed6\u52d5\u8a5e|_",
198
+ "186": "VERB|\u4ed6\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
199
+ "187": "VERB|\u4ed6\u52d5\u8a5e|_+PART|\u63a5\u5c3e\u8f9e|_",
200
+ "188": "VERB|\u5b8c\u5168\u52d5\u8a5e|_",
201
+ "189": "VERB|\u81ea\u52d5\u8a5e|_",
202
+ "190": "VERB|\u81ea\u52d5\u8a5e|_+AUX|\u52a9\u52d5\u8a5e|_",
203
+ "191": "VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u540d\u8a5e|_",
204
+ "192": "VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
205
+ "193": "VERB|\u81ea\u52d5\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_"
 
206
  },
207
  "initializer_range": 0.02,
208
  "intermediate_size": 3072,
 
287
  "B-VERT|\u4ed6\u52d5\u8a5e|_": 77,
288
  "CCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 78,
289
  "CCONJ|\u63a5\u7d9a\u8a5e|_": 79,
290
+ "DET|\u9023\u4f53\u8a5e|_": 80,
291
+ "DET|\u9023\u4f53\u8a5e|_+NOUN|\u540d\u8a5e|_": 81,
292
+ "DET|\u9023\u4f53\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_": 82,
293
+ "I-ADP|\u526f\u52a9\u8a5e|_": 83,
294
+ "I-ADP|\u5f8c\u7f6e\u526f\u8a5e|_": 84,
295
+ "I-ADP|\u683c\u52a9\u8a5e|_": 85,
296
+ "I-ADP|\u683c\u52a9\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 86,
297
+ "I-ADV|\u526f\u8a5e|_": 87,
298
+ "I-ADV|\u9593\u6295\u8a5e|_": 88,
299
+ "I-AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_": 89,
300
+ "I-AUX|\u52a9\u52d5\u8a5e|_": 90,
301
+ "I-AUX|\u52a9\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 91,
302
+ "I-AUX|\u52a9\u52d5\u8a5e|_+PART|\u7d42\u52a9\u8a5e|_": 92,
303
+ "I-CCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 93,
304
+ "I-CCONJ|\u63a5\u7d9a\u8a5e|_": 94,
305
+ "I-DET|\u526f\u8a5e|_": 95,
306
+ "I-DET|\u9023\u4f53\u8a5e|_": 96,
307
+ "I-DET|\u9023\u4f53\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 97,
308
+ "I-INFR.EV|\u5f62\u5f0f\u540d\u8a5e|_": 98,
309
+ "I-INTJ|\u9593\u6295\u8a5e|_": 99,
310
+ "I-NOUN|\u4eba\u79f0\u63a5\u8f9e|_": 100,
311
+ "I-NOUN|\u4ee3\u540d\u8a5e|_": 101,
312
+ "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 102,
313
+ "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_": 103,
314
+ "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_+NOUN|\u540d\u8a5e|_": 104,
315
+ "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_": 105,
316
+ "I-NOUN|\u540d\u8a5e|_": 106,
317
+ "I-NOUN|\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_": 107,
318
+ "I-NOUN|\u540d\u8a5e|_+ADV|\u526f\u8a5e|_": 108,
319
+ "I-NOUN|\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 109,
320
+ "I-NOUN|\u540d\u8a5e|_+NOUN|\u540d\u8a5e|_": 110,
321
+ "I-NOUN|\u540d\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 111,
322
+ "I-NOUN|\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_": 112,
323
+ "I-NOUN|\u56fa\u6709\u540d\u8a5e|_": 113,
324
+ "I-NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 114,
325
+ "I-NUM|\u6570\u8a5e|_": 115,
326
+ "I-NUM|\u6570\u8a5e|_+NOUN|\u540d\u8a5e|_": 116,
327
+ "I-PART|[\u7d42\u52a9\u8a5e]|_": 117,
328
+ "I-PART|\u4eba\u79f0\u63a5\u8f9e|_": 118,
329
+ "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_": 119,
330
+ "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 120,
331
+ "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 121,
332
+ "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u4ed6\u52d5\u8a5e|_": 122,
333
+ "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u81ea\u52d5\u8a5e|_": 123,
334
+ "I-PART|\u52a9\u52d5\u8a5e|_": 124,
335
+ "I-PART|\u63a5\u5c3e\u8f9e|_": 125,
336
+ "I-PART|\u63a5\u7d9a\u52a9\u8a5e|_": 126,
337
+ "I-PART|\u63a5\u982d\u8f9e|_": 127,
338
+ "I-PART|\u7d42\u52a9\u8a5e|_": 128,
339
+ "I-PART|\u81ea\u52d5\u8a5e|_": 129,
340
+ "I-PART|\uff08\u7d42\u52a9\u8a5e\uff09|_": 130,
341
+ "I-PRON|\u4ee3\u540d\u8a5e|_": 131,
342
+ "I-PROPN|\u56fa\u6709\u540d\u8a5e|_": 132,
343
+ "I-PUNCT|\u8a18\u53f7|_": 133,
344
+ "I-SCONJ|[\u63a5\u7d9a\u52a9\u8a5e]|_": 134,
345
+ "I-SCONJ|\u4ed6\u52d5\u8a5e|_": 135,
346
+ "I-SCONJ|\u526f\u8a5e|_": 136,
347
+ "I-SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_": 137,
348
+ "I-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 138,
349
+ "I-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+ADV|\u526f\u8a5e|_": 139,
350
+ "I-SCONJ|\u63a5\u7d9a\u8a5e|_": 140,
351
+ "I-SCONJ|\u683c\u52a9\u8a5e|_": 141,
352
+ "I-SCONJ|\u7d42\u52a9\u8a5e|_": 142,
353
+ "I-VERB|[\u81ea\u52d5\u8a5e]|_": 143,
354
+ "I-VERB|\u4ed6\u52d5\u8a5e|_": 144,
355
+ "I-VERB|\u4ed6\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 145,
356
+ "I-VERB|\u5b8c\u5168\u52d5\u8a5e|_": 146,
357
+ "I-VERB|\u683c\u52a9\u8a5e|_": 147,
358
+ "I-VERB|\u81ea\u52d5\u8a5e|_": 148,
359
+ "I-VERB|\u81ea\u52d5\u8a5e|_+PART|\u4eba\u79f0\u63a5\u8f9e|_": 149,
360
+ "I-VERB|\u81ea\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 150,
361
+ "I-VERT|\u4ed6\u52d5\u8a5e|_": 151,
362
+ "INTJ|\u9593\u6295\u8a5e|_": 152,
363
+ "NOUN|\u4ee3\u540d\u8a5e|_": 153,
364
+ "NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 154,
365
+ "NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_": 155,
366
+ "NOUN|\u540d\u8a5e|_": 156,
367
+ "NOUN|\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_": 157,
368
+ "NOUN|\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 158,
369
+ "NOUN|\u540d\u8a5e|_+PART|\u4eba\u79f0\u63a5\u8f9e|_": 159,
370
+ "NOUN|\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_": 160,
371
+ "NOUN|\u56fa\u6709\u540d\u8a5e|_": 161,
372
+ "NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 162,
373
+ "NUM|\u6570\u8a5e|_": 163,
374
+ "PART|[\u7d42\u52a9\u8a5e]|_": 164,
375
+ "PART|\u4eba\u79f0\u63a5\u8f9e|_": 165,
376
+ "PART|\u4eba\u79f0\u63a5\u8f9e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 166,
377
+ "PART|\u4eba\u79f0\u63a5\u8f9e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 167,
378
+ "PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u4ed6\u52d5\u8a5e|_": 168,
379
+ "PART|\u63a5\u5c3e\u8f9e|_": 169,
380
+ "PART|\u63a5\u7d9a\u52a9\u8a5e|_": 170,
381
+ "PART|\u63a5\u982d\u8f9e|_": 171,
382
+ "PART|\u7d42\u52a9\u8a5e|_": 172,
383
+ "PART|\u81ea\u52d5\u8a5e|_": 173,
384
+ "PROPN|\u56fa\u6709\u540d\u8a5e|_": 174,
385
+ "PUNCT|\u8a18\u53f7|_": 175,
386
+ "SCONJ|[\u63a5\u7d9a\u52a9\u8a5e]|_": 176,
387
+ "SCONJ|\u4ed6\u52d5\u8a5e|_": 177,
388
+ "SCONJ|\u526f\u8a5e|_": 178,
389
+ "SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_": 179,
390
+ "SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 180,
391
+ "SCONJ|\u63a5\u7d9a\u8a5e|_": 181,
392
+ "SCONJ|\u683c\u52a9\u8a5e|_": 182,
393
+ "SCONJ|\u7d42\u52a9\u8a5e|_": 183,
394
+ "SYM": 184,
395
+ "VERB|\u4ed6\u52d5\u8a5e|_": 185,
396
+ "VERB|\u4ed6\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 186,
397
+ "VERB|\u4ed6\u52d5\u8a5e|_+PART|\u63a5\u5c3e\u8f9e|_": 187,
398
+ "VERB|\u5b8c\u5168\u52d5\u8a5e|_": 188,
399
+ "VERB|\u81ea\u52d5\u8a5e|_": 189,
400
+ "VERB|\u81ea\u52d5\u8a5e|_+AUX|\u52a9\u52d5\u8a5e|_": 190,
401
+ "VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u540d\u8a5e|_": 191,
402
+ "VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 192,
403
+ "VERB|\u81ea\u52d5\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_": 193
 
404
  },
405
  "layer_norm_eps": 1e-07,
406
  "max_position_embeddings": 512,
 
568
  "Kunnei",
569
  "wano"
570
  ],
571
+ "Neita": [
572
+ "Nei",
573
+ "ta"
574
+ ],
575
  "cheppone": [
576
  "cheppo",
577
  "ne"
 
588
  ]
589
  },
590
  "NOUN|\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": {
591
+ "Harikisam": [
592
+ "Hariki",
593
+ "sam"
594
+ ],
595
  "Petetoko": [
596
  "Pet",
597
  "etoko"
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb8510827824e4d93b9dc9caff0fa6ad5395cafa4d43a25dc4008aac3acc4692
3
- size 419625491
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bdc0f5ddc0c03d2cfabf438c329c6f3c3a2d49980c21aede63cefbed5838aaba
3
+ size 419622419
supar.model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cda2046f9a72623127792c63c4e27212bc7fba493eaebadbfd453db6c55f1d9d
3
- size 464336203
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97c168233779fe33bfb0ae58b65812282c7cc38ba310ed4e09eaa2e54a00af92
3
+ size 464342155
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff