kiansheik commited on
Commit
c34680d
1 Parent(s): de2cf81
Files changed (4) hide show
  1. config.json +1 -1
  2. model.safetensors +1 -1
  3. special_tokens_map.json +103 -103
  4. tokenizer_config.json +84 -84
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "t5-small",
3
  "architectures": [
4
  "T5ForConditionalGeneration"
5
  ],
 
1
  {
2
+ "_name_or_path": "models/t5-1.0/",
3
  "architectures": [
4
  "T5ForConditionalGeneration"
5
  ],
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bda335eee6b0b71e68ba47a22d86956045c03b150668db8544eba78f3d01fb03
3
  size 242175016
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f79b9b04086111aba561d6b4686c472571fb1cdebd00e0436b11f6a6b72d9ed6
3
  size 242175016
special_tokens_map.json CHANGED
@@ -1,721 +1,721 @@
1
  {
2
  "additional_special_tokens": [
3
  {
4
- "content": "[GERUND_SUFFIX:CLASS_1]",
5
  "lstrip": false,
6
  "normalized": false,
7
  "rstrip": false,
8
  "single_word": false
9
  },
10
  {
11
- "content": "[NEGATION_SUFFIX:VOWEL_ENDING]",
12
  "lstrip": false,
13
  "normalized": false,
14
  "rstrip": false,
15
  "single_word": false
16
  },
17
  {
18
- "content": "[OBJECT:2pp]",
19
  "lstrip": false,
20
  "normalized": false,
21
  "rstrip": false,
22
  "single_word": false
23
  },
24
  {
25
- "content": "[NEGATION_SUFFIX:CONSONANT_ENDING]",
26
  "lstrip": false,
27
  "normalized": false,
28
  "rstrip": false,
29
  "single_word": false
30
  },
31
  {
32
- "content": "amo",
33
  "lstrip": false,
34
  "normalized": false,
35
  "rstrip": false,
36
  "single_word": false
37
  },
38
  {
39
- "content": "oro",
40
  "lstrip": false,
41
  "normalized": false,
42
  "rstrip": false,
43
  "single_word": false
44
  },
45
  {
46
- "content": "[OBJECT:MUTUAL]",
47
  "lstrip": false,
48
  "normalized": false,
49
  "rstrip": false,
50
  "single_word": false
51
  },
52
  {
53
- "content": "[SUBJECT_PREFIX:1ppi]",
54
  "lstrip": false,
55
  "normalized": false,
56
  "rstrip": false,
57
  "single_word": false
58
  },
59
  {
60
- "content": "[OBJECT_MARKER:3p:MONOSYLLABIC]",
61
  "lstrip": false,
62
  "normalized": false,
63
  "rstrip": false,
64
  "single_word": false
65
  },
66
  {
67
- "content": "[GERUND_SUFFIX:CLASS_1:NASAL_VOWEL]",
68
  "lstrip": false,
69
  "normalized": false,
70
  "rstrip": false,
71
  "single_word": false
72
  },
73
  {
74
- "content": "bo",
75
  "lstrip": false,
76
  "normalized": false,
77
  "rstrip": false,
78
  "single_word": false
79
  },
80
  {
81
- "content": "́",
82
  "lstrip": false,
83
  "normalized": false,
84
  "rstrip": false,
85
  "single_word": false
86
  },
87
  {
88
- "content": "[SUBJECT:1ps]",
89
  "lstrip": false,
90
  "normalized": false,
91
  "rstrip": false,
92
  "single_word": false
93
  },
94
  {
95
- "content": "[SUBJECT:3p]",
96
  "lstrip": false,
97
  "normalized": false,
98
  "rstrip": false,
99
  "single_word": false
100
  },
101
  {
102
- "content": "a",
103
  "lstrip": false,
104
  "normalized": false,
105
  "rstrip": false,
106
  "single_word": false
107
  },
108
  {
109
- "content": "[OBJECT_MARKER:3p:DEFAULT]",
110
  "lstrip": false,
111
  "normalized": false,
112
  "rstrip": false,
113
  "single_word": false
114
  },
115
  {
116
- "content": "îandé",
117
  "lstrip": false,
118
  "normalized": false,
119
  "rstrip": false,
120
  "single_word": false
121
  },
122
  {
123
- "content": "[OBJECT:1ppe]",
124
  "lstrip": false,
125
  "normalized": false,
126
  "rstrip": false,
127
  "single_word": false
128
  },
129
  {
130
- "content": "peîepé",
131
  "lstrip": false,
132
  "normalized": false,
133
  "rstrip": false,
134
  "single_word": false
135
  },
136
  {
137
- "content": "[PERMISSIVE_PREFIX:VOWEL]",
138
  "lstrip": false,
139
  "normalized": false,
140
  "rstrip": false,
141
  "single_word": false
142
  },
143
  {
144
- "content": "t",
145
  "lstrip": false,
146
  "normalized": false,
147
  "rstrip": false,
148
  "single_word": false
149
  },
150
  {
151
- "content": "[SUBJECT_PREFIX:2pp]",
152
  "lstrip": false,
153
  "normalized": false,
154
  "rstrip": false,
155
  "single_word": false
156
  },
157
  {
158
- "content": "[SUBJECT:1ppi]",
159
  "lstrip": false,
160
  "normalized": false,
161
  "rstrip": false,
162
  "single_word": false
163
  },
164
  {
165
- "content": "í",
166
  "lstrip": false,
167
  "normalized": false,
168
  "rstrip": false,
169
  "single_word": false
170
  },
171
  {
172
- "content": "[GERUND_SUBJECT_PREFIX:2pp]",
173
  "lstrip": false,
174
  "normalized": false,
175
  "rstrip": false,
176
  "single_word": false
177
  },
178
  {
179
- "content": "[GERUND_SUBJECT_PREFIX:2ps]",
180
  "lstrip": false,
181
  "normalized": false,
182
  "rstrip": false,
183
  "single_word": false
184
  },
185
  {
186
- "content": "[OBJECT:1ps]",
187
  "lstrip": false,
188
  "normalized": false,
189
  "rstrip": false,
190
  "single_word": false
191
  },
192
  {
193
- "content": "[GERUND_SUFFIX:CLASS_1:IYU]",
194
  "lstrip": false,
195
  "normalized": false,
196
  "rstrip": false,
197
  "single_word": false
198
  },
199
  {
200
- "content": "pe",
201
  "lstrip": false,
202
  "normalized": false,
203
  "rstrip": false,
204
  "single_word": false
205
  },
206
  {
207
- "content": "n'",
208
  "lstrip": false,
209
  "normalized": false,
210
  "rstrip": false,
211
  "single_word": false
212
  },
213
  {
214
- "content": "s",
215
  "lstrip": false,
216
  "normalized": false,
217
  "rstrip": false,
218
  "single_word": false
219
  },
220
  {
221
- "content": "a'e",
222
  "lstrip": false,
223
  "normalized": false,
224
  "rstrip": false,
225
  "single_word": false
226
  },
227
  {
228
- "content": "endé",
229
  "lstrip": false,
230
  "normalized": false,
231
  "rstrip": false,
232
  "single_word": false
233
  },
234
  {
235
- "content": "ta",
236
  "lstrip": false,
237
  "normalized": false,
238
  "rstrip": false,
239
  "single_word": false
240
  },
241
  {
242
- "content": "[SUBJECT_PREFIX:2ps]",
243
  "lstrip": false,
244
  "normalized": false,
245
  "rstrip": false,
246
  "single_word": false
247
  },
248
  {
249
- "content": "[SUBJECT:2pp:OBJECT_1P]",
250
  "lstrip": false,
251
  "normalized": false,
252
  "rstrip": false,
253
  "single_word": false
254
  },
255
  {
256
- "content": "[GERUND_SUBJECT_PREFIX:3p]",
257
  "lstrip": false,
258
  "normalized": false,
259
  "rstrip": false,
260
  "single_word": false
261
  },
262
  {
263
- "content": "[CIRCUMSTANTIAL_SUFFIX:CONSONANT_ENDING]",
264
  "lstrip": false,
265
  "normalized": false,
266
  "rstrip": false,
267
  "single_word": false
268
  },
269
  {
270
- "content": "îos",
271
  "lstrip": false,
272
  "normalized": false,
273
  "rstrip": false,
274
  "single_word": false
275
  },
276
  {
277
- "content": "[NEGATION_PARTICLE:UME]",
278
  "lstrip": false,
279
  "normalized": false,
280
  "rstrip": false,
281
  "single_word": false
282
  },
283
  {
284
- "content": "pa",
285
  "lstrip": false,
286
  "normalized": false,
287
  "rstrip": false,
288
  "single_word": false
289
  },
290
  {
291
- "content": "[OBJECT:3p]",
292
  "lstrip": false,
293
  "normalized": false,
294
  "rstrip": false,
295
  "single_word": false
296
  },
297
  {
298
- "content": "peẽ",
299
  "lstrip": false,
300
  "normalized": false,
301
  "rstrip": false,
302
  "single_word": false
303
  },
304
  {
305
- "content": "e'ym",
306
  "lstrip": false,
307
  "normalized": false,
308
  "rstrip": false,
309
  "single_word": false
310
  },
311
  {
312
- "content": "îo",
313
  "lstrip": false,
314
  "normalized": false,
315
  "rstrip": false,
316
  "single_word": false
317
  },
318
  {
319
- "content": "[PLURIFORM_PREFIX:R]",
320
  "lstrip": false,
321
  "normalized": false,
322
  "rstrip": false,
323
  "single_word": false
324
  },
325
  {
326
- "content": "namo",
327
  "lstrip": false,
328
  "normalized": false,
329
  "rstrip": false,
330
  "single_word": false
331
  },
332
  {
333
- "content": "[NEGATION_PREFIX]",
334
  "lstrip": false,
335
  "normalized": false,
336
  "rstrip": false,
337
  "single_word": false
338
  },
339
  {
340
- "content": "[IMPERATIVE_PREFIX:2pp]",
341
  "lstrip": false,
342
  "normalized": false,
343
  "rstrip": false,
344
  "single_word": false
345
  },
346
  {
347
- "content": "[OBJECT:2pp:SUBJECT_1P]",
348
  "lstrip": false,
349
  "normalized": false,
350
  "rstrip": false,
351
  "single_word": false
352
  },
353
  {
354
- "content": "[GERUND_SUFFIX:CLASS_1:NASAL_IYU]",
355
  "lstrip": false,
356
  "normalized": false,
357
  "rstrip": false,
358
  "single_word": false
359
  },
360
  {
361
- "content": "îe",
362
  "lstrip": false,
363
  "normalized": false,
364
  "rstrip": false,
365
  "single_word": false
366
  },
367
  {
368
- "content": "[OBJECT:REFLEXIVE]",
369
  "lstrip": false,
370
  "normalized": false,
371
  "rstrip": false,
372
  "single_word": false
373
  },
374
  {
375
- "content": "[PERMISSIVE_PREFIX:CONSONANT]",
376
  "lstrip": false,
377
  "normalized": false,
378
  "rstrip": false,
379
  "single_word": false
380
  },
381
  {
382
- "content": "[GERUND_SUBJECT_PREFIX:1ppi]",
383
  "lstrip": false,
384
  "normalized": false,
385
  "rstrip": false,
386
  "single_word": false
387
  },
388
  {
389
- "content": "[OBJECT_MARKER:3p:PLURIFORM_PREFIX:MONOSYLLABIC]",
390
  "lstrip": false,
391
  "normalized": false,
392
  "rstrip": false,
393
  "single_word": false
394
  },
395
  {
396
- "content": "[NEGATION_PARTICLE:NA]",
397
  "lstrip": false,
398
  "normalized": false,
399
  "rstrip": false,
400
  "single_word": false
401
  },
402
  {
403
- "content": "[IMPERATIVE_PREFIX:2ps]",
404
  "lstrip": false,
405
  "normalized": false,
406
  "rstrip": false,
407
  "single_word": false
408
  },
409
  {
410
- "content": "r",
411
  "lstrip": false,
412
  "normalized": false,
413
  "rstrip": false,
414
  "single_word": false
415
  },
416
  {
417
- "content": "[PLURIFORM_PREFIX:S]",
418
  "lstrip": false,
419
  "normalized": false,
420
  "rstrip": false,
421
  "single_word": false
422
  },
423
  {
424
- "content": "na",
425
  "lstrip": false,
426
  "normalized": false,
427
  "rstrip": false,
428
  "single_word": false
429
  },
430
  {
431
- "content": "[NEGATION_SUFFIX]",
432
  "lstrip": false,
433
  "normalized": false,
434
  "rstrip": false,
435
  "single_word": false
436
  },
437
  {
438
- "content": "ere",
439
  "lstrip": false,
440
  "normalized": false,
441
  "rstrip": false,
442
  "single_word": false
443
  },
444
  {
445
- "content": "[SUBJECT:1ppe]",
446
  "lstrip": false,
447
  "normalized": false,
448
  "rstrip": false,
449
  "single_word": false
450
  },
451
  {
452
- "content": "[SUBJECT_PREFIX:1ps]",
453
  "lstrip": false,
454
  "normalized": false,
455
  "rstrip": false,
456
  "single_word": false
457
  },
458
  {
459
- "content": "[CIRCUMSTANTIAL_SUFFIX:VOWEL_ENDING]",
460
  "lstrip": false,
461
  "normalized": false,
462
  "rstrip": false,
463
  "single_word": false
464
  },
465
  {
466
- "content": "i",
467
  "lstrip": false,
468
  "normalized": false,
469
  "rstrip": false,
470
  "single_word": false
471
  },
472
  {
473
- "content": "abo",
474
  "lstrip": false,
475
  "normalized": false,
476
  "rstrip": false,
477
  "single_word": false
478
  },
479
  {
480
- "content": "î",
481
  "lstrip": false,
482
  "normalized": false,
483
  "rstrip": false,
484
  "single_word": false
485
  },
486
  {
487
- "content": "ramo",
488
  "lstrip": false,
489
  "normalized": false,
490
  "rstrip": false,
491
  "single_word": false
492
  },
493
  {
494
- "content": "e",
495
  "lstrip": false,
496
  "normalized": false,
497
  "rstrip": false,
498
  "single_word": false
499
  },
500
  {
501
- "content": "û",
502
  "lstrip": false,
503
  "normalized": false,
504
  "rstrip": false,
505
  "single_word": false
506
  },
507
  {
508
- "content": "[GERUND_SUFFIX:CLASS_1:R]",
509
  "lstrip": false,
510
  "normalized": false,
511
  "rstrip": false,
512
  "single_word": false
513
  },
514
  {
515
- "content": "[ROOT]",
516
  "lstrip": false,
517
  "normalized": false,
518
  "rstrip": false,
519
  "single_word": false
520
  },
521
  {
522
- "content": "mo",
523
  "lstrip": false,
524
  "normalized": false,
525
  "rstrip": false,
526
  "single_word": false
527
  },
528
  {
529
- "content": "ixé",
530
  "lstrip": false,
531
  "normalized": false,
532
  "rstrip": false,
533
  "single_word": false
534
  },
535
  {
536
- "content": "[GERUND_SUFFIX:CLASS_2:NASAL_VOWEL_ENDING]",
537
  "lstrip": false,
538
  "normalized": false,
539
  "rstrip": false,
540
  "single_word": false
541
  },
542
  {
543
- "content": "[OBJECT:3p:MONOSYLLABIC]",
544
  "lstrip": false,
545
  "normalized": false,
546
  "rstrip": false,
547
  "single_word": false
548
  },
549
  {
550
- "content": "[GERUND_SUBJECT_PREFIX:1ppe]",
551
  "lstrip": false,
552
  "normalized": false,
553
  "rstrip": false,
554
  "single_word": false
555
  },
556
  {
557
- "content": "oré",
558
  "lstrip": false,
559
  "normalized": false,
560
  "rstrip": false,
561
  "single_word": false
562
  },
563
  {
564
- "content": "[GERUND_SUFFIX:CLASS_2:ORAL_VOWEL_ENDING]",
565
  "lstrip": false,
566
  "normalized": false,
567
  "rstrip": false,
568
  "single_word": false
569
  },
570
  {
571
- "content": "[SUBJECT_PREFIX:3p]",
572
  "lstrip": false,
573
  "normalized": false,
574
  "rstrip": false,
575
  "single_word": false
576
  },
577
  {
578
- "content": "[SUBJECT:2pp]",
579
  "lstrip": false,
580
  "normalized": false,
581
  "rstrip": false,
582
  "single_word": false
583
  },
584
  {
585
- "content": "[SUBJECT:2ps]",
586
  "lstrip": false,
587
  "normalized": false,
588
  "rstrip": false,
589
  "single_word": false
590
  },
591
  {
592
- "content": "[GERUND_SUFFIX:CLASS_1:ORAL_VOWEL]",
593
  "lstrip": false,
594
  "normalized": false,
595
  "rstrip": false,
596
  "single_word": false
597
  },
598
  {
599
- "content": "[GERUND_SUFFIX:CLASS_1:CONSONANT]",
600
  "lstrip": false,
601
  "normalized": false,
602
  "rstrip": false,
603
  "single_word": false
604
  },
605
  {
606
- "content": "[GERUND_SUFFIX:CLASS_2:DEFAULT]",
607
  "lstrip": false,
608
  "normalized": false,
609
  "rstrip": false,
610
  "single_word": false
611
  },
612
  {
613
- "content": "[GERUND_SUFFIX:CLASS_1:B]",
614
  "lstrip": false,
615
  "normalized": false,
616
  "rstrip": false,
617
  "single_word": false
618
  },
619
  {
620
- "content": "[SUBJECT:2ps:OBJECT_1P]",
621
  "lstrip": false,
622
  "normalized": false,
623
  "rstrip": false,
624
  "single_word": false
625
  },
626
  {
627
- "content": "[OBJECT:2ps]",
628
  "lstrip": false,
629
  "normalized": false,
630
  "rstrip": false,
631
  "single_word": false
632
  },
633
  {
634
- "content": "[CIRCUMSTANTIAL_SUFFIX:NULL_ENDING]",
635
  "lstrip": false,
636
  "normalized": false,
637
  "rstrip": false,
638
  "single_word": false
639
  },
640
  {
641
- "content": "nde",
642
  "lstrip": false,
643
  "normalized": false,
644
  "rstrip": false,
645
  "single_word": false
646
  },
647
  {
648
- "content": "o",
649
  "lstrip": false,
650
  "normalized": false,
651
  "rstrip": false,
652
  "single_word": false
653
  },
654
  {
655
- "content": "xe",
656
  "lstrip": false,
657
  "normalized": false,
658
  "rstrip": false,
659
  "single_word": false
660
  },
661
  {
662
- "content": "opo",
663
  "lstrip": false,
664
  "normalized": false,
665
  "rstrip": false,
666
  "single_word": false
667
  },
668
  {
669
- "content": "[GERUND_SUBJECT_PREFIX:1ps]",
670
  "lstrip": false,
671
  "normalized": false,
672
  "rstrip": false,
673
  "single_word": false
674
  },
675
  {
676
- "content": "gûi",
677
  "lstrip": false,
678
  "normalized": false,
679
  "rstrip": false,
680
  "single_word": false
681
  },
682
  {
683
- "content": "[OBJECT:2ps:SUBJECT_1P]",
684
  "lstrip": false,
685
  "normalized": false,
686
  "rstrip": false,
687
  "single_word": false
688
  },
689
  {
690
- "content": "îa",
691
  "lstrip": false,
692
  "normalized": false,
693
  "rstrip": false,
694
  "single_word": false
695
  },
696
  {
697
- "content": "îepé",
698
  "lstrip": false,
699
  "normalized": false,
700
  "rstrip": false,
701
  "single_word": false
702
  },
703
  {
704
- "content": "[SUBJECT_PREFIX:1ppe]",
705
  "lstrip": false,
706
  "normalized": false,
707
  "rstrip": false,
708
  "single_word": false
709
  },
710
  {
711
- "content": "[OBJECT:1ppi]",
712
  "lstrip": false,
713
  "normalized": false,
714
  "rstrip": false,
715
  "single_word": false
716
  },
717
  {
718
- "content": "umẽ",
719
  "lstrip": false,
720
  "normalized": false,
721
  "rstrip": false,
 
1
  {
2
  "additional_special_tokens": [
3
  {
4
+ "content": "e'ym",
5
  "lstrip": false,
6
  "normalized": false,
7
  "rstrip": false,
8
  "single_word": false
9
  },
10
  {
11
+ "content": "îepé",
12
  "lstrip": false,
13
  "normalized": false,
14
  "rstrip": false,
15
  "single_word": false
16
  },
17
  {
18
+ "content": "[ROOT]",
19
  "lstrip": false,
20
  "normalized": false,
21
  "rstrip": false,
22
  "single_word": false
23
  },
24
  {
25
+ "content": "[PLURIFORM_PREFIX:S]",
26
  "lstrip": false,
27
  "normalized": false,
28
  "rstrip": false,
29
  "single_word": false
30
  },
31
  {
32
+ "content": "[OBJECT:1ps]",
33
  "lstrip": false,
34
  "normalized": false,
35
  "rstrip": false,
36
  "single_word": false
37
  },
38
  {
39
+ "content": "[GERUND_SUFFIX:CLASS_1]",
40
  "lstrip": false,
41
  "normalized": false,
42
  "rstrip": false,
43
  "single_word": false
44
  },
45
  {
46
+ "content": "[OBJECT:2ps:SUBJECT_1P]",
47
  "lstrip": false,
48
  "normalized": false,
49
  "rstrip": false,
50
  "single_word": false
51
  },
52
  {
53
+ "content": "[NEGATION_PARTICLE:NA]",
54
  "lstrip": false,
55
  "normalized": false,
56
  "rstrip": false,
57
  "single_word": false
58
  },
59
  {
60
+ "content": "îe",
61
  "lstrip": false,
62
  "normalized": false,
63
  "rstrip": false,
64
  "single_word": false
65
  },
66
  {
67
+ "content": "́",
68
  "lstrip": false,
69
  "normalized": false,
70
  "rstrip": false,
71
  "single_word": false
72
  },
73
  {
74
+ "content": "amo",
75
  "lstrip": false,
76
  "normalized": false,
77
  "rstrip": false,
78
  "single_word": false
79
  },
80
  {
81
+ "content": "[GERUND_SUBJECT_PREFIX:1ppi]",
82
  "lstrip": false,
83
  "normalized": false,
84
  "rstrip": false,
85
  "single_word": false
86
  },
87
  {
88
+ "content": "îa",
89
  "lstrip": false,
90
  "normalized": false,
91
  "rstrip": false,
92
  "single_word": false
93
  },
94
  {
95
+ "content": "umẽ",
96
  "lstrip": false,
97
  "normalized": false,
98
  "rstrip": false,
99
  "single_word": false
100
  },
101
  {
102
+ "content": "[GERUND_SUBJECT_PREFIX:1ps]",
103
  "lstrip": false,
104
  "normalized": false,
105
  "rstrip": false,
106
  "single_word": false
107
  },
108
  {
109
+ "content": "[IMPERATIVE_PREFIX:2pp]",
110
  "lstrip": false,
111
  "normalized": false,
112
  "rstrip": false,
113
  "single_word": false
114
  },
115
  {
116
+ "content": "o",
117
  "lstrip": false,
118
  "normalized": false,
119
  "rstrip": false,
120
  "single_word": false
121
  },
122
  {
123
+ "content": "[SUBJECT_PREFIX:1ppi]",
124
  "lstrip": false,
125
  "normalized": false,
126
  "rstrip": false,
127
  "single_word": false
128
  },
129
  {
130
+ "content": "xe",
131
  "lstrip": false,
132
  "normalized": false,
133
  "rstrip": false,
134
  "single_word": false
135
  },
136
  {
137
+ "content": "[SUBJECT_PREFIX:1ps]",
138
  "lstrip": false,
139
  "normalized": false,
140
  "rstrip": false,
141
  "single_word": false
142
  },
143
  {
144
+ "content": "[PLURIFORM_PREFIX:R]",
145
  "lstrip": false,
146
  "normalized": false,
147
  "rstrip": false,
148
  "single_word": false
149
  },
150
  {
151
+ "content": "í",
152
  "lstrip": false,
153
  "normalized": false,
154
  "rstrip": false,
155
  "single_word": false
156
  },
157
  {
158
+ "content": "n'",
159
  "lstrip": false,
160
  "normalized": false,
161
  "rstrip": false,
162
  "single_word": false
163
  },
164
  {
165
+ "content": "[OBJECT:2pp:SUBJECT_1P]",
166
  "lstrip": false,
167
  "normalized": false,
168
  "rstrip": false,
169
  "single_word": false
170
  },
171
  {
172
+ "content": "[PERMISSIVE_PREFIX:CONSONANT]",
173
  "lstrip": false,
174
  "normalized": false,
175
  "rstrip": false,
176
  "single_word": false
177
  },
178
  {
179
+ "content": "[SUBJECT:1ps]",
180
  "lstrip": false,
181
  "normalized": false,
182
  "rstrip": false,
183
  "single_word": false
184
  },
185
  {
186
+ "content": "î",
187
  "lstrip": false,
188
  "normalized": false,
189
  "rstrip": false,
190
  "single_word": false
191
  },
192
  {
193
+ "content": "[SUBJECT:2ps]",
194
  "lstrip": false,
195
  "normalized": false,
196
  "rstrip": false,
197
  "single_word": false
198
  },
199
  {
200
+ "content": "[OBJECT_MARKER:3p:PLURIFORM_PREFIX:MONOSYLLABIC]",
201
  "lstrip": false,
202
  "normalized": false,
203
  "rstrip": false,
204
  "single_word": false
205
  },
206
  {
207
+ "content": "pe",
208
  "lstrip": false,
209
  "normalized": false,
210
  "rstrip": false,
211
  "single_word": false
212
  },
213
  {
214
+ "content": "[NEGATION_PREFIX]",
215
  "lstrip": false,
216
  "normalized": false,
217
  "rstrip": false,
218
  "single_word": false
219
  },
220
  {
221
+ "content": "[OBJECT:2pp]",
222
  "lstrip": false,
223
  "normalized": false,
224
  "rstrip": false,
225
  "single_word": false
226
  },
227
  {
228
+ "content": "abo",
229
  "lstrip": false,
230
  "normalized": false,
231
  "rstrip": false,
232
  "single_word": false
233
  },
234
  {
235
+ "content": "na",
236
  "lstrip": false,
237
  "normalized": false,
238
  "rstrip": false,
239
  "single_word": false
240
  },
241
  {
242
+ "content": "[GERUND_SUFFIX:CLASS_1:R]",
243
  "lstrip": false,
244
  "normalized": false,
245
  "rstrip": false,
246
  "single_word": false
247
  },
248
  {
249
+ "content": "[SUBJECT_PREFIX:3p]",
250
  "lstrip": false,
251
  "normalized": false,
252
  "rstrip": false,
253
  "single_word": false
254
  },
255
  {
256
+ "content": "[OBJECT:1ppi]",
257
  "lstrip": false,
258
  "normalized": false,
259
  "rstrip": false,
260
  "single_word": false
261
  },
262
  {
263
+ "content": "[NEGATION_PARTICLE:UME]",
264
  "lstrip": false,
265
  "normalized": false,
266
  "rstrip": false,
267
  "single_word": false
268
  },
269
  {
270
+ "content": "îandé",
271
  "lstrip": false,
272
  "normalized": false,
273
  "rstrip": false,
274
  "single_word": false
275
  },
276
  {
277
+ "content": "[GERUND_SUFFIX:CLASS_1:ORAL_VOWEL]",
278
  "lstrip": false,
279
  "normalized": false,
280
  "rstrip": false,
281
  "single_word": false
282
  },
283
  {
284
+ "content": "[NEGATION_SUFFIX:CONSONANT_ENDING]",
285
  "lstrip": false,
286
  "normalized": false,
287
  "rstrip": false,
288
  "single_word": false
289
  },
290
  {
291
+ "content": "[GERUND_SUBJECT_PREFIX:2pp]",
292
  "lstrip": false,
293
  "normalized": false,
294
  "rstrip": false,
295
  "single_word": false
296
  },
297
  {
298
+ "content": "[CIRCUMSTANTIAL_SUFFIX:CONSONANT_ENDING]",
299
  "lstrip": false,
300
  "normalized": false,
301
  "rstrip": false,
302
  "single_word": false
303
  },
304
  {
305
+ "content": "[GERUND_SUFFIX:CLASS_2:ORAL_VOWEL_ENDING]",
306
  "lstrip": false,
307
  "normalized": false,
308
  "rstrip": false,
309
  "single_word": false
310
  },
311
  {
312
+ "content": "gûi",
313
  "lstrip": false,
314
  "normalized": false,
315
  "rstrip": false,
316
  "single_word": false
317
  },
318
  {
319
+ "content": "[GERUND_SUBJECT_PREFIX:2ps]",
320
  "lstrip": false,
321
  "normalized": false,
322
  "rstrip": false,
323
  "single_word": false
324
  },
325
  {
326
+ "content": "ixé",
327
  "lstrip": false,
328
  "normalized": false,
329
  "rstrip": false,
330
  "single_word": false
331
  },
332
  {
333
+ "content": "namo",
334
  "lstrip": false,
335
  "normalized": false,
336
  "rstrip": false,
337
  "single_word": false
338
  },
339
  {
340
+ "content": "[OBJECT:3p]",
341
  "lstrip": false,
342
  "normalized": false,
343
  "rstrip": false,
344
  "single_word": false
345
  },
346
  {
347
+ "content": "ere",
348
  "lstrip": false,
349
  "normalized": false,
350
  "rstrip": false,
351
  "single_word": false
352
  },
353
  {
354
+ "content": "mo",
355
  "lstrip": false,
356
  "normalized": false,
357
  "rstrip": false,
358
  "single_word": false
359
  },
360
  {
361
+ "content": "[GERUND_SUFFIX:CLASS_2:NASAL_VOWEL_ENDING]",
362
  "lstrip": false,
363
  "normalized": false,
364
  "rstrip": false,
365
  "single_word": false
366
  },
367
  {
368
+ "content": "[SUBJECT:1ppe]",
369
  "lstrip": false,
370
  "normalized": false,
371
  "rstrip": false,
372
  "single_word": false
373
  },
374
  {
375
+ "content": "[GERUND_SUBJECT_PREFIX:3p]",
376
  "lstrip": false,
377
  "normalized": false,
378
  "rstrip": false,
379
  "single_word": false
380
  },
381
  {
382
+ "content": "[OBJECT_MARKER:3p:DEFAULT]",
383
  "lstrip": false,
384
  "normalized": false,
385
  "rstrip": false,
386
  "single_word": false
387
  },
388
  {
389
+ "content": "[SUBJECT:1ppi]",
390
  "lstrip": false,
391
  "normalized": false,
392
  "rstrip": false,
393
  "single_word": false
394
  },
395
  {
396
+ "content": "[GERUND_SUFFIX:CLASS_1:NASAL_VOWEL]",
397
  "lstrip": false,
398
  "normalized": false,
399
  "rstrip": false,
400
  "single_word": false
401
  },
402
  {
403
+ "content": "peẽ",
404
  "lstrip": false,
405
  "normalized": false,
406
  "rstrip": false,
407
  "single_word": false
408
  },
409
  {
410
+ "content": "s",
411
  "lstrip": false,
412
  "normalized": false,
413
  "rstrip": false,
414
  "single_word": false
415
  },
416
  {
417
+ "content": "[SUBJECT:3p]",
418
  "lstrip": false,
419
  "normalized": false,
420
  "rstrip": false,
421
  "single_word": false
422
  },
423
  {
424
+ "content": "û",
425
  "lstrip": false,
426
  "normalized": false,
427
  "rstrip": false,
428
  "single_word": false
429
  },
430
  {
431
+ "content": "[SUBJECT:2ps:OBJECT_1P]",
432
  "lstrip": false,
433
  "normalized": false,
434
  "rstrip": false,
435
  "single_word": false
436
  },
437
  {
438
+ "content": "îos",
439
  "lstrip": false,
440
  "normalized": false,
441
  "rstrip": false,
442
  "single_word": false
443
  },
444
  {
445
+ "content": "nde",
446
  "lstrip": false,
447
  "normalized": false,
448
  "rstrip": false,
449
  "single_word": false
450
  },
451
  {
452
+ "content": "endé",
453
  "lstrip": false,
454
  "normalized": false,
455
  "rstrip": false,
456
  "single_word": false
457
  },
458
  {
459
+ "content": "[OBJECT:MUTUAL]",
460
  "lstrip": false,
461
  "normalized": false,
462
  "rstrip": false,
463
  "single_word": false
464
  },
465
  {
466
+ "content": "[GERUND_SUFFIX:CLASS_1:CONSONANT]",
467
  "lstrip": false,
468
  "normalized": false,
469
  "rstrip": false,
470
  "single_word": false
471
  },
472
  {
473
+ "content": "oré",
474
  "lstrip": false,
475
  "normalized": false,
476
  "rstrip": false,
477
  "single_word": false
478
  },
479
  {
480
+ "content": "t",
481
  "lstrip": false,
482
  "normalized": false,
483
  "rstrip": false,
484
  "single_word": false
485
  },
486
  {
487
+ "content": "bo",
488
  "lstrip": false,
489
  "normalized": false,
490
  "rstrip": false,
491
  "single_word": false
492
  },
493
  {
494
+ "content": "[GERUND_SUFFIX:CLASS_1:IYU]",
495
  "lstrip": false,
496
  "normalized": false,
497
  "rstrip": false,
498
  "single_word": false
499
  },
500
  {
501
+ "content": "r",
502
  "lstrip": false,
503
  "normalized": false,
504
  "rstrip": false,
505
  "single_word": false
506
  },
507
  {
508
+ "content": "i",
509
  "lstrip": false,
510
  "normalized": false,
511
  "rstrip": false,
512
  "single_word": false
513
  },
514
  {
515
+ "content": "ramo",
516
  "lstrip": false,
517
  "normalized": false,
518
  "rstrip": false,
519
  "single_word": false
520
  },
521
  {
522
+ "content": "[OBJECT:1ppe]",
523
  "lstrip": false,
524
  "normalized": false,
525
  "rstrip": false,
526
  "single_word": false
527
  },
528
  {
529
+ "content": "[OBJECT:3p:MONOSYLLABIC]",
530
  "lstrip": false,
531
  "normalized": false,
532
  "rstrip": false,
533
  "single_word": false
534
  },
535
  {
536
+ "content": "ta",
537
  "lstrip": false,
538
  "normalized": false,
539
  "rstrip": false,
540
  "single_word": false
541
  },
542
  {
543
+ "content": "[SUBJECT_PREFIX:2ps]",
544
  "lstrip": false,
545
  "normalized": false,
546
  "rstrip": false,
547
  "single_word": false
548
  },
549
  {
550
+ "content": "a'e",
551
  "lstrip": false,
552
  "normalized": false,
553
  "rstrip": false,
554
  "single_word": false
555
  },
556
  {
557
+ "content": "peîepé",
558
  "lstrip": false,
559
  "normalized": false,
560
  "rstrip": false,
561
  "single_word": false
562
  },
563
  {
564
+ "content": "a",
565
  "lstrip": false,
566
  "normalized": false,
567
  "rstrip": false,
568
  "single_word": false
569
  },
570
  {
571
+ "content": "[GERUND_SUBJECT_PREFIX:1ppe]",
572
  "lstrip": false,
573
  "normalized": false,
574
  "rstrip": false,
575
  "single_word": false
576
  },
577
  {
578
+ "content": "[GERUND_SUFFIX:CLASS_2:DEFAULT]",
579
  "lstrip": false,
580
  "normalized": false,
581
  "rstrip": false,
582
  "single_word": false
583
  },
584
  {
585
+ "content": "[SUBJECT:2pp]",
586
  "lstrip": false,
587
  "normalized": false,
588
  "rstrip": false,
589
  "single_word": false
590
  },
591
  {
592
+ "content": "[GERUND_SUFFIX:CLASS_1:NASAL_IYU]",
593
  "lstrip": false,
594
  "normalized": false,
595
  "rstrip": false,
596
  "single_word": false
597
  },
598
  {
599
+ "content": "[OBJECT:2ps]",
600
  "lstrip": false,
601
  "normalized": false,
602
  "rstrip": false,
603
  "single_word": false
604
  },
605
  {
606
+ "content": "[SUBJECT_PREFIX:1ppe]",
607
  "lstrip": false,
608
  "normalized": false,
609
  "rstrip": false,
610
  "single_word": false
611
  },
612
  {
613
+ "content": "[NEGATION_SUFFIX]",
614
  "lstrip": false,
615
  "normalized": false,
616
  "rstrip": false,
617
  "single_word": false
618
  },
619
  {
620
+ "content": "e",
621
  "lstrip": false,
622
  "normalized": false,
623
  "rstrip": false,
624
  "single_word": false
625
  },
626
  {
627
+ "content": "[PERMISSIVE_PREFIX:VOWEL]",
628
  "lstrip": false,
629
  "normalized": false,
630
  "rstrip": false,
631
  "single_word": false
632
  },
633
  {
634
+ "content": "[OBJECT:REFLEXIVE]",
635
  "lstrip": false,
636
  "normalized": false,
637
  "rstrip": false,
638
  "single_word": false
639
  },
640
  {
641
+ "content": "pa",
642
  "lstrip": false,
643
  "normalized": false,
644
  "rstrip": false,
645
  "single_word": false
646
  },
647
  {
648
+ "content": "[SUBJECT_PREFIX:2pp]",
649
  "lstrip": false,
650
  "normalized": false,
651
  "rstrip": false,
652
  "single_word": false
653
  },
654
  {
655
+ "content": "[GERUND_SUFFIX:CLASS_1:B]",
656
  "lstrip": false,
657
  "normalized": false,
658
  "rstrip": false,
659
  "single_word": false
660
  },
661
  {
662
+ "content": "[SUBJECT:2pp:OBJECT_1P]",
663
  "lstrip": false,
664
  "normalized": false,
665
  "rstrip": false,
666
  "single_word": false
667
  },
668
  {
669
+ "content": "oro",
670
  "lstrip": false,
671
  "normalized": false,
672
  "rstrip": false,
673
  "single_word": false
674
  },
675
  {
676
+ "content": "[NEGATION_SUFFIX:VOWEL_ENDING]",
677
  "lstrip": false,
678
  "normalized": false,
679
  "rstrip": false,
680
  "single_word": false
681
  },
682
  {
683
+ "content": "[CIRCUMSTANTIAL_SUFFIX:VOWEL_ENDING]",
684
  "lstrip": false,
685
  "normalized": false,
686
  "rstrip": false,
687
  "single_word": false
688
  },
689
  {
690
+ "content": "[CIRCUMSTANTIAL_SUFFIX:NULL_ENDING]",
691
  "lstrip": false,
692
  "normalized": false,
693
  "rstrip": false,
694
  "single_word": false
695
  },
696
  {
697
+ "content": "[IMPERATIVE_PREFIX:2ps]",
698
  "lstrip": false,
699
  "normalized": false,
700
  "rstrip": false,
701
  "single_word": false
702
  },
703
  {
704
+ "content": "[OBJECT_MARKER:3p:MONOSYLLABIC]",
705
  "lstrip": false,
706
  "normalized": false,
707
  "rstrip": false,
708
  "single_word": false
709
  },
710
  {
711
+ "content": "opo",
712
  "lstrip": false,
713
  "normalized": false,
714
  "rstrip": false,
715
  "single_word": false
716
  },
717
  {
718
+ "content": "îo",
719
  "lstrip": false,
720
  "normalized": false,
721
  "rstrip": false,
tokenizer_config.json CHANGED
@@ -1659,109 +1659,109 @@
1659
  }
1660
  },
1661
  "additional_special_tokens": [
 
 
 
 
 
1662
  "[GERUND_SUFFIX:CLASS_1]",
1663
- "[NEGATION_SUFFIX:VOWEL_ENDING]",
1664
- "[OBJECT:2pp]",
1665
- "[NEGATION_SUFFIX:CONSONANT_ENDING]",
 
1666
  "amo",
1667
- "oro",
1668
- "[OBJECT:MUTUAL]",
 
 
 
 
1669
  "[SUBJECT_PREFIX:1ppi]",
1670
- "[OBJECT_MARKER:3p:MONOSYLLABIC]",
1671
- "[GERUND_SUFFIX:CLASS_1:NASAL_VOWEL]",
1672
- "bo",
1673
- "́",
1674
- "[SUBJECT:1ps]",
1675
- "[SUBJECT:3p]",
1676
- "a",
1677
- "[OBJECT_MARKER:3p:DEFAULT]",
1678
- "îandé",
1679
- "[OBJECT:1ppe]",
1680
- "peîepé",
1681
- "[PERMISSIVE_PREFIX:VOWEL]",
1682
- "t",
1683
- "[SUBJECT_PREFIX:2pp]",
1684
- "[SUBJECT:1ppi]",
1685
  "í",
1686
- "[GERUND_SUBJECT_PREFIX:2pp]",
1687
- "[GERUND_SUBJECT_PREFIX:2ps]",
1688
- "[OBJECT:1ps]",
1689
- "[GERUND_SUFFIX:CLASS_1:IYU]",
1690
- "pe",
1691
  "n'",
1692
- "s",
1693
- "a'e",
1694
- "endé",
1695
- "ta",
1696
- "[SUBJECT_PREFIX:2ps]",
1697
- "[SUBJECT:2pp:OBJECT_1P]",
1698
- "[GERUND_SUBJECT_PREFIX:3p]",
1699
- "[CIRCUMSTANTIAL_SUFFIX:CONSONANT_ENDING]",
1700
- "îos",
1701
- "[NEGATION_PARTICLE:UME]",
1702
- "pa",
1703
- "[OBJECT:3p]",
1704
- "peẽ",
1705
- "e'ym",
1706
- "îo",
1707
- "[PLURIFORM_PREFIX:R]",
1708
- "namo",
1709
- "[NEGATION_PREFIX]",
1710
- "[IMPERATIVE_PREFIX:2pp]",
1711
  "[OBJECT:2pp:SUBJECT_1P]",
1712
- "[GERUND_SUFFIX:CLASS_1:NASAL_IYU]",
1713
- "îe",
1714
- "[OBJECT:REFLEXIVE]",
1715
  "[PERMISSIVE_PREFIX:CONSONANT]",
1716
- "[GERUND_SUBJECT_PREFIX:1ppi]",
 
 
1717
  "[OBJECT_MARKER:3p:PLURIFORM_PREFIX:MONOSYLLABIC]",
1718
- "[NEGATION_PARTICLE:NA]",
1719
- "[IMPERATIVE_PREFIX:2ps]",
1720
- "r",
1721
- "[PLURIFORM_PREFIX:S]",
1722
  "na",
1723
- "[NEGATION_SUFFIX]",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1724
  "ere",
 
 
1725
  "[SUBJECT:1ppe]",
1726
- "[SUBJECT_PREFIX:1ps]",
1727
- "[CIRCUMSTANTIAL_SUFFIX:VOWEL_ENDING]",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1728
  "i",
1729
- "abo",
1730
- "î",
1731
  "ramo",
1732
- "e",
1733
- "û",
1734
- "[GERUND_SUFFIX:CLASS_1:R]",
1735
- "[ROOT]",
1736
- "mo",
1737
- "ixé",
1738
- "[GERUND_SUFFIX:CLASS_2:NASAL_VOWEL_ENDING]",
1739
  "[OBJECT:3p:MONOSYLLABIC]",
 
 
 
 
 
1740
  "[GERUND_SUBJECT_PREFIX:1ppe]",
1741
- "oré",
1742
- "[GERUND_SUFFIX:CLASS_2:ORAL_VOWEL_ENDING]",
1743
- "[SUBJECT_PREFIX:3p]",
1744
- "[SUBJECT:2pp]",
1745
- "[SUBJECT:2ps]",
1746
- "[GERUND_SUFFIX:CLASS_1:ORAL_VOWEL]",
1747
- "[GERUND_SUFFIX:CLASS_1:CONSONANT]",
1748
  "[GERUND_SUFFIX:CLASS_2:DEFAULT]",
1749
- "[GERUND_SUFFIX:CLASS_1:B]",
1750
- "[SUBJECT:2ps:OBJECT_1P]",
1751
  "[OBJECT:2ps]",
 
 
 
 
 
 
 
 
 
 
 
 
1752
  "[CIRCUMSTANTIAL_SUFFIX:NULL_ENDING]",
1753
- "nde",
1754
- "o",
1755
- "xe",
1756
  "opo",
1757
- "[GERUND_SUBJECT_PREFIX:1ps]",
1758
- "gûi",
1759
- "[OBJECT:2ps:SUBJECT_1P]",
1760
- "îa",
1761
- "îepé",
1762
- "[SUBJECT_PREFIX:1ppe]",
1763
- "[OBJECT:1ppi]",
1764
- "umẽ"
1765
  ],
1766
  "clean_up_tokenization_spaces": true,
1767
  "eos_token": "</s>",
 
1659
  }
1660
  },
1661
  "additional_special_tokens": [
1662
+ "e'ym",
1663
+ "îepé",
1664
+ "[ROOT]",
1665
+ "[PLURIFORM_PREFIX:S]",
1666
+ "[OBJECT:1ps]",
1667
  "[GERUND_SUFFIX:CLASS_1]",
1668
+ "[OBJECT:2ps:SUBJECT_1P]",
1669
+ "[NEGATION_PARTICLE:NA]",
1670
+ "îe",
1671
+ "́",
1672
  "amo",
1673
+ "[GERUND_SUBJECT_PREFIX:1ppi]",
1674
+ "îa",
1675
+ "umẽ",
1676
+ "[GERUND_SUBJECT_PREFIX:1ps]",
1677
+ "[IMPERATIVE_PREFIX:2pp]",
1678
+ "o",
1679
  "[SUBJECT_PREFIX:1ppi]",
1680
+ "xe",
1681
+ "[SUBJECT_PREFIX:1ps]",
1682
+ "[PLURIFORM_PREFIX:R]",
 
 
 
 
 
 
 
 
 
 
 
 
1683
  "í",
 
 
 
 
 
1684
  "n'",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1685
  "[OBJECT:2pp:SUBJECT_1P]",
 
 
 
1686
  "[PERMISSIVE_PREFIX:CONSONANT]",
1687
+ "[SUBJECT:1ps]",
1688
+ "î",
1689
+ "[SUBJECT:2ps]",
1690
  "[OBJECT_MARKER:3p:PLURIFORM_PREFIX:MONOSYLLABIC]",
1691
+ "pe",
1692
+ "[NEGATION_PREFIX]",
1693
+ "[OBJECT:2pp]",
1694
+ "abo",
1695
  "na",
1696
+ "[GERUND_SUFFIX:CLASS_1:R]",
1697
+ "[SUBJECT_PREFIX:3p]",
1698
+ "[OBJECT:1ppi]",
1699
+ "[NEGATION_PARTICLE:UME]",
1700
+ "îandé",
1701
+ "[GERUND_SUFFIX:CLASS_1:ORAL_VOWEL]",
1702
+ "[NEGATION_SUFFIX:CONSONANT_ENDING]",
1703
+ "[GERUND_SUBJECT_PREFIX:2pp]",
1704
+ "[CIRCUMSTANTIAL_SUFFIX:CONSONANT_ENDING]",
1705
+ "[GERUND_SUFFIX:CLASS_2:ORAL_VOWEL_ENDING]",
1706
+ "gûi",
1707
+ "[GERUND_SUBJECT_PREFIX:2ps]",
1708
+ "ixé",
1709
+ "namo",
1710
+ "[OBJECT:3p]",
1711
  "ere",
1712
+ "mo",
1713
+ "[GERUND_SUFFIX:CLASS_2:NASAL_VOWEL_ENDING]",
1714
  "[SUBJECT:1ppe]",
1715
+ "[GERUND_SUBJECT_PREFIX:3p]",
1716
+ "[OBJECT_MARKER:3p:DEFAULT]",
1717
+ "[SUBJECT:1ppi]",
1718
+ "[GERUND_SUFFIX:CLASS_1:NASAL_VOWEL]",
1719
+ "peẽ",
1720
+ "s",
1721
+ "[SUBJECT:3p]",
1722
+ "û",
1723
+ "[SUBJECT:2ps:OBJECT_1P]",
1724
+ "îos",
1725
+ "nde",
1726
+ "endé",
1727
+ "[OBJECT:MUTUAL]",
1728
+ "[GERUND_SUFFIX:CLASS_1:CONSONANT]",
1729
+ "oré",
1730
+ "t",
1731
+ "bo",
1732
+ "[GERUND_SUFFIX:CLASS_1:IYU]",
1733
+ "r",
1734
  "i",
 
 
1735
  "ramo",
1736
+ "[OBJECT:1ppe]",
 
 
 
 
 
 
1737
  "[OBJECT:3p:MONOSYLLABIC]",
1738
+ "ta",
1739
+ "[SUBJECT_PREFIX:2ps]",
1740
+ "a'e",
1741
+ "peîepé",
1742
+ "a",
1743
  "[GERUND_SUBJECT_PREFIX:1ppe]",
 
 
 
 
 
 
 
1744
  "[GERUND_SUFFIX:CLASS_2:DEFAULT]",
1745
+ "[SUBJECT:2pp]",
1746
+ "[GERUND_SUFFIX:CLASS_1:NASAL_IYU]",
1747
  "[OBJECT:2ps]",
1748
+ "[SUBJECT_PREFIX:1ppe]",
1749
+ "[NEGATION_SUFFIX]",
1750
+ "e",
1751
+ "[PERMISSIVE_PREFIX:VOWEL]",
1752
+ "[OBJECT:REFLEXIVE]",
1753
+ "pa",
1754
+ "[SUBJECT_PREFIX:2pp]",
1755
+ "[GERUND_SUFFIX:CLASS_1:B]",
1756
+ "[SUBJECT:2pp:OBJECT_1P]",
1757
+ "oro",
1758
+ "[NEGATION_SUFFIX:VOWEL_ENDING]",
1759
+ "[CIRCUMSTANTIAL_SUFFIX:VOWEL_ENDING]",
1760
  "[CIRCUMSTANTIAL_SUFFIX:NULL_ENDING]",
1761
+ "[IMPERATIVE_PREFIX:2ps]",
1762
+ "[OBJECT_MARKER:3p:MONOSYLLABIC]",
 
1763
  "opo",
1764
+ "îo"
 
 
 
 
 
 
 
1765
  ],
1766
  "clean_up_tokenization_spaces": true,
1767
  "eos_token": "</s>",