foxxy-hm commited on
Commit
dd0c1c7
·
1 Parent(s): 1ce0c5e

Upload processor

Browse files
Files changed (1) hide show
  1. vocab.json +112 -1
vocab.json CHANGED
@@ -1 +1,112 @@
1
- {"\u1ecf": 0, "\u1ef7": 1, "\u0301": 2, "u": 3, "%": 4, "\u1ee5": 5, "\u1ee1": 6, "\u0443": 7, "\u1eaf": 8, "\u00fd": 9, "9": 10, "k": 11, "\u0169": 12, "\u1ec5": 13, "\u1eeb": 14, "\u1eed": 15, "\u1ee7": 16, "e": 17, "\u1eb1": 18, "\u1ea9": 19, "\u1ec1": 20, "b": 21, "\u1ef1": 22, "\u1ead": 23, "\u00e0": 24, "\u00f2": 25, "t": 26, "\u1edb": 27, "q": 28, "0": 29, "\u0300": 30, "\u1ecb": 31, "\u1ec3": 32, "c": 33, "\u1eb7": 35, "\u1eab": 36, "\u00e9": 37, "\u1ea1": 38, "\u1ed9": 39, "o": 40, "\u1ed1": 41, "5": 42, "\u01a1": 43, "z": 44, "\u1ef5": 45, "i": 46, "\u0129": 47, "\u0111": 48, "v": 49, "\u1ea3": 50, "\u01b0": 51, "\u00f3": 52, "r": 53, "a": 54, "\u1ea7": 55, "s": 56, "y": 57, "\u00fa": 58, "\u1ef9": 59, "x": 60, "d": 61, "\u00ed": 62, "\u1eef": 63, "4": 64, "m": 65, "f": 66, "\u00ec": 67, "\u00e8": 68, "\u1ee9": 69, "\u0323": 70, "\u1eb3": 71, "\u1ecd": 72, "3": 73, "\u1ed3": 74, "\u1eb5": 75, "\u00f9": 76, "l": 77, "p": 78, "6": 79, "\u1eb9": 80, "\u00ea": 81, "\u00f4": 82, "\u00e1": 83, "\u1ea5": 84, "\u00e2": 85, "\u1ed7": 86, "\u1ebd": 87, "h": 88, "\u00f5": 89, "\u1ebb": 90, "g": 91, "\u1ee3": 92, "\u1edd": 93, "n": 94, "2": 95, "\u00e3": 96, "1": 97, "\u0103": 98, "7": 99, "w": 100, "\u1edf": 101, "\u1ebf": 102, "\u1ec7": 103, "\u1ed5": 104, "\u1ef3": 105, "\u1ec9": 106, "8": 107, "|": 34, "[UNK]": 108, "[PAD]": 109}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "%": 4,
3
+ "0": 29,
4
+ "1": 97,
5
+ "2": 95,
6
+ "3": 73,
7
+ "4": 64,
8
+ "5": 42,
9
+ "6": 79,
10
+ "7": 99,
11
+ "8": 107,
12
+ "9": 10,
13
+ "[PAD]": 109,
14
+ "[UNK]": 108,
15
+ "a": 54,
16
+ "b": 21,
17
+ "c": 33,
18
+ "d": 61,
19
+ "e": 17,
20
+ "f": 66,
21
+ "g": 91,
22
+ "h": 88,
23
+ "i": 46,
24
+ "k": 11,
25
+ "l": 77,
26
+ "m": 65,
27
+ "n": 94,
28
+ "o": 40,
29
+ "p": 78,
30
+ "q": 28,
31
+ "r": 53,
32
+ "s": 56,
33
+ "t": 26,
34
+ "u": 3,
35
+ "v": 49,
36
+ "w": 100,
37
+ "x": 60,
38
+ "y": 57,
39
+ "z": 44,
40
+ "|": 34,
41
+ "à": 24,
42
+ "á": 83,
43
+ "â": 85,
44
+ "ã": 96,
45
+ "è": 68,
46
+ "é": 37,
47
+ "ê": 81,
48
+ "ì": 67,
49
+ "í": 62,
50
+ "ò": 25,
51
+ "ó": 52,
52
+ "ô": 82,
53
+ "õ": 89,
54
+ "ù": 76,
55
+ "ú": 58,
56
+ "ý": 9,
57
+ "ă": 98,
58
+ "đ": 48,
59
+ "ĩ": 47,
60
+ "ũ": 12,
61
+ "ơ": 43,
62
+ "ư": 51,
63
+ "̀": 30,
64
+ "́": 2,
65
+ "̣": 70,
66
+ "у": 7,
67
+ "ạ": 38,
68
+ "ả": 50,
69
+ "ấ": 84,
70
+ "ầ": 55,
71
+ "ẩ": 19,
72
+ "ẫ": 36,
73
+ "ậ": 23,
74
+ "ắ": 8,
75
+ "ằ": 18,
76
+ "ẳ": 71,
77
+ "ẵ": 75,
78
+ "ặ": 35,
79
+ "ẹ": 80,
80
+ "ẻ": 90,
81
+ "ẽ": 87,
82
+ "ế": 102,
83
+ "ề": 20,
84
+ "ể": 32,
85
+ "ễ": 13,
86
+ "ệ": 103,
87
+ "ỉ": 106,
88
+ "ị": 31,
89
+ "ọ": 72,
90
+ "ỏ": 0,
91
+ "ố": 41,
92
+ "ồ": 74,
93
+ "ổ": 104,
94
+ "ỗ": 86,
95
+ "ộ": 39,
96
+ "ớ": 27,
97
+ "ờ": 93,
98
+ "ở": 101,
99
+ "ỡ": 6,
100
+ "ợ": 92,
101
+ "ụ": 5,
102
+ "ủ": 16,
103
+ "ứ": 69,
104
+ "ừ": 14,
105
+ "ử": 15,
106
+ "ữ": 63,
107
+ "ự": 22,
108
+ "ỳ": 105,
109
+ "ỵ": 45,
110
+ "ỷ": 1,
111
+ "ỹ": 59
112
+ }