kkuramitsu committed on
Commit
9d34a7a
1 Parent(s): 55ce49b

Upload tokenizer.json

Browse files
Files changed (1) hide show
  1. tokenizer.json +4 -22
tokenizer.json CHANGED
@@ -50,7 +50,7 @@
50
  },
51
  {
52
  "id": 5,
53
- "content": "<CLS|LLM-jp>",
54
  "single_word": false,
55
  "lstrip": false,
56
  "rstrip": false,
@@ -59,7 +59,7 @@
59
  },
60
  {
61
  "id": 6,
62
- "content": "<SEP|LLM-jp>",
63
  "single_word": false,
64
  "lstrip": false,
65
  "rstrip": false,
@@ -104,12 +104,6 @@
104
  "id": "A",
105
  "type_id": 0
106
  }
107
- },
108
- {
109
- "SpecialToken": {
110
- "id": "<EOD|LLM-jp>",
111
- "type_id": 0
112
- }
113
  }
114
  ],
115
  "pair": [
@@ -119,23 +113,11 @@
119
  "type_id": 0
120
  }
121
  },
122
- {
123
- "SpecialToken": {
124
- "id": "<EOD|LLM-jp>",
125
- "type_id": 0
126
- }
127
- },
128
  {
129
  "Sequence": {
130
  "id": "B",
131
  "type_id": 1
132
  }
133
- },
134
- {
135
- "SpecialToken": {
136
- "id": "<EOD|LLM-jp>",
137
- "type_id": 1
138
- }
139
  }
140
  ],
141
  "special_tokens": {
@@ -200,11 +182,11 @@
200
  0.0
201
  ],
202
  [
203
- "<CLS|LLM-jp>",
204
  0.0
205
  ],
206
  [
207
- "<SEP|LLM-jp>",
208
  0.0
209
  ],
210
  [
 
50
  },
51
  {
52
  "id": 5,
53
+ "content": "<|im_start|>",
54
  "single_word": false,
55
  "lstrip": false,
56
  "rstrip": false,
 
59
  },
60
  {
61
  "id": 6,
62
+ "content": "<|im_end|>",
63
  "single_word": false,
64
  "lstrip": false,
65
  "rstrip": false,
 
104
  "id": "A",
105
  "type_id": 0
106
  }
 
 
 
 
 
 
107
  }
108
  ],
109
  "pair": [
 
113
  "type_id": 0
114
  }
115
  },
 
 
 
 
 
 
116
  {
117
  "Sequence": {
118
  "id": "B",
119
  "type_id": 1
120
  }
 
 
 
 
 
 
121
  }
122
  ],
123
  "special_tokens": {
 
182
  0.0
183
  ],
184
  [
185
+ "<|im_start|>",
186
  0.0
187
  ],
188
  [
189
+ "<|im_end|>",
190
  0.0
191
  ],
192
  [