chrisociepa
committed on
Commit
•
474848e
1
Parent(s):
2c74a1f
Fix configs
Browse files
- generation_config.json +4 -2
- special_tokens_map.json +1 -1
- tokenizer.json +29 -1
- tokenizer_config.json +1 -1
generation_config.json
CHANGED
@@ -1,6 +1,8 @@
|
|
1 |
{
|
2 |
"_from_model_config": true,
|
3 |
"bos_token_id": 1,
|
4 |
-
"eos_token_id":
|
5 |
-
"
|
|
|
|
|
6 |
}
|
|
|
1 |
{
|
2 |
"_from_model_config": true,
|
3 |
"bos_token_id": 1,
|
4 |
+
"eos_token_id": 32001,
|
5 |
+
"pad_token": 2,
|
6 |
+
"unk_token": 0,
|
7 |
+
"transformers_version": "4.39.3"
|
8 |
}
|
special_tokens_map.json
CHANGED
@@ -137,7 +137,7 @@
|
|
137 |
"single_word": false
|
138 |
},
|
139 |
"eos_token": {
|
140 |
-
"content": "
|
141 |
"lstrip": false,
|
142 |
"normalized": false,
|
143 |
"rstrip": false,
|
|
|
137 |
"single_word": false
|
138 |
},
|
139 |
"eos_token": {
|
140 |
+
"content": "<|im_end|>",
|
141 |
"lstrip": false,
|
142 |
"normalized": false,
|
143 |
"rstrip": false,
|
tokenizer.json
CHANGED
@@ -1203,6 +1203,12 @@
|
|
1203 |
"post_processor": {
|
1204 |
"type": "TemplateProcessing",
|
1205 |
"single": [
|
|
|
|
|
|
|
|
|
|
|
|
|
1206 |
{
|
1207 |
"Sequence": {
|
1208 |
"id": "A",
|
@@ -1211,12 +1217,24 @@
|
|
1211 |
}
|
1212 |
],
|
1213 |
"pair": [
|
|
|
|
|
|
|
|
|
|
|
|
|
1214 |
{
|
1215 |
"Sequence": {
|
1216 |
"id": "A",
|
1217 |
"type_id": 0
|
1218 |
}
|
1219 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
1220 |
{
|
1221 |
"Sequence": {
|
1222 |
"id": "B",
|
@@ -1224,7 +1242,17 @@
|
|
1224 |
}
|
1225 |
}
|
1226 |
],
|
1227 |
-
"special_tokens": {
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1228 |
},
|
1229 |
"decoder": {
|
1230 |
"type": "Sequence",
|
|
|
1203 |
"post_processor": {
|
1204 |
"type": "TemplateProcessing",
|
1205 |
"single": [
|
1206 |
+
{
|
1207 |
+
"SpecialToken": {
|
1208 |
+
"id": "<s>",
|
1209 |
+
"type_id": 0
|
1210 |
+
}
|
1211 |
+
},
|
1212 |
{
|
1213 |
"Sequence": {
|
1214 |
"id": "A",
|
|
|
1217 |
}
|
1218 |
],
|
1219 |
"pair": [
|
1220 |
+
{
|
1221 |
+
"SpecialToken": {
|
1222 |
+
"id": "<s>",
|
1223 |
+
"type_id": 0
|
1224 |
+
}
|
1225 |
+
},
|
1226 |
{
|
1227 |
"Sequence": {
|
1228 |
"id": "A",
|
1229 |
"type_id": 0
|
1230 |
}
|
1231 |
},
|
1232 |
+
{
|
1233 |
+
"SpecialToken": {
|
1234 |
+
"id": "<s>",
|
1235 |
+
"type_id": 1
|
1236 |
+
}
|
1237 |
+
},
|
1238 |
{
|
1239 |
"Sequence": {
|
1240 |
"id": "B",
|
|
|
1242 |
}
|
1243 |
}
|
1244 |
],
|
1245 |
+
"special_tokens": {
|
1246 |
+
"<s>": {
|
1247 |
+
"id": "<s>",
|
1248 |
+
"ids": [
|
1249 |
+
1
|
1250 |
+
],
|
1251 |
+
"tokens": [
|
1252 |
+
"<s>"
|
1253 |
+
]
|
1254 |
+
}
|
1255 |
+
}
|
1256 |
},
|
1257 |
"decoder": {
|
1258 |
"type": "Sequence",
|
tokenizer_config.json
CHANGED
@@ -1185,7 +1185,7 @@
|
|
1185 |
"bos_token": "<s>",
|
1186 |
"chat_template": "{{bos_token}}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
|
1187 |
"clean_up_tokenization_spaces": true,
|
1188 |
-
"eos_token": "
|
1189 |
"legacy": true,
|
1190 |
"model_max_length": 1000000000000000019884624838656,
|
1191 |
"pad_token": "</s>",
|
|
|
1185 |
"bos_token": "<s>",
|
1186 |
"chat_template": "{{bos_token}}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
|
1187 |
"clean_up_tokenization_spaces": true,
|
1188 |
+
"eos_token": "<|im_end|>",
|
1189 |
"legacy": true,
|
1190 |
"model_max_length": 1000000000000000019884624838656,
|
1191 |
"pad_token": "</s>",
|