Upload tokenizer.json
Browse files- tokenizer.json +4 -5
tokenizer.json
CHANGED
@@ -2097,15 +2097,15 @@
|
|
2097 |
"pre_tokenizer": {
|
2098 |
"type": "Metaspace",
|
2099 |
"replacement": "▁",
|
2100 |
-
"prepend_scheme": "always",
|
2101 |
-
"split": true
|
2102 |
},
|
2103 |
"post_processor": null,
|
2104 |
"decoder": {
|
2105 |
"type": "Metaspace",
|
2106 |
"replacement": "▁",
|
2107 |
-
"prepend_scheme": "always",
|
2108 |
-
"split": true
|
2109 |
},
|
2110 |
"model": {
|
2111 |
"type": "BPE",
|
@@ -2115,7 +2115,6 @@
|
|
2115 |
"end_of_word_suffix": null,
|
2116 |
"fuse_unk": false,
|
2117 |
"byte_fallback": false,
|
2118 |
-
"ignore_merges": false,
|
2119 |
"vocab": {
|
2120 |
"<s>": 0,
|
2121 |
"</s>": 1,
|
|
|
2097 |
"pre_tokenizer": {
|
2098 |
"type": "Metaspace",
|
2099 |
"replacement": "▁",
|
2100 |
+
"add_prefix_space": true,
|
2101 |
+
"prepend_scheme": "always"
|
2102 |
},
|
2103 |
"post_processor": null,
|
2104 |
"decoder": {
|
2105 |
"type": "Metaspace",
|
2106 |
"replacement": "▁",
|
2107 |
+
"add_prefix_space": true,
|
2108 |
+
"prepend_scheme": "always"
|
2109 |
},
|
2110 |
"model": {
|
2111 |
"type": "BPE",
|
|
|
2115 |
"end_of_word_suffix": null,
|
2116 |
"fuse_unk": false,
|
2117 |
"byte_fallback": false,
|
|
|
2118 |
"vocab": {
|
2119 |
"<s>": 0,
|
2120 |
"</s>": 1,
|