Upload tokenizer
Browse files- tokenizer_config.json +3 -4
tokenizer_config.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
"add_bos_token": true,
|
3 |
-
"add_pad_token":true,
|
4 |
"add_eos_token": false,
|
|
|
5 |
"added_tokens_decoder": {
|
6 |
"0": {
|
7 |
"content": "<unk>",
|
@@ -54,6 +54,8 @@
|
|
54 |
"rstrip": false,
|
55 |
"single_word": false
|
56 |
},
|
|
|
|
|
57 |
"pad_token": {
|
58 |
"__type": "AddedToken",
|
59 |
"content": "|<pad>|",
|
@@ -62,9 +64,6 @@
|
|
62 |
"rstrip": false,
|
63 |
"single_word": false
|
64 |
},
|
65 |
-
"legacy": false,
|
66 |
-
"model_max_length": 2048,
|
67 |
-
|
68 |
"padding_side": "left",
|
69 |
"sp_model_kwargs": {},
|
70 |
"tokenizer_class": "LlamaTokenizer",
|
|
|
1 |
{
|
2 |
"add_bos_token": true,
|
|
|
3 |
"add_eos_token": false,
|
4 |
+
"add_pad_token": true,
|
5 |
"added_tokens_decoder": {
|
6 |
"0": {
|
7 |
"content": "<unk>",
|
|
|
54 |
"rstrip": false,
|
55 |
"single_word": false
|
56 |
},
|
57 |
+
"legacy": false,
|
58 |
+
"model_max_length": 2048,
|
59 |
"pad_token": {
|
60 |
"__type": "AddedToken",
|
61 |
"content": "|<pad>|",
|
|
|
64 |
"rstrip": false,
|
65 |
"single_word": false
|
66 |
},
|
|
|
|
|
|
|
67 |
"padding_side": "left",
|
68 |
"sp_model_kwargs": {},
|
69 |
"tokenizer_class": "LlamaTokenizer",
|