Maxime62 committed on
Commit
4ca8a5c
·
verified ·
1 Parent(s): 217a890

Upload tokenizer

Browse files
Files changed (1) hide show
  1. tokenizer_config.json +2 -1
tokenizer_config.json CHANGED
@@ -1,7 +1,6 @@
1
  {
2
  "add_bos_token": true,
3
  "add_eos_token": false,
4
- "add_prefix_space": true,
5
  "added_tokens_decoder": {
6
  "0": {
7
  "content": "<unk>",
@@ -40,12 +39,14 @@
40
  "clean_up_tokenization_spaces": false,
41
  "eos_token": "</s>",
42
  "legacy": false,
 
43
  "model_max_length": 1000000000000000019884624838656,
44
  "pad_token": "<s>",
45
  "padding_side": "right",
46
  "sp_model_kwargs": {},
47
  "spaces_between_special_tokens": false,
48
  "tokenizer_class": "LlamaTokenizer",
 
49
  "unk_token": "<unk>",
50
  "use_default_system_prompt": false
51
  }
 
1
  {
2
  "add_bos_token": true,
3
  "add_eos_token": false,
 
4
  "added_tokens_decoder": {
5
  "0": {
6
  "content": "<unk>",
 
39
  "clean_up_tokenization_spaces": false,
40
  "eos_token": "</s>",
41
  "legacy": false,
42
+ "max_seq_length": 2048,
43
  "model_max_length": 1000000000000000019884624838656,
44
  "pad_token": "<s>",
45
  "padding_side": "right",
46
  "sp_model_kwargs": {},
47
  "spaces_between_special_tokens": false,
48
  "tokenizer_class": "LlamaTokenizer",
49
+ "truncation": true,
50
  "unk_token": "<unk>",
51
  "use_default_system_prompt": false
52
  }