julio-mm committed on
Commit
40a9660
·
1 Parent(s): ecf0957

Delete tokenizer

Browse files
tokenizer/special_tokens_map.json DELETED
@@ -1,7 +0,0 @@
1
- {
2
- "cls_token": "[CLS]",
3
- "mask_token": "[MASK]",
4
- "pad_token": "[PAD]",
5
- "sep_token": "[SEP]",
6
- "unk_token": "[UNK]"
7
- }
 
 
 
 
 
 
 
 
tokenizer/tokenizer.json DELETED
The diff for this file is too large to render. See raw diff
 
tokenizer/tokenizer_config.json DELETED
@@ -1,13 +0,0 @@
1
- {
2
- "cls_token": "[CLS]",
3
- "do_lower_case": true,
4
- "mask_token": "[MASK]",
5
- "model_max_length": 512,
6
- "pad_token": "[PAD]",
7
- "sep_token": "[SEP]",
8
- "special_tokens_map_file": null,
9
- "strip_accents": null,
10
- "tokenize_chinese_chars": true,
11
- "tokenizer_class": "DistilBertTokenizer",
12
- "unk_token": "[UNK]"
13
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tokenizer/vocab.txt DELETED
The diff for this file is too large to render. See raw diff