pglo committed on
Commit
d70d78e
1 Parent(s): 9c62ec0

update tokenizer config

Browse files
special_tokens_map.json CHANGED
@@ -23,12 +23,5 @@
23
  "normalized": false,
24
  "rstrip": false,
25
  "single_word": false
26
- },
27
- "unk_token": {
28
- "content": "<unk>",
29
- "lstrip": false,
30
- "normalized": false,
31
- "rstrip": false,
32
- "single_word": false
33
  }
34
  }
 
23
  "normalized": false,
24
  "rstrip": false,
25
  "single_word": false
 
 
 
 
 
 
 
26
  }
27
  }
tokenizer.json CHANGED
@@ -129,7 +129,7 @@
129
  "model": {
130
  "type": "BPE",
131
  "dropout": null,
132
- "unk_token": "<unk>",
133
  "continuing_subword_prefix": null,
134
  "end_of_word_suffix": null,
135
  "fuse_unk": true,
 
129
  "model": {
130
  "type": "BPE",
131
  "dropout": null,
132
+ "unk_token": null,
133
  "continuing_subword_prefix": null,
134
  "end_of_word_suffix": null,
135
  "fuse_unk": true,
tokenizer_config.json CHANGED
@@ -46,6 +46,6 @@
46
  "tokenizer_class": "LlamaTokenizer",
47
  "truncation_side": "right",
48
  "truncation_strategy": "longest_first",
49
- "unk_token": "<unk>",
50
  "use_default_system_prompt": false
51
  }
 
46
  "tokenizer_class": "LlamaTokenizer",
47
  "truncation_side": "right",
48
  "truncation_strategy": "longest_first",
49
+ "unk_token": null,
50
  "use_default_system_prompt": false
51
  }