mjbommar committed on
Commit
afc451b
·
verified ·
1 Parent(s): 9d1a15a

Fix tokenizer_config.json special token names

Browse files
Files changed (1) hide show
  1. tokenizer_config.json +8 -6
tokenizer_config.json CHANGED
@@ -1,9 +1,11 @@
1
  {
2
  "tokenizer_class": "PreTrainedTokenizerFast",
3
  "model_max_length": 512,
4
- "pad_token": "[PAD]",
5
- "mask_token": "[MASK]",
6
- "cls_token": "[CLS]",
7
- "sep_token": "[SEP]",
8
- "unk_token": "[UNK]"
9
- }
 
 
 
1
  {
2
  "tokenizer_class": "PreTrainedTokenizerFast",
3
  "model_max_length": 512,
4
+ "bos_token": "<|start|>",
5
+ "eos_token": "<|end|>",
6
+ "pad_token": "<|pad|>",
7
+ "unk_token": "<|unk|>",
8
+ "cls_token": "<|cls|>",
9
+ "sep_token": "<|sep|>",
10
+ "mask_token": "<|mask|>"
11
+ }