gbenson committed on
Commit
7bc4f29
·
1 Parent(s): e9fd7a4

Configure [BOS] and [EOS] properly

Browse files
Files changed (2) hide show
  1. special_tokens_map.json +2 -0
  2. tokenizer_config.json +2 -0
special_tokens_map.json CHANGED
@@ -8,7 +8,9 @@
8
  "[BASE64]",
9
  "[LONG]"
10
  ],
 
11
  "cls_token": "[CLS]",
 
12
  "mask_token": "[MASK]",
13
  "pad_token": "[PAD]",
14
  "sep_token": "[SEP]",
 
8
  "[BASE64]",
9
  "[LONG]"
10
  ],
11
+ "bos_token": "[BOS]",
12
  "cls_token": "[CLS]",
13
+ "eos_token": "[EOS]",
14
  "mask_token": "[MASK]",
15
  "pad_token": "[PAD]",
16
  "sep_token": "[SEP]",
tokenizer_config.json CHANGED
@@ -106,9 +106,11 @@
106
  "[BASE64]",
107
  "[LONG]"
108
  ],
 
109
  "clean_up_tokenization_spaces": true,
110
  "cls_token": "[CLS]",
111
  "do_lower_case": true,
 
112
  "mask_token": "[MASK]",
113
  "model_max_length": 512,
114
  "pad_token": "[PAD]",
 
106
  "[BASE64]",
107
  "[LONG]"
108
  ],
109
+ "bos_token": "[BOS]",
110
  "clean_up_tokenization_spaces": true,
111
  "cls_token": "[CLS]",
112
  "do_lower_case": true,
113
+ "eos_token": "[EOS]",
114
  "mask_token": "[MASK]",
115
  "model_max_length": 512,
116
  "pad_token": "[PAD]",