Configure [BOS] and [EOS] properly
Browse files
- special_tokens_map.json +2 -0
- tokenizer_config.json +2 -0
special_tokens_map.json
CHANGED
@@ -8,7 +8,9 @@
|
|
8 |
"[BASE64]",
|
9 |
"[LONG]"
|
10 |
],
|
|
|
11 |
"cls_token": "[CLS]",
|
|
|
12 |
"mask_token": "[MASK]",
|
13 |
"pad_token": "[PAD]",
|
14 |
"sep_token": "[SEP]",
|
|
|
8 |
"[BASE64]",
|
9 |
"[LONG]"
|
10 |
],
|
11 |
+
"bos_token": "[BOS]",
|
12 |
"cls_token": "[CLS]",
|
13 |
+
"eos_token": "[EOS]",
|
14 |
"mask_token": "[MASK]",
|
15 |
"pad_token": "[PAD]",
|
16 |
"sep_token": "[SEP]",
|
tokenizer_config.json
CHANGED
@@ -106,9 +106,11 @@
|
|
106 |
"[BASE64]",
|
107 |
"[LONG]"
|
108 |
],
|
|
|
109 |
"clean_up_tokenization_spaces": true,
|
110 |
"cls_token": "[CLS]",
|
111 |
"do_lower_case": true,
|
|
|
112 |
"mask_token": "[MASK]",
|
113 |
"model_max_length": 512,
|
114 |
"pad_token": "[PAD]",
|
|
|
106 |
"[BASE64]",
|
107 |
"[LONG]"
|
108 |
],
|
109 |
+
"bos_token": "[BOS]",
|
110 |
"clean_up_tokenization_spaces": true,
|
111 |
"cls_token": "[CLS]",
|
112 |
"do_lower_case": true,
|
113 |
+
"eos_token": "[EOS]",
|
114 |
"mask_token": "[MASK]",
|
115 |
"model_max_length": 512,
|
116 |
"pad_token": "[PAD]",
|