danielhanchen committed on
Commit
a0d755f
·
verified ·
1 Parent(s): ec5423d

Upload tokenizer

Browse files
Files changed (2) hide show
  1. tokenizer.json +0 -0
  2. tokenizer_config.json +8 -0
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -137,6 +137,14 @@
137
  "single_word": false,
138
  "special": true
139
  },
 
 
 
 
 
 
 
 
140
  "49152": {
141
  "content": "<|PAD_TOKEN|>",
142
  "lstrip": false,
 
137
  "single_word": false,
138
  "special": true
139
  },
140
+ "24211": {
141
+ "content": "�",
142
+ "lstrip": false,
143
+ "normalized": false,
144
+ "rstrip": false,
145
+ "single_word": false,
146
+ "special": true
147
+ },
148
  "49152": {
149
  "content": "<|PAD_TOKEN|>",
150
  "lstrip": false,