Upload folder using huggingface_hub

Files changed (4) hide show

added_tokens.json CHANGED Viewed

@@ -1,7 +1,4 @@
 {
-  "[CLS]": 8102,
-  "[MASK]": 8103,
-  "[PAD]": 8101,
-  "[SEP]": 8100,
-  "[UNK]": 8099
 }

 {
+  "[MASK]": 8105,
+  "[SEP]": 8104
 }

tokenizer.json CHANGED Viewed

@@ -4,7 +4,7 @@
   "padding": null,
   "added_tokens": [
     {
-      "id": 8099,
       "content": "[UNK]",
       "single_word": false,
       "lstrip": false,
@@ -13,8 +13,8 @@
       "special": true
     },
     {
-      "id": 8100,
-      "content": "[SEP]",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
@@ -22,8 +22,8 @@
       "special": true
     },
     {
-      "id": 8101,
-      "content": "[PAD]",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
@@ -31,8 +31,8 @@
       "special": true
     },
     {
-      "id": 8102,
-      "content": "[CLS]",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
@@ -40,7 +40,7 @@
       "special": true
     },
     {
-      "id": 8103,
       "content": "[MASK]",
       "single_word": false,
       "lstrip": false,
@@ -117,7 +117,7 @@
       "[CLS]": {
         "id": "[CLS]",
         "ids": [
-          8102
         ],
         "tokens": [
           "[CLS]"
@@ -126,7 +126,7 @@
       "[SEP]": {
         "id": "[SEP]",
         "ids": [
-          8100
         ],
         "tokens": [
           "[SEP]"
@@ -8243,7 +8243,12 @@
       "}": 8098,
       "~": 8099,
       "": 8100,
-      "�": 8101
     }
   }
 }

   "padding": null,
   "added_tokens": [
     {
+      "id": 8101,
       "content": "[UNK]",
       "single_word": false,
       "lstrip": false,
       "special": true
     },
     {
+      "id": 8102,
+      "content": "[PAD]",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
       "special": true
     },
     {
+      "id": 8103,
+      "content": "[CLS]",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
       "special": true
     },
     {
+      "id": 8104,
+      "content": "[SEP]",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
       "special": true
     },
     {
+      "id": 8105,
       "content": "[MASK]",
       "single_word": false,
       "lstrip": false,
       "[CLS]": {
         "id": "[CLS]",
         "ids": [
+          8103
         ],
         "tokens": [
           "[CLS]"
       "[SEP]": {
         "id": "[SEP]",
         "ids": [
+          8104
         ],
         "tokens": [
           "[SEP]"
       "}": 8098,
       "~": 8099,
       "": 8100,
+      "[UNK]": 8101,
+      "[PAD]": 8102,
+      "[CLS]": 8103,
+      "[SEP]": 8104,
+      "[MASK]": 8105,
+      "�": 8106
     }
   }
 }

tokenizer_config.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "added_tokens_decoder": {
-    "8099": {
       "content": "[UNK]",
       "lstrip": false,
       "normalized": false,
@@ -8,31 +8,31 @@
       "single_word": false,
       "special": true
     },
-    "8100": {
-      "content": "[SEP]",
       "lstrip": false,
       "normalized": false,
       "rstrip": false,
       "single_word": false,
       "special": true
     },
-    "8101": {
-      "content": "[PAD]",
       "lstrip": false,
       "normalized": false,
       "rstrip": false,
       "single_word": false,
       "special": true
     },
-    "8102": {
-      "content": "[CLS]",
       "lstrip": false,
       "normalized": false,
       "rstrip": false,
       "single_word": false,
       "special": true
     },
-    "8103": {
       "content": "[MASK]",
       "lstrip": false,
       "normalized": false,

 {
   "added_tokens_decoder": {
+    "8101": {
       "content": "[UNK]",
       "lstrip": false,
       "normalized": false,
       "single_word": false,
       "special": true
     },
+    "8102": {
+      "content": "[PAD]",
       "lstrip": false,
       "normalized": false,
       "rstrip": false,
       "single_word": false,
       "special": true
     },
+    "8103": {
+      "content": "[CLS]",
       "lstrip": false,
       "normalized": false,
       "rstrip": false,
       "single_word": false,
       "special": true
     },
+    "8104": {
+      "content": "[SEP]",
       "lstrip": false,
       "normalized": false,
       "rstrip": false,
       "single_word": false,
       "special": true
     },
+    "8105": {
       "content": "[MASK]",
       "lstrip": false,
       "normalized": false,

vocab.txt CHANGED Viewed

@@ -8096,4 +8096,9 @@ z
 }
 ~
 �

 }
 ~
+[UNK]
+[PAD]
+[CLS]
+[SEP]
+[MASK]
 �