DylanJHJ
/

glove.6B.300d

Model card · Files and versions

DylanJHJ committed on Feb 2

Commit

eb9ab75

·

verified ·

1 Parent(s): 8a1fe7b

Upload tokenizer

Files changed (3) hide show

special_tokens_map.json +3 -1
tokenizer.json +21 -1
tokenizer_config.json +18 -0

special_tokens_map.json CHANGED Viewed

@@ -1,4 +1,6 @@
 {
   "mask_token": "[MASK]",
-  "pad_token": "PADDING_TOKEN"
 }

 {
+  "cls_token": "[CLS]",
   "mask_token": "[MASK]",
+  "pad_token": "PADDING_TOKEN",
+  "sep_token": "[SEP]"
 }

tokenizer.json CHANGED Viewed

@@ -14,6 +14,24 @@
     },
     {
       "id": 400006,
       "content": "[MASK]",
       "single_word": false,
       "lstrip": false,
@@ -400036,7 +400054,9 @@
       "[unused0]": 400002,
       "[unused1]": 400003,
       "[Q]": 400004,
-      "[D]": 400005
     },
     "unk_token": "[UNK]"
   }

     },
     {
       "id": 400006,
+      "content": "[CLS]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 400007,
+      "content": "[SEP]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 400008,
       "content": "[MASK]",
       "single_word": false,
       "lstrip": false,
       "[unused0]": 400002,
       "[unused1]": 400003,
       "[Q]": 400004,
+      "[D]": 400005,
+      "[CLS]": 400006,
+      "[SEP]": 400007
     },
     "unk_token": "[UNK]"
   }

tokenizer_config.json CHANGED Viewed

@@ -9,6 +9,22 @@
       "special": true
     },
     "400006": {
       "content": "[MASK]",
       "lstrip": false,
       "normalized": false,
@@ -18,8 +34,10 @@
     }
   },
   "clean_up_tokenization_spaces": false,
   "mask_token": "[MASK]",
   "model_max_length": 1000000000000000019884624838656,
   "pad_token": "PADDING_TOKEN",
   "tokenizer_class": "PreTrainedTokenizerFast"
 }

       "special": true
     },
     "400006": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "400007": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "400008": {
       "content": "[MASK]",
       "lstrip": false,
       "normalized": false,
     }
   },
   "clean_up_tokenization_spaces": false,
+  "cls_token": "[CLS]",
   "mask_token": "[MASK]",
   "model_max_length": 1000000000000000019884624838656,
   "pad_token": "PADDING_TOKEN",
+  "sep_token": "[SEP]",
   "tokenizer_class": "PreTrainedTokenizerFast"
 }