tarsur909 committed · verified
Commit ef9a443 · 1 Parent(s): ccb10e4

Upload tokenizer

Files changed (2)
  1. tokenizer.json +0 -0
  2. tokenizer_config.json +3 -3
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -2168,7 +2168,6 @@
   "clean_up_tokenization_spaces": false,
   "cls_token": "[CLS]",
   "eos_token": "<|endoftext|>",
-  "extra_special_tokens": {},
   "fast_tokenizer": true,
   "gmask_token": "[gMASK]",
   "merges_file": null,
@@ -2178,6 +2177,7 @@
   ],
   "model_max_length": 1000000000000000019884624838656,
   "pad_token": "<|endoftext|>",
-  "tokenizer_class": "PreTrainedTokenizer",
-  "trust_remote_code": true
+  "tokenizer_class": "PreTrainedTokenizerFast",
+  "trust_remote_code": true,
+  "vocab_file": null
 }
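
The substantive change in tokenizer_config.json is the switch of "tokenizer_class" from PreTrainedTokenizer to PreTrainedTokenizerFast, plus the addition of "vocab_file": null and a trailing comma on "trust_remote_code": true. Below is a minimal sketch of loading the uploaded tokenizer with the transformers AutoTokenizer API; the repository id is a placeholder assumption, since the actual repo name is not shown on this page.

# Minimal loading sketch (Python, transformers).
# "tarsur909/<repo-name>" is a hypothetical placeholder for the real repo id.
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained(
    "tarsur909/<repo-name>",   # placeholder repo id, not taken from this page
    trust_remote_code=True,    # matches "trust_remote_code": true in the config
)
print(type(tokenizer).__name__)          # should resolve to a fast (Rust-backed) tokenizer
print(tokenizer("hello world").input_ids)  # quick sanity check of encoding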