Upload tokenizer

Files changed (3) hide show

special_tokens_map.json CHANGED Viewed

@@ -13,7 +13,7 @@
     "rstrip": false,
     "single_word": false
   },
-  "pad_token": "</s>",
   "unk_token": {
     "content": "<unk>",
     "lstrip": false,

     "rstrip": false,
     "single_word": false
   },
+  "pad_token": "<unk>",
   "unk_token": {
     "content": "<unk>",
     "lstrip": false,

tokenizer.json CHANGED Viewed

@@ -5,9 +5,9 @@
     "strategy": "BatchLongest",
     "direction": "Left",
     "pad_to_multiple_of": null,
-    "pad_id": 2,
     "pad_type_id": 0,
-    "pad_token": "</s>"
   },
   "added_tokens": [
     {

     "strategy": "BatchLongest",
     "direction": "Left",
     "pad_to_multiple_of": null,
+    "pad_id": 0,
     "pad_type_id": 0,
+    "pad_token": "<unk>"
   },
   "added_tokens": [
     {

tokenizer_config.json CHANGED Viewed

@@ -34,7 +34,7 @@
   "extra_special_tokens": {},
   "legacy": true,
   "model_max_length": 1000000000000000019884624838656,
-  "pad_token": "</s>",
   "sp_model_kwargs": {},
   "spaces_between_special_tokens": false,
   "tokenizer_class": "LlamaTokenizer",

   "extra_special_tokens": {},
   "legacy": true,
   "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "<unk>",
   "sp_model_kwargs": {},
   "spaces_between_special_tokens": false,
   "tokenizer_class": "LlamaTokenizer",