Upload tokenizer

Files changed (4) hide show

added_tokens.json CHANGED Viewed

@@ -1,4 +1,3 @@
 {
-  "<image>": 100353,
   "<pad>": 100352
 }

 {
   "<pad>": 100352
 }

special_tokens_map.json CHANGED Viewed

@@ -1,6 +1,11 @@
 {
-  "image_token": "<image>",
-  "pad_token": "<pad>",
   "unk_token": {
     "content": "<unk>",
     "lstrip": false,

 {
+  "pad_token": {
+    "content": "<pad>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
   "unk_token": {
     "content": "<unk>",
     "lstrip": false,

tokenizer.json CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b4cab625c7efc4eea85b5cead9707d897291df9e02749ab16988086218c6589b
-size 11091666

 version https://git-lfs.github.com/spec/v1
+oid sha256:02702cce6c4de786d52a3dc624b39e86134c159b7490ea30630739c6f723e7f8
+size 11091481

tokenizer_config.json CHANGED Viewed

@@ -81,7 +81,7 @@
       "normalized": false,
       "rstrip": false,
       "single_word": false,
-      "special": false
     },
     "10": {
       "content": "<|reserved008|>",
@@ -4938,25 +4938,13 @@
       "rstrip": false,
       "single_word": false,
       "special": true
-    },
-    "100353": {
-      "content": "<image>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
     }
   },
   "bos_token": null,
   "chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% for message in messages %}<|im_start|>{{ message['role'] }}\n{% if message['content'] is string %}{{ message['content'] }}{% elif message['content'] is iterable %}{% for item in message['content'] %}{% if item['type'] == 'text' %}{{ item['text'] }}{% elif item['type'] == 'image' %}<fim_prefix><|img|><fim_suffix>{% endif %}{% endfor %}{% endif %}<|im_end|>\n{% endfor %}{% if add_generation_prompt %}<|im_start|>assistant\n{% endif %}",
   "clean_up_tokenization_spaces": false,
   "eos_token": null,
-  "extra_special_tokens": {
-    "image_token": "<image>",
-    "pad_token": "<pad>"
-  },
-  "image_token": "<image>",
   "legacy": true,
   "model_max_length": 1000000000000000019884624838656,
   "pad_token": "<pad>",

       "normalized": false,
       "rstrip": false,
       "single_word": false,
+      "special": true
     },
     "10": {
       "content": "<|reserved008|>",
       "rstrip": false,
       "single_word": false,
       "special": true
     }
   },
   "bos_token": null,
   "chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% for message in messages %}<|im_start|>{{ message['role'] }}\n{% if message['content'] is string %}{{ message['content'] }}{% elif message['content'] is iterable %}{% for item in message['content'] %}{% if item['type'] == 'text' %}{{ item['text'] }}{% elif item['type'] == 'image' %}<fim_prefix><|img|><fim_suffix>{% endif %}{% endfor %}{% endif %}<|im_end|>\n{% endfor %}{% if add_generation_prompt %}<|im_start|>assistant\n{% endif %}",
   "clean_up_tokenization_spaces": false,
   "eos_token": null,
+  "extra_special_tokens": {},
   "legacy": true,
   "model_max_length": 1000000000000000019884624838656,
   "pad_token": "<pad>",