Upload processor

Files changed (3) hide show

chat_template.jinja ADDED Viewed

+{# Chat template. Each message's content is iterated as a list of items with a 'type' of 'image' or 'text'. User turns are prefixed with the User tag, assistant turns with the Assistant tag, and any other role with its capitalized name. Image items render as the image placeholder, newline-separated from neighbouring items; text items are stripped at the outer edges and joined to a preceding text item with one space. A turn is closed with seps[0] (newline) for user and seps[1] (end-of-sentence) otherwise, except for the final turn when no generation prompt is requested. #}{%set seps=['
+','<｜end▁of▁sentence｜>']%}{%for message in messages%}{%if message['role']|lower=='user'%}<|User|>: {%elif message['role']|lower=='assistant'%}<|Assistant|>:{%if not (loop.last and not add_generation_prompt and message['content'][0]['type']=='text' and message['content'][0]['text']=='')%} {%endif%}{%else%}{{message['role'].capitalize()}}: {%endif%}{%for content in message['content']%}{%if content['type']=='image'%}{%if not loop.first%}{{'
+'}}{%endif%}<image_placeholder>{%if not loop.last%}{{'
+'}}{%endif%}{%elif content['type']=='text'%}{%set text=content['text']%}{%if loop.first%}{%set text=text.lstrip()%}{%endif%}{%if loop.last%}{%set text=text.rstrip()%}{%endif%}{%if not loop.first and message['content'][loop.index0-1]['type']=='text'%}{{' '+text}}{%else%}{{text}}{%endif%}{%endif%}{%endfor%}{%if not loop.last or add_generation_prompt%}{%if message['role']|lower=='user'%}{{seps[0]}}{%else%}{{seps[1]}}{%endif%}{%endif%}{%endfor%}{%if add_generation_prompt%}<|Assistant|>:{%endif%}

special_tokens_map.json CHANGED Viewed

@@ -10,6 +10,7 @@
     "<|User|>",
     "<|Assistant|>"
   ],
   "bos_token": {
     "content": "<｜begin▁of▁sentence｜>",
     "lstrip": false,
@@ -17,6 +18,7 @@
     "rstrip": false,
     "single_word": false
   },
   "eos_token": {
     "content": "<｜end▁of▁sentence｜>",
     "lstrip": false,
@@ -24,6 +26,7 @@
     "rstrip": false,
     "single_word": false
   },
   "pad_token": {
     "content": "<｜▁pad▁｜>",
     "lstrip": false,

     "<|User|>",
     "<|Assistant|>"
   ],
+  "boi_token": "<begin_of_image>",
   "bos_token": {
     "content": "<｜begin▁of▁sentence｜>",
     "lstrip": false,
     "rstrip": false,
     "single_word": false
   },
+  "eoi_token": "<end_of_image>",
   "eos_token": {
     "content": "<｜end▁of▁sentence｜>",
     "lstrip": false,
     "rstrip": false,
     "single_word": false
   },
+  "image_token": "<image_placeholder>",
   "pad_token": {
     "content": "<｜▁pad▁｜>",
     "lstrip": false,

tokenizer_config.json CHANGED Viewed

@@ -4839,10 +4839,17 @@
     "<|User|>",
     "<|Assistant|>"
   ],
   "bos_token": "<｜begin▁of▁sentence｜>",
   "clean_up_tokenization_spaces": false,
   "eos_token": "<｜end▁of▁sentence｜>",
-  "extra_special_tokens": {},
   "legacy": true,
   "model_max_length": 16384,
   "pad_token": "<｜▁pad▁｜>",

     "<|User|>",
     "<|Assistant|>"
   ],
+  "boi_token": "<begin_of_image>",
   "bos_token": "<｜begin▁of▁sentence｜>",
   "clean_up_tokenization_spaces": false,
+  "eoi_token": "<end_of_image>",
   "eos_token": "<｜end▁of▁sentence｜>",
+  "extra_special_tokens": {
+    "boi_token": "<begin_of_image>",
+    "eoi_token": "<end_of_image>",
+    "image_token": "<image_placeholder>"
+  },
+  "image_token": "<image_placeholder>",
   "legacy": true,
   "model_max_length": 16384,
   "pad_token": "<｜▁pad▁｜>",