Upload processor
Browse files
- added_tokens.json +1 -0
- chat_template.json +3 -3
- preprocessor_config.json +2 -7
- processor_config.json +8 -0
- tokenizer.json +9 -0
- tokenizer_config.json +9 -1
added_tokens.json
CHANGED
|
@@ -1,5 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"<image>": 151646,
|
|
|
|
| 3 |
"<|endoftext|>": 151643,
|
| 4 |
"<|im_end|>": 151645,
|
| 5 |
"<|im_start|>": 151644
|
|
|
|
| 1 |
{
|
| 2 |
"<image>": 151646,
|
| 3 |
+
"<video>": 151647,
|
| 4 |
"<|endoftext|>": 151643,
|
| 5 |
"<|im_end|>": 151645,
|
| 6 |
"<|im_start|>": 151644
|
chat_template.json
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
-
{
|
| 2 |
-
"chat_template": "{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n'}}{# Render all images first #}{% for content in message['content'] | selectattr('type', 'equalto', 'image') %}{{ '<image>\n' }}{% endfor %}{# Render all text next #}{% if message['role'] != 'assistant' %}{% for content in message['content'] | selectattr('type', 'equalto', 'text') %}{{ content['text'] }}{% endfor %}{% else %}{% for content in message['content'] | selectattr('type', 'equalto', 'text') %}{% generation %}{{ content['text'] }}{% endgeneration %}{% endfor %}{% endif %}{{'<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}"
|
| 3 |
-
}
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"chat_template": "{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n'}}{# Render all images first #}{% for content in message['content'] | selectattr('type', 'equalto', 'image') %}{{ '<image>\n' }}{% endfor %}{# Render all video then #}{% for content in message['content'] | selectattr('type', 'equalto', 'video') %}{{ '<video>\n' }}{% endfor %}{# Render all text next #}{% if message['role'] != 'assistant' %}{% for content in message['content'] | selectattr('type', 'equalto', 'text') %}{{ content['text'] }}{% endfor %}{% else %}{% for content in message['content'] | selectattr('type', 'equalto', 'text') %}{% generation %}{{ content['text'] }}{% endgeneration %}{% endfor %}{% endif %}{{'<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}"
|
| 3 |
+
}
|
preprocessor_config.json
CHANGED
|
@@ -1,9 +1,4 @@
|
|
| 1 |
{
|
| 2 |
-
"crop_size": {
|
| 3 |
-
"height": 384,
|
| 4 |
-
"width": 384
|
| 5 |
-
},
|
| 6 |
-
"do_center_crop": true,
|
| 7 |
"do_convert_rgb": true,
|
| 8 |
"do_normalize": true,
|
| 9 |
"do_pad": true,
|
|
@@ -160,13 +155,13 @@
|
|
| 160 |
0.5,
|
| 161 |
0.5
|
| 162 |
],
|
| 163 |
-
"image_processor_type": "
|
| 164 |
"image_std": [
|
| 165 |
0.5,
|
| 166 |
0.5,
|
| 167 |
0.5
|
| 168 |
],
|
| 169 |
-
"processor_class": "
|
| 170 |
"resample": 3,
|
| 171 |
"rescale_factor": 0.00392156862745098,
|
| 172 |
"size": {
|
|
|
|
| 1 |
{
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2 |
"do_convert_rgb": true,
|
| 3 |
"do_normalize": true,
|
| 4 |
"do_pad": true,
|
|
|
|
| 155 |
0.5,
|
| 156 |
0.5
|
| 157 |
],
|
| 158 |
+
"image_processor_type": "LlavaOnevisionImageProcessor",
|
| 159 |
"image_std": [
|
| 160 |
0.5,
|
| 161 |
0.5,
|
| 162 |
0.5
|
| 163 |
],
|
| 164 |
+
"processor_class": "LlavaOnevisionProcessor",
|
| 165 |
"resample": 3,
|
| 166 |
"rescale_factor": 0.00392156862745098,
|
| 167 |
"size": {
|
processor_config.json
ADDED
|
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"chat_template": "{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n'}}{# Render all images first #}{% for content in message['content'] | selectattr('type', 'equalto', 'image') %}{{ '<image>\n' }}{% endfor %}{# Render all video then #}{% for content in message['content'] | selectattr('type', 'equalto', 'video') %}{{ '<video>\n' }}{% endfor %}{# Render all text next #}{% if message['role'] != 'assistant' %}{% for content in message['content'] | selectattr('type', 'equalto', 'text') %}{{ content['text'] }}{% endfor %}{% else %}{% for content in message['content'] | selectattr('type', 'equalto', 'text') %}{% generation %}{{ content['text'] }}{% endgeneration %}{% endfor %}{% endif %}{{'<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
|
| 3 |
+
"image_token": "<image>",
|
| 4 |
+
"patch_size": 14,
|
| 5 |
+
"processor_class": "LlavaOnevisionProcessor",
|
| 6 |
+
"video_token": "<video>",
|
| 7 |
+
"vision_feature_select_strategy": "full"
|
| 8 |
+
}
|
tokenizer.json
CHANGED
|
@@ -45,6 +45,15 @@
|
|
| 45 |
"rstrip": false,
|
| 46 |
"normalized": false,
|
| 47 |
"special": true
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 48 |
}
|
| 49 |
],
|
| 50 |
"normalizer": {
|
|
|
|
| 45 |
"rstrip": false,
|
| 46 |
"normalized": false,
|
| 47 |
"special": true
|
| 48 |
+
},
|
| 49 |
+
{
|
| 50 |
+
"id": 151647,
|
| 51 |
+
"content": "<video>",
|
| 52 |
+
"single_word": false,
|
| 53 |
+
"lstrip": false,
|
| 54 |
+
"rstrip": false,
|
| 55 |
+
"normalized": false,
|
| 56 |
+
"special": true
|
| 57 |
}
|
| 58 |
],
|
| 59 |
"normalizer": {
|
tokenizer_config.json
CHANGED
|
@@ -32,6 +32,14 @@
|
|
| 32 |
"rstrip": false,
|
| 33 |
"single_word": false,
|
| 34 |
"special": true
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 35 |
}
|
| 36 |
},
|
| 37 |
"additional_special_tokens": [
|
|
@@ -45,7 +53,7 @@
|
|
| 45 |
"errors": "replace",
|
| 46 |
"model_max_length": 32768,
|
| 47 |
"pad_token": "<|endoftext|>",
|
| 48 |
-
"processor_class": "
|
| 49 |
"split_special_tokens": false,
|
| 50 |
"tokenizer_class": "Qwen2Tokenizer",
|
| 51 |
"unk_token": null
|
|
|
|
| 32 |
"rstrip": false,
|
| 33 |
"single_word": false,
|
| 34 |
"special": true
|
| 35 |
+
},
|
| 36 |
+
"151647": {
|
| 37 |
+
"content": "<video>",
|
| 38 |
+
"lstrip": false,
|
| 39 |
+
"normalized": false,
|
| 40 |
+
"rstrip": false,
|
| 41 |
+
"single_word": false,
|
| 42 |
+
"special": true
|
| 43 |
}
|
| 44 |
},
|
| 45 |
"additional_special_tokens": [
|
|
|
|
| 53 |
"errors": "replace",
|
| 54 |
"model_max_length": 32768,
|
| 55 |
"pad_token": "<|endoftext|>",
|
| 56 |
+
"processor_class": "LlavaOnevisionProcessor",
|
| 57 |
"split_special_tokens": false,
|
| 58 |
"tokenizer_class": "Qwen2Tokenizer",
|
| 59 |
"unk_token": null
|