Upload processor

Files changed (5) hide show

chat_template.jinja ADDED Viewed

+{#-
+    Chat template: flattens `messages` into plain prompt text.
+
+    For each message:
+      * If `message['content']` is a string, it is emitted with trailing
+        whitespace removed.
+      * Otherwise `message['content']` is iterated as a list of parts:
+          - a part with type 'image' emits the literal `<image>` placeholder;
+          - a part with type 'text' emits its text with trailing whitespace
+            removed, preceded by a line break when the part right before it
+            was an image;
+          - parts of any other type emit nothing.
+
+    `ns` is a namespace object so the `previous_was_image` flag survives
+    across iterations of the inner loop; it is re-created for every message.
+
+    NOTE(review): `message['role']` is never read in this template, so no
+    role markers are emitted here -- confirm that is intended.
+    NOTE(review): the `if not loop.last` branch below has an empty body and
+    therefore emits nothing between messages -- confirm whether a separator
+    was meant to go there.
+-#}
+{%- for message in messages %}
+        {%- if message['content'] is string %}
+{{ message['content'].rstrip() }}
+        {%- else %}
+            {%- set ns = namespace(previous_was_image=False) %}
+            {%- for content in message['content'] %}
+                {%- if content['type'] == 'image' %}
+<image>
+                    {%- set ns.previous_was_image = True %}
+                {%- elif content['type'] == 'text' %}
+{{- ('
+' if ns.previous_was_image else '') + content['text'].rstrip() }}
+                    {%- set ns.previous_was_image = False %}
+                {%- endif %}
+            {%- endfor %}
+        {%- endif %}
+        {%- if not loop.last %}
+        {%- endif %}
+    {%- endfor %}

processor_config.json ADDED Viewed

+{
+  "image_processor": {
+    "base_size": {
+      "height": 1024,
+      "width": 1024
+    },
+    "crop_size": null,
+    "data_format": "channels_first",
+    "device": null,
+    "disable_grouping": null,
+    "do_center_crop": null,
+    "do_convert_rgb": true,
+    "do_normalize": true,
+    "do_pad": null,
+    "do_rescale": true,
+    "do_resize": true,
+    "dynamic_hd": 36,
+    "image_mean": [
+      0.5,
+      0.5,
+      0.5
+    ],
+    "image_processor_type": "DeepseekOcrImageProcessorFast",
+    "image_std": [
+      0.5,
+      0.5,
+      0.5
+    ],
+    "input_data_format": null,
+    "pad_size": null,
+    "patch_size": 16,
+    "processor_class": "DeepseekOcrProcessor",
+    "resample": 3,
+    "rescale_factor": 0.00392156862745098,
+    "return_tensors": null,
+    "size": {
+      "height": 1024,
+      "width": 1024
+    }
+  },
+  "image_token": "<image>",
+  "processor_class": "DeepseekOcrProcessor"
+}

special_tokens_map.json ADDED Viewed

+{
+  "additional_special_tokens": [
+    "<|User|>",
+    "<|Assistant|>"
+  ],
+  "bos_token": {
+    "content": "<｜begin▁of▁sentence｜>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "<｜end▁of▁sentence｜>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "<｜▁pad▁｜>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

The diff for this file is too large to render. See raw diff