Upload folder using huggingface_hub

Browse files

Files changed (12) hide show

config.json +190 -4
model-00001-of-00007.safetensors +2 -2
model-00002-of-00007.safetensors +2 -2
model-00003-of-00007.safetensors +2 -2
model-00004-of-00007.safetensors +2 -2
model-00005-of-00007.safetensors +2 -2
model-00006-of-00007.safetensors +2 -2
model-00007-of-00007.safetensors +2 -2
model.safetensors.index.json +0 -0
preprocessor_config.json +26 -0
processor_config.json +6 -0
tokenizer_config.json +2 -0

config.json CHANGED Viewed

@@ -1,4 +1,5 @@
 {
     "architectures": [
         "KimiVLForConditionalGeneration"
     ],
@@ -7,9 +8,56 @@
         "AutoModel": "modeling_kimi_vl.KimiVLForConditionalGeneration",
         "AutoModelForCausalLM": "modeling_kimi_vl.KimiVLForConditionalGeneration"
     },
     "ignore_index": -100,
     "media_placeholder_token_id": 163605,
     "model_type": "kimi_vl",
     "text_config": {
         "vocab_size": 163840,
         "max_position_embeddings": 131072,
@@ -17,6 +65,7 @@
         "intermediate_size": 11264,
         "moe_intermediate_size": 1408,
         "num_hidden_layers": 27,
         "num_attention_heads": 16,
         "n_shared_experts": 2,
         "n_routed_experts": 64,
@@ -47,14 +96,151 @@
         "rope_scaling": null,
         "attention_bias": false,
         "attention_dropout": 0.0,
         "bos_token_id": 163584,
         "pad_token_id": 163839,
         "eos_token_id": 163585,
-        "torch_dtype": "bfloat16",
-        "tie_word_embeddings": false
     },
     "tie_word_embeddings": false,
-    "torch_dtype": "bfloat16",
-    "transformers_version": "4.50.3",
     "vocab_size": 163840
 }

 {
+    "add_cross_attention": false,
     "architectures": [
         "KimiVLForConditionalGeneration"
     ],
         "AutoModel": "modeling_kimi_vl.KimiVLForConditionalGeneration",
         "AutoModelForCausalLM": "modeling_kimi_vl.KimiVLForConditionalGeneration"
     },
+    "bad_words_ids": null,
+    "begin_suppress_tokens": null,
+    "bos_token_id": null,
+    "chunk_size_feed_forward": 0,
+    "cross_attention_hidden_size": null,
+    "decoder_start_token_id": null,
+    "diversity_penalty": 0.0,
+    "do_sample": false,
+    "early_stopping": false,
+    "encoder_no_repeat_ngram_size": 0,
+    "eos_token_id": null,
+    "exponential_decay_length_penalty": null,
+    "finetuning_task": null,
+    "forced_bos_token_id": null,
+    "forced_eos_token_id": null,
+    "id2label": {
+        "0": "LABEL_0",
+        "1": "LABEL_1"
+    },
     "ignore_index": -100,
+    "is_decoder": false,
+    "is_encoder_decoder": false,
+    "label2id": {
+        "LABEL_0": 0,
+        "LABEL_1": 1
+    },
+    "length_penalty": 1.0,
+    "max_length": 20,
     "media_placeholder_token_id": 163605,
+    "min_length": 0,
     "model_type": "kimi_vl",
+    "no_repeat_ngram_size": 0,
+    "num_beam_groups": 1,
+    "num_beams": 1,
+    "num_return_sequences": 1,
+    "output_attentions": false,
+    "output_hidden_states": false,
+    "output_scores": false,
+    "pad_token_id": 0,
+    "prefix": null,
+    "problem_type": null,
+    "pruned_heads": {},
+    "remove_invalid_values": false,
+    "repetition_penalty": 1.0,
+    "return_dict": true,
+    "return_dict_in_generate": false,
+    "sep_token_id": null,
+    "suppress_tokens": null,
+    "task_specific_params": null,
+    "temperature": 1.0,
     "text_config": {
         "vocab_size": 163840,
         "max_position_embeddings": 131072,
         "intermediate_size": 11264,
         "moe_intermediate_size": 1408,
         "num_hidden_layers": 27,
+        "num_nextn_predict_layers": 1,
         "num_attention_heads": 16,
         "n_shared_experts": 2,
         "n_routed_experts": 64,
         "rope_scaling": null,
         "attention_bias": false,
         "attention_dropout": 0.0,
+        "return_dict": true,
+        "output_hidden_states": false,
+        "torchscript": false,
+        "torch_dtype": "bfloat16",
+        "use_bfloat16": false,
+        "tf_legacy_loss": false,
+        "pruned_heads": {},
+        "tie_word_embeddings": false,
+        "chunk_size_feed_forward": 0,
+        "is_encoder_decoder": false,
+        "is_decoder": false,
+        "cross_attention_hidden_size": null,
+        "add_cross_attention": false,
+        "tie_encoder_decoder": false,
+        "max_length": 20,
+        "min_length": 0,
+        "do_sample": false,
+        "early_stopping": false,
+        "num_beams": 1,
+        "num_beam_groups": 1,
+        "diversity_penalty": 0.0,
+        "temperature": 1.0,
+        "top_k": 50,
+        "top_p": 1.0,
+        "typical_p": 1.0,
+        "repetition_penalty": 1.0,
+        "length_penalty": 1.0,
+        "no_repeat_ngram_size": 0,
+        "encoder_no_repeat_ngram_size": 0,
+        "bad_words_ids": null,
+        "num_return_sequences": 1,
+        "output_scores": false,
+        "return_dict_in_generate": false,
+        "forced_bos_token_id": null,
+        "forced_eos_token_id": null,
+        "remove_invalid_values": false,
+        "exponential_decay_length_penalty": null,
+        "suppress_tokens": null,
+        "begin_suppress_tokens": null,
+        "architectures": null,
+        "finetuning_task": null,
+        "id2label": {
+            "0": "LABEL_0",
+            "1": "LABEL_1"
+        },
+        "label2id": {
+            "LABEL_0": 0,
+            "LABEL_1": 1
+        },
+        "tokenizer_class": null,
+        "prefix": null,
         "bos_token_id": 163584,
         "pad_token_id": 163839,
         "eos_token_id": 163585,
+        "sep_token_id": null,
+        "decoder_start_token_id": null,
+        "task_specific_params": null,
+        "problem_type": null,
+        "_name_or_path": "",
+        "model_type": "deepseek_v3",
+        "output_attentions": false
     },
+    "tf_legacy_loss": false,
+    "tie_encoder_decoder": false,
     "tie_word_embeddings": false,
+    "tokenizer_class": null,
+    "top_k": 50,
+    "top_p": 1.0,
+    "torchscript": false,
+    "transformers_version": "4.53.3",
+    "typical_p": 1.0,
+    "use_bfloat16": false,
+    "vision_config": {
+        "return_dict": true,
+        "output_hidden_states": false,
+        "torchscript": false,
+        "torch_dtype": "bfloat16",
+        "use_bfloat16": false,
+        "tf_legacy_loss": false,
+        "pruned_heads": {},
+        "tie_word_embeddings": true,
+        "chunk_size_feed_forward": 0,
+        "is_encoder_decoder": false,
+        "is_decoder": false,
+        "cross_attention_hidden_size": null,
+        "add_cross_attention": false,
+        "tie_encoder_decoder": false,
+        "max_length": 20,
+        "min_length": 0,
+        "do_sample": false,
+        "early_stopping": false,
+        "num_beams": 1,
+        "num_beam_groups": 1,
+        "diversity_penalty": 0.0,
+        "temperature": 1.0,
+        "top_k": 50,
+        "top_p": 1.0,
+        "typical_p": 1.0,
+        "repetition_penalty": 1.0,
+        "length_penalty": 1.0,
+        "no_repeat_ngram_size": 0,
+        "encoder_no_repeat_ngram_size": 0,
+        "bad_words_ids": null,
+        "num_return_sequences": 1,
+        "output_scores": false,
+        "return_dict_in_generate": false,
+        "forced_bos_token_id": null,
+        "forced_eos_token_id": null,
+        "remove_invalid_values": false,
+        "exponential_decay_length_penalty": null,
+        "suppress_tokens": null,
+        "begin_suppress_tokens": null,
+        "architectures": null,
+        "finetuning_task": null,
+        "id2label": {
+            "0": "LABEL_0",
+            "1": "LABEL_1"
+        },
+        "label2id": {
+            "LABEL_0": 0,
+            "LABEL_1": 1
+        },
+        "tokenizer_class": null,
+        "prefix": null,
+        "bos_token_id": null,
+        "pad_token_id": null,
+        "eos_token_id": null,
+        "sep_token_id": null,
+        "decoder_start_token_id": null,
+        "task_specific_params": null,
+        "problem_type": null,
+        "_name_or_path": "",
+        "model_type": "moonvit",
+        "patch_size": 14,
+        "init_pos_emb_height": 64,
+        "init_pos_emb_width": 64,
+        "num_hidden_layers": 27,
+        "num_attention_heads": 16,
+        "hidden_size": 1152,
+        "intermediate_size": 4304,
+        "merge_kernel_size": [
+            2,
+            2
+        ],
+        "output_attentions": false
+    },
     "vocab_size": 163840
 }

model-00001-of-00007.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c24e694b3f3d1d06801d8bb02b8a62859856558173851ba30d8abac0833686dd
-size 5111855204

 version https://git-lfs.github.com/spec/v1
+oid sha256:c2c40ab7ee663d1a9d8dfdf886f58fc1ed72360d3d040134903ab4a7d4f82c7f
+size 5207425600

model-00002-of-00007.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a3c8261e04730d6b462ac35ecad43f191e29705f2872313a0575c263258a09ba
-size 5110292434

 version https://git-lfs.github.com/spec/v1
+oid sha256:99400fb4a4db93191ee2f0eea827f5dbde491460729e221adcefef959d7934e3
+size 5047890573

model-00003-of-00007.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:504eb5d30887a1b5528e92bf1c998fdc41d0953961300176154846e041dd1c32
-size 5047891100

 version https://git-lfs.github.com/spec/v1
+oid sha256:f0b38aa086aa1bc5ec73f5a12065433f8e21a1cff8cb6586c1946d46b7b8e35f
+size 5047890606

model-00004-of-00007.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:57f92814de160583b888e8e97870aa6b403021fa6d289d3e6dd69fa1b495b777
-size 5047891154

 version https://git-lfs.github.com/spec/v1
+oid sha256:e0a8d9c435f8715067d9cf9b359a4226d5fa17e2a4c55c502d856a1cd8587511
+size 5110291870

model-00005-of-00007.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:66e89b2bd77900920a7e5570062c99d4998dade3ffc021bc82bf44c21f32dd00
-size 5110292473

 version https://git-lfs.github.com/spec/v1
+oid sha256:eca1fc288e7134dd07f4d15e9f2c457aa1fed551e39db8b60c2bc752cd53b98a
+size 5047890618

model-00006-of-00007.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c35578ce0f5cd495da6c2e949814821c811f9b838e5034d9e982dd082a3ce665
-size 5047891130

 version https://git-lfs.github.com/spec/v1
+oid sha256:9d1452ab13cc898a14c88ffc00a1e7226372d349707493dcffe58a7b718287de
+size 5047890650

model-00007-of-00007.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3f6c47402cf966197708a9813da7b13dcf562909bade7928ce1a19887cff8987
-size 1444165317

 version https://git-lfs.github.com/spec/v1
+oid sha256:625d4b768aa82c2e33050f24ea937de6def4937c1040ca60f35e0258f8de2ad9
+size 2306124504

model.safetensors.index.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,26 @@

+{
+  "auto_map": {
+    "AutoImageProcessor": "image_processing_kimi_vl.KimiVLImageProcessor",
+    "AutoProcessor": "processing_kimi_vl.KimiVLProcessor"
+  },
+  "image_mean": [
+    0.5,
+    0.5,
+    0.5
+  ],
+  "image_processor_type": "KimiVLImageProcessor",
+  "image_std": [
+    0.5,
+    0.5,
+    0.5
+  ],
+  "in_token_limit": 16384,
+  "merge_kernel_size": [
+    2,
+    2
+  ],
+  "num_pooled_tokens": 1024,
+  "pad_input": true,
+  "patch_size": 14,
+  "processor_class": "KimiVLProcessor"
+}

processor_config.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "auto_map": {
+    "AutoProcessor": "processing_kimi_vl.KimiVLProcessor"
+  },
+  "processor_class": "KimiVLProcessor"
+}

tokenizer_config.json CHANGED Viewed

@@ -117,6 +117,7 @@
     "<|media_pad|>"
   ],
   "auto_map": {
     "AutoTokenizer": [
       "tokenization_moonshot.TikTokenTokenizer",
       null
@@ -128,6 +129,7 @@
   "extra_special_tokens": {},
   "model_max_length": 1048576,
   "pad_token": "[PAD]",
   "tokenizer_class": "TikTokenTokenizer",
   "unk_token": "[UNK]"
 }

     "<|media_pad|>"
   ],
   "auto_map": {
+    "AutoProcessor": "processing_kimi_vl.KimiVLProcessor",
     "AutoTokenizer": [
       "tokenization_moonshot.TikTokenTokenizer",
       null
   "extra_special_tokens": {},
   "model_max_length": 1048576,
   "pad_token": "[PAD]",
+  "processor_class": "KimiVLProcessor",
   "tokenizer_class": "TikTokenTokenizer",
   "unk_token": "[UNK]"
 }