Upload Qwen2_5_VLForConditionalGeneration

by albertvillanova HF Staff - opened 1 day ago

base: refs/heads/main

←

from: refs/pr/2

Discussion Files changed

+5 -39

Files changed (3) hide show

config.json +3 -37
generation_config.json +1 -1
model.safetensors +1 -1

config.json CHANGED Viewed

@@ -4,6 +4,7 @@
   ],
   "attention_dropout": 0.0,
   "bos_token_id": 151643,
   "eos_token_id": 151645,
   "hidden_act": "silu",
   "hidden_size": 2048,
@@ -32,6 +33,7 @@
     ],
     "attention_dropout": 0.0,
     "bos_token_id": 151643,
     "eos_token_id": 151645,
     "hidden_act": "silu",
     "hidden_size": 16,
@@ -39,40 +41,6 @@
     "initializer_range": 0.02,
     "intermediate_size": 11008,
     "layer_types": [
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
-      "full_attention",
       "full_attention",
       "full_attention"
     ],
@@ -93,7 +61,6 @@
     "rope_theta": 1000000.0,
     "sliding_window": null,
     "tie_word_embeddings": true,
-    "torch_dtype": "bfloat16",
     "use_cache": true,
     "use_sliding_window": false,
     "video_token_id": null,
@@ -102,8 +69,7 @@
     "vision_token_id": 151654,
     "vocab_size": 151936
   },
-  "torch_dtype": "bfloat16",
-  "transformers_version": "4.56.0.dev0",
   "use_cache": true,
   "use_sliding_window": false,
   "video_token_id": 151656,

   ],
   "attention_dropout": 0.0,
   "bos_token_id": 151643,
+  "dtype": "bfloat16",
   "eos_token_id": 151645,
   "hidden_act": "silu",
   "hidden_size": 2048,
     ],
     "attention_dropout": 0.0,
     "bos_token_id": 151643,
+    "dtype": "bfloat16",
     "eos_token_id": 151645,
     "hidden_act": "silu",
     "hidden_size": 16,
     "initializer_range": 0.02,
     "intermediate_size": 11008,
     "layer_types": [
       "full_attention",
       "full_attention"
     ],
     "rope_theta": 1000000.0,
     "sliding_window": null,
     "tie_word_embeddings": true,
     "use_cache": true,
     "use_sliding_window": false,
     "video_token_id": null,
     "vision_token_id": 151654,
     "vocab_size": 151936
   },
+  "transformers_version": "4.56.1",
   "use_cache": true,
   "use_sliding_window": false,
   "video_token_id": 151656,

generation_config.json CHANGED Viewed

@@ -2,5 +2,5 @@
   "_from_model_config": true,
   "bos_token_id": 151643,
   "eos_token_id": 151645,
-  "transformers_version": "4.56.0.dev0"
 }

   "_from_model_config": true,
   "bos_token_id": 151643,
   "eos_token_id": 151645,
+  "transformers_version": "4.56.1"
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:64f6d603334a11233717f2c62832c863394fc51cdbdabbd6a25dcdc4a6f26c8d
 size 18086192

 version https://git-lfs.github.com/spec/v1
+oid sha256:4f2af27576d9c46218d01c601ba63e99c39fa2ce0e7c817013c1b144864989e4
 size 18086192