masint
/

tiny-random-qwen2-vl

text-generation-inference

Model card · Files and versions · Community

gdiamos committed 19 days ago

Commit

28d7478

·

verified ·

1 Parent(s): 58ec817

Upload Qwen2VLForConditionalGeneration

Files changed (2) hide show

config.json +73 -3
model.safetensors +1 -1

config.json CHANGED Viewed

@@ -19,15 +19,85 @@
   "rms_norm_eps": 1e-06,
   "rope_scaling": {
     "mrope_section": [
-      2,
-      2,
-      8
     ],
     "rope_type": "default",
     "type": "mrope"
   },
   "rope_theta": 1000000.0,
   "sliding_window": 32768,
   "torch_dtype": "float32",
   "transformers_version": "4.53.0",
   "use_cache": true,

   "rms_norm_eps": 1e-06,
   "rope_scaling": {
     "mrope_section": [
+      8,
+      8,
+      16
     ],
     "rope_type": "default",
     "type": "mrope"
   },
   "rope_theta": 1000000.0,
   "sliding_window": 32768,
+  "text_config": {
+    "architectures": [
+      "Qwen2VLForConditionalGeneration"
+    ],
+    "attention_dropout": 0.0,
+    "bos_token_id": 151643,
+    "eos_token_id": 151645,
+    "hidden_act": "silu",
+    "hidden_size": 64,
+    "image_token_id": null,
+    "initializer_range": 0.02,
+    "intermediate_size": 8960,
+    "layer_types": [
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention"
+    ],
+    "max_position_embeddings": 32768,
+    "max_window_layers": 28,
+    "model_type": "qwen2_vl_text",
+    "num_attention_heads": 1,
+    "num_hidden_layers": 1,
+    "num_key_value_heads": 2,
+    "rms_norm_eps": 1e-06,
+    "rope_scaling": {
+      "mrope_section": [
+        8,
+        8,
+        16
+      ],
+      "rope_type": "default",
+      "type": "mrope"
+    },
+    "rope_theta": 1000000.0,
+    "sliding_window": null,
+    "tie_word_embeddings": true,
+    "torch_dtype": "float32",
+    "use_cache": true,
+    "use_sliding_window": false,
+    "video_token_id": null,
+    "vision_end_token_id": 151653,
+    "vision_start_token_id": 151652,
+    "vision_token_id": 151654,
+    "vocab_size": 151936
+  },
   "torch_dtype": "float32",
   "transformers_version": "4.53.0",
   "use_cache": true,

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ace607c2712d320465044ef86e422d95146c66b5b956c92c669b9e5c52508042
 size 46711048

 version https://git-lfs.github.com/spec/v1
+oid sha256:746e651149d0c3fb563f963b92add3dc5c3bb14f46d8129cc8aa0ae1a658384f
 size 46711048