Add files using upload-large-folder tool
Browse files- config.json +62 -26
- generation_config.json +1 -1
- model.safetensors +2 -2
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "
|
3 |
"architectures": [
|
4 |
"Qwen2_5_VLForConditionalGeneration"
|
5 |
],
|
@@ -31,38 +31,74 @@
|
|
31 |
"multi_modal_projector",
|
32 |
"merger",
|
33 |
"modality_projection",
|
34 |
-
"visual.
|
35 |
-
"visual.blocks.
|
36 |
-
"
|
37 |
-
"visual.blocks.
|
38 |
-
"visual.blocks.
|
39 |
-
"visual.blocks.
|
40 |
-
"visual.blocks.
|
41 |
-
"visual.blocks.
|
42 |
-
"visual.blocks.
|
43 |
-
"visual.blocks.
|
44 |
-
"visual.blocks.
|
45 |
-
"visual.blocks.
|
46 |
-
"visual.blocks.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
47 |
"visual.blocks.6.mlp",
|
48 |
-
"visual.blocks.
|
49 |
-
"visual.blocks.
|
50 |
-
"visual.blocks.8.attn",
|
51 |
-
"visual.blocks.8.mlp",
|
52 |
"visual.blocks.9.attn",
|
53 |
-
"
|
|
|
|
|
|
|
54 |
"visual.blocks.11.mlp",
|
|
|
55 |
"visual.blocks.12.mlp",
|
|
|
|
|
56 |
"visual.blocks.13.mlp",
|
57 |
-
"visual.blocks.
|
|
|
|
|
58 |
"visual.blocks.14.mlp",
|
59 |
-
"visual.blocks.15.attn",
|
60 |
"visual.blocks.15.mlp",
|
61 |
-
"visual.blocks.
|
|
|
62 |
"visual.blocks.17.mlp",
|
63 |
-
"visual.blocks.
|
64 |
-
"
|
65 |
-
"visual.blocks.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
66 |
],
|
67 |
"llm_int8_threshold": 6.0,
|
68 |
"load_in_4bit": true,
|
@@ -83,7 +119,7 @@
|
|
83 |
"sliding_window": 32768,
|
84 |
"tie_word_embeddings": true,
|
85 |
"torch_dtype": "bfloat16",
|
86 |
-
"transformers_version": "4.
|
87 |
"unsloth_fixed": true,
|
88 |
"use_cache": true,
|
89 |
"use_sliding_window": false,
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "unsloth/Qwen2.5-VL-3B-Instruct",
|
3 |
"architectures": [
|
4 |
"Qwen2_5_VLForConditionalGeneration"
|
5 |
],
|
|
|
31 |
"multi_modal_projector",
|
32 |
"merger",
|
33 |
"modality_projection",
|
34 |
+
"visual.merger.mlp",
|
35 |
+
"visual.blocks.28.attn",
|
36 |
+
"model.layers.5.mlp",
|
37 |
+
"visual.blocks.25.attn",
|
38 |
+
"visual.blocks.26.attn",
|
39 |
+
"visual.blocks.31.attn",
|
40 |
+
"visual.blocks.22.attn",
|
41 |
+
"visual.blocks.27.attn",
|
42 |
+
"visual.blocks.24.attn",
|
43 |
+
"visual.blocks.29.attn",
|
44 |
+
"visual.blocks.21.attn",
|
45 |
+
"visual.blocks.30.mlp",
|
46 |
+
"visual.blocks.30.attn",
|
47 |
+
"visual.blocks.25.mlp",
|
48 |
+
"visual.blocks.27.mlp",
|
49 |
+
"visual.blocks.23.attn",
|
50 |
+
"visual.blocks.20.attn",
|
51 |
+
"visual.blocks.29.mlp",
|
52 |
+
"visual.blocks.24.mlp",
|
53 |
+
"visual.blocks.18.attn",
|
54 |
+
"visual.blocks.31.mlp",
|
55 |
+
"visual.blocks.19.attn",
|
56 |
+
"visual.blocks.26.mlp",
|
57 |
+
"visual.blocks.28.mlp",
|
58 |
+
"visual.blocks.23.mlp",
|
59 |
+
"visual.blocks.21.mlp",
|
60 |
+
"visual.blocks.13.attn",
|
61 |
+
"visual.blocks.17.attn",
|
62 |
+
"visual.blocks.20.mlp",
|
63 |
+
"model.layers.2.mlp",
|
64 |
+
"visual.blocks.22.mlp",
|
65 |
+
"visual.blocks.18.mlp",
|
66 |
+
"visual.blocks.16.attn",
|
67 |
+
"visual.blocks.12.attn",
|
68 |
+
"visual.blocks.19.mlp",
|
69 |
+
"visual.blocks.9.mlp",
|
70 |
"visual.blocks.6.mlp",
|
71 |
+
"visual.blocks.16.mlp",
|
72 |
+
"visual.blocks.10.mlp",
|
|
|
|
|
73 |
"visual.blocks.9.attn",
|
74 |
+
"model.layers.1.mlp",
|
75 |
+
"visual.blocks.10.attn",
|
76 |
+
"visual.blocks.14.attn",
|
77 |
+
"visual.blocks.6.attn",
|
78 |
"visual.blocks.11.mlp",
|
79 |
+
"visual.blocks.11.attn",
|
80 |
"visual.blocks.12.mlp",
|
81 |
+
"visual.blocks.7.mlp",
|
82 |
+
"visual.blocks.2.mlp",
|
83 |
"visual.blocks.13.mlp",
|
84 |
+
"visual.blocks.8.attn",
|
85 |
+
"visual.blocks.5.mlp",
|
86 |
+
"visual.blocks.8.mlp",
|
87 |
"visual.blocks.14.mlp",
|
|
|
88 |
"visual.blocks.15.mlp",
|
89 |
+
"visual.blocks.4.mlp",
|
90 |
+
"visual.blocks.5.attn",
|
91 |
"visual.blocks.17.mlp",
|
92 |
+
"visual.blocks.3.mlp",
|
93 |
+
"visual.blocks.15.attn",
|
94 |
+
"visual.blocks.1.attn",
|
95 |
+
"visual.blocks.1.mlp",
|
96 |
+
"visual.blocks.7.attn",
|
97 |
+
"visual.blocks.2.attn",
|
98 |
+
"visual.blocks.4.attn",
|
99 |
+
"visual.blocks.0.mlp",
|
100 |
+
"visual.blocks.0.attn",
|
101 |
+
"visual.blocks.3.attn"
|
102 |
],
|
103 |
"llm_int8_threshold": 6.0,
|
104 |
"load_in_4bit": true,
|
|
|
119 |
"sliding_window": 32768,
|
120 |
"tie_word_embeddings": true,
|
121 |
"torch_dtype": "bfloat16",
|
122 |
+
"transformers_version": "4.49.0",
|
123 |
"unsloth_fixed": true,
|
124 |
"use_cache": true,
|
125 |
"use_sliding_window": false,
|
generation_config.json
CHANGED
@@ -11,5 +11,5 @@
|
|
11 |
"temperature": 0.1,
|
12 |
"top_k": 1,
|
13 |
"top_p": 0.001,
|
14 |
-
"transformers_version": "4.
|
15 |
}
|
|
|
11 |
"temperature": 0.1,
|
12 |
"top_k": 1,
|
13 |
"top_p": 0.001,
|
14 |
+
"transformers_version": "4.49.0"
|
15 |
}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e556b1118e6c6b9fdf3b37804ba4ec3d5ae37aa63013f9e92c4f2859ef481375
|
3 |
+
size 3693149642
|