AyaKhaled committed on
Commit
f7a2f2b
·
verified ·
1 Parent(s): 20d96c1

Training in progress, step 100

Browse files
Files changed (3) hide show
  1. adapter_config.json +3 -3
  2. adapter_model.safetensors +1 -1
  3. config.json +149 -0
adapter_config.json CHANGED
@@ -24,10 +24,10 @@
24
  "rank_pattern": {},
25
  "revision": null,
26
  "target_modules": [
27
- "k_proj",
28
- "o_proj",
29
  "q_proj",
30
- "v_proj"
 
31
  ],
32
  "task_type": "CAUSAL_LM",
33
  "trainable_token_indices": null,
 
24
  "rank_pattern": {},
25
  "revision": null,
26
  "target_modules": [
27
+ "v_proj",
 
28
  "q_proj",
29
+ "o_proj",
30
+ "k_proj"
31
  ],
32
  "task_type": "CAUSAL_LM",
33
  "trainable_token_indices": null,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:279a476fa4fb0eeaa1336eaf2c15c5248c02ed64a9d492084f3d67a9b199d24c
3
  size 11045424
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4bf25761f5424420496bc0d750f2735aeb3d704b2d30d5d36c5920da5d4c755
3
  size 11045424
config.json ADDED
@@ -0,0 +1,149 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Phi3VForCausalLM"
4
+ ],
5
+ "attention_dropout": 0.0,
6
+ "auto_map": {
7
+ "AutoConfig": "microsoft/Phi-3.5-vision-instruct--configuration_phi3_v.Phi3VConfig",
8
+ "AutoModelForCausalLM": "microsoft/Phi-3.5-vision-instruct--modeling_phi3_v.Phi3VForCausalLM"
9
+ },
10
+ "bos_token_id": 1,
11
+ "embd_layer": {
12
+ "embedding_cls": "image",
13
+ "hd_transform_order": "sub_glb",
14
+ "projection_cls": "mlp",
15
+ "use_hd_transform": true,
16
+ "with_learnable_separator": true
17
+ },
18
+ "embd_pdrop": 0.0,
19
+ "eos_token_id": 2,
20
+ "hidden_act": "silu",
21
+ "hidden_size": 3072,
22
+ "img_processor": {
23
+ "image_dim_out": 1024,
24
+ "model_name": "openai/clip-vit-large-patch14-336",
25
+ "name": "clip_vision_model",
26
+ "num_img_tokens": 144
27
+ },
28
+ "initializer_range": 0.02,
29
+ "intermediate_size": 8192,
30
+ "max_position_embeddings": 131072,
31
+ "model_type": "phi3_v",
32
+ "num_attention_heads": 32,
33
+ "num_hidden_layers": 32,
34
+ "num_key_value_heads": 32,
35
+ "original_max_position_embeddings": 4096,
36
+ "pad_token_id": 32000,
37
+ "resid_pdrop": 0.0,
38
+ "rms_norm_eps": 1e-05,
39
+ "rope_scaling": {
40
+ "long_factor": [
41
+ 1.0800000429153442,
42
+ 1.1100000143051147,
43
+ 1.1399999856948853,
44
+ 1.340000033378601,
45
+ 1.5899999141693115,
46
+ 1.600000023841858,
47
+ 1.6200000047683716,
48
+ 2.620000123977661,
49
+ 3.2300000190734863,
50
+ 3.2300000190734863,
51
+ 4.789999961853027,
52
+ 7.400000095367432,
53
+ 7.700000286102295,
54
+ 9.09000015258789,
55
+ 12.199999809265137,
56
+ 17.670000076293945,
57
+ 24.46000099182129,
58
+ 28.57000160217285,
59
+ 30.420001983642578,
60
+ 30.840002059936523,
61
+ 32.590003967285156,
62
+ 32.93000411987305,
63
+ 42.320003509521484,
64
+ 44.96000289916992,
65
+ 50.340003967285156,
66
+ 50.45000457763672,
67
+ 57.55000305175781,
68
+ 57.93000411987305,
69
+ 58.21000289916992,
70
+ 60.1400032043457,
71
+ 62.61000442504883,
72
+ 62.62000274658203,
73
+ 62.71000289916992,
74
+ 63.1400032043457,
75
+ 63.1400032043457,
76
+ 63.77000427246094,
77
+ 63.93000411987305,
78
+ 63.96000289916992,
79
+ 63.970001220703125,
80
+ 64.02999877929688,
81
+ 64.06999969482422,
82
+ 64.08000183105469,
83
+ 64.12000274658203,
84
+ 64.41000366210938,
85
+ 64.4800033569336,
86
+ 64.51000213623047,
87
+ 64.52999877929688,
88
+ 64.83999633789062
89
+ ],
90
+ "short_factor": [
91
+ 1.08,
92
+ 1.1,
93
+ 1.1300000000000001,
94
+ 1.2800000000000002,
95
+ 1.3100000000000003,
96
+ 1.4500000000000004,
97
+ 1.4500000000000004,
98
+ 1.9500000000000008,
99
+ 2.030000000000001,
100
+ 2.4299999999999926,
101
+ 2.5699999999999896,
102
+ 2.9499999999999815,
103
+ 3.729999999999965,
104
+ 3.869999999999962,
105
+ 4.189999999999955,
106
+ 4.43999999999995,
107
+ 4.6399999999999455,
108
+ 4.979999999999938,
109
+ 5.159999999999934,
110
+ 5.279999999999932,
111
+ 5.759999999999922,
112
+ 5.889999999999919,
113
+ 5.889999999999919,
114
+ 5.969999999999917,
115
+ 6.089999999999915,
116
+ 6.2799999999999105,
117
+ 6.7699999999999,
118
+ 6.8899999999998975,
119
+ 7.109999999999893,
120
+ 7.129999999999892,
121
+ 7.179999999999891,
122
+ 7.289999999999889,
123
+ 7.339999999999888,
124
+ 7.559999999999883,
125
+ 7.619999999999882,
126
+ 7.69999999999988,
127
+ 7.879999999999876,
128
+ 7.879999999999876,
129
+ 7.879999999999876,
130
+ 7.939999999999875,
131
+ 7.949999999999875,
132
+ 7.979999999999874,
133
+ 8.19999999999987,
134
+ 8.439999999999864,
135
+ 8.469999999999864,
136
+ 8.589999999999861,
137
+ 8.809999999999857,
138
+ 8.999999999999853
139
+ ],
140
+ "type": "su"
141
+ },
142
+ "rope_theta": 10000.0,
143
+ "sliding_window": 262144,
144
+ "tie_word_embeddings": false,
145
+ "torch_dtype": "bfloat16",
146
+ "transformers_version": "4.51.2",
147
+ "use_cache": true,
148
+ "vocab_size": 32064
149
+ }