asabet committed on
Commit
b5edd44
·
verified ·
1 Parent(s): 3637fe8

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -1,293 +1,10 @@
1
  {
2
- "_name_or_path": "/mnt/asabet/llama-recipes/finetuned_model/fine-tuned-meta-llama/Llama-3.2-11B-Vision-Instruct/hf-weights",
3
  "architectures": [
4
  "MllamaForConditionalGeneration"
5
  ],
6
  "image_token_index": 128256,
7
  "model_type": "mllama",
8
- "quantization_config": {
9
- "config_groups": {
10
- "group_0": {
11
- "input_activations": {
12
- "actorder": null,
13
- "block_structure": null,
14
- "dynamic": true,
15
- "group_size": null,
16
- "num_bits": 8,
17
- "observer": null,
18
- "observer_kwargs": {},
19
- "strategy": "token",
20
- "symmetric": true,
21
- "type": "int"
22
- },
23
- "output_activations": null,
24
- "targets": [
25
- "Linear"
26
- ],
27
- "weights": {
28
- "actorder": null,
29
- "block_structure": null,
30
- "dynamic": false,
31
- "group_size": null,
32
- "num_bits": 8,
33
- "observer": "minmax",
34
- "observer_kwargs": {},
35
- "strategy": "channel",
36
- "symmetric": true,
37
- "type": "int"
38
- }
39
- }
40
- },
41
- "format": "int-quantized",
42
- "global_compression_ratio": 1.3639314687910544,
43
- "ignore": [
44
- "vision_model.transformer.layers.0.self_attn.q_proj",
45
- "vision_model.transformer.layers.0.self_attn.k_proj",
46
- "vision_model.transformer.layers.0.self_attn.v_proj",
47
- "vision_model.transformer.layers.0.self_attn.o_proj",
48
- "vision_model.transformer.layers.0.mlp.fc1",
49
- "vision_model.transformer.layers.0.mlp.fc2",
50
- "vision_model.transformer.layers.1.self_attn.q_proj",
51
- "vision_model.transformer.layers.1.self_attn.k_proj",
52
- "vision_model.transformer.layers.1.self_attn.v_proj",
53
- "vision_model.transformer.layers.1.self_attn.o_proj",
54
- "vision_model.transformer.layers.1.mlp.fc1",
55
- "vision_model.transformer.layers.1.mlp.fc2",
56
- "vision_model.transformer.layers.2.self_attn.q_proj",
57
- "vision_model.transformer.layers.2.self_attn.k_proj",
58
- "vision_model.transformer.layers.2.self_attn.v_proj",
59
- "vision_model.transformer.layers.2.self_attn.o_proj",
60
- "vision_model.transformer.layers.2.mlp.fc1",
61
- "vision_model.transformer.layers.2.mlp.fc2",
62
- "vision_model.transformer.layers.3.self_attn.q_proj",
63
- "vision_model.transformer.layers.3.self_attn.k_proj",
64
- "vision_model.transformer.layers.3.self_attn.v_proj",
65
- "vision_model.transformer.layers.3.self_attn.o_proj",
66
- "vision_model.transformer.layers.3.mlp.fc1",
67
- "vision_model.transformer.layers.3.mlp.fc2",
68
- "vision_model.transformer.layers.4.self_attn.q_proj",
69
- "vision_model.transformer.layers.4.self_attn.k_proj",
70
- "vision_model.transformer.layers.4.self_attn.v_proj",
71
- "vision_model.transformer.layers.4.self_attn.o_proj",
72
- "vision_model.transformer.layers.4.mlp.fc1",
73
- "vision_model.transformer.layers.4.mlp.fc2",
74
- "vision_model.transformer.layers.5.self_attn.q_proj",
75
- "vision_model.transformer.layers.5.self_attn.k_proj",
76
- "vision_model.transformer.layers.5.self_attn.v_proj",
77
- "vision_model.transformer.layers.5.self_attn.o_proj",
78
- "vision_model.transformer.layers.5.mlp.fc1",
79
- "vision_model.transformer.layers.5.mlp.fc2",
80
- "vision_model.transformer.layers.6.self_attn.q_proj",
81
- "vision_model.transformer.layers.6.self_attn.k_proj",
82
- "vision_model.transformer.layers.6.self_attn.v_proj",
83
- "vision_model.transformer.layers.6.self_attn.o_proj",
84
- "vision_model.transformer.layers.6.mlp.fc1",
85
- "vision_model.transformer.layers.6.mlp.fc2",
86
- "vision_model.transformer.layers.7.self_attn.q_proj",
87
- "vision_model.transformer.layers.7.self_attn.k_proj",
88
- "vision_model.transformer.layers.7.self_attn.v_proj",
89
- "vision_model.transformer.layers.7.self_attn.o_proj",
90
- "vision_model.transformer.layers.7.mlp.fc1",
91
- "vision_model.transformer.layers.7.mlp.fc2",
92
- "vision_model.transformer.layers.8.self_attn.q_proj",
93
- "vision_model.transformer.layers.8.self_attn.k_proj",
94
- "vision_model.transformer.layers.8.self_attn.v_proj",
95
- "vision_model.transformer.layers.8.self_attn.o_proj",
96
- "vision_model.transformer.layers.8.mlp.fc1",
97
- "vision_model.transformer.layers.8.mlp.fc2",
98
- "vision_model.transformer.layers.9.self_attn.q_proj",
99
- "vision_model.transformer.layers.9.self_attn.k_proj",
100
- "vision_model.transformer.layers.9.self_attn.v_proj",
101
- "vision_model.transformer.layers.9.self_attn.o_proj",
102
- "vision_model.transformer.layers.9.mlp.fc1",
103
- "vision_model.transformer.layers.9.mlp.fc2",
104
- "vision_model.transformer.layers.10.self_attn.q_proj",
105
- "vision_model.transformer.layers.10.self_attn.k_proj",
106
- "vision_model.transformer.layers.10.self_attn.v_proj",
107
- "vision_model.transformer.layers.10.self_attn.o_proj",
108
- "vision_model.transformer.layers.10.mlp.fc1",
109
- "vision_model.transformer.layers.10.mlp.fc2",
110
- "vision_model.transformer.layers.11.self_attn.q_proj",
111
- "vision_model.transformer.layers.11.self_attn.k_proj",
112
- "vision_model.transformer.layers.11.self_attn.v_proj",
113
- "vision_model.transformer.layers.11.self_attn.o_proj",
114
- "vision_model.transformer.layers.11.mlp.fc1",
115
- "vision_model.transformer.layers.11.mlp.fc2",
116
- "vision_model.transformer.layers.12.self_attn.q_proj",
117
- "vision_model.transformer.layers.12.self_attn.k_proj",
118
- "vision_model.transformer.layers.12.self_attn.v_proj",
119
- "vision_model.transformer.layers.12.self_attn.o_proj",
120
- "vision_model.transformer.layers.12.mlp.fc1",
121
- "vision_model.transformer.layers.12.mlp.fc2",
122
- "vision_model.transformer.layers.13.self_attn.q_proj",
123
- "vision_model.transformer.layers.13.self_attn.k_proj",
124
- "vision_model.transformer.layers.13.self_attn.v_proj",
125
- "vision_model.transformer.layers.13.self_attn.o_proj",
126
- "vision_model.transformer.layers.13.mlp.fc1",
127
- "vision_model.transformer.layers.13.mlp.fc2",
128
- "vision_model.transformer.layers.14.self_attn.q_proj",
129
- "vision_model.transformer.layers.14.self_attn.k_proj",
130
- "vision_model.transformer.layers.14.self_attn.v_proj",
131
- "vision_model.transformer.layers.14.self_attn.o_proj",
132
- "vision_model.transformer.layers.14.mlp.fc1",
133
- "vision_model.transformer.layers.14.mlp.fc2",
134
- "vision_model.transformer.layers.15.self_attn.q_proj",
135
- "vision_model.transformer.layers.15.self_attn.k_proj",
136
- "vision_model.transformer.layers.15.self_attn.v_proj",
137
- "vision_model.transformer.layers.15.self_attn.o_proj",
138
- "vision_model.transformer.layers.15.mlp.fc1",
139
- "vision_model.transformer.layers.15.mlp.fc2",
140
- "vision_model.transformer.layers.16.self_attn.q_proj",
141
- "vision_model.transformer.layers.16.self_attn.k_proj",
142
- "vision_model.transformer.layers.16.self_attn.v_proj",
143
- "vision_model.transformer.layers.16.self_attn.o_proj",
144
- "vision_model.transformer.layers.16.mlp.fc1",
145
- "vision_model.transformer.layers.16.mlp.fc2",
146
- "vision_model.transformer.layers.17.self_attn.q_proj",
147
- "vision_model.transformer.layers.17.self_attn.k_proj",
148
- "vision_model.transformer.layers.17.self_attn.v_proj",
149
- "vision_model.transformer.layers.17.self_attn.o_proj",
150
- "vision_model.transformer.layers.17.mlp.fc1",
151
- "vision_model.transformer.layers.17.mlp.fc2",
152
- "vision_model.transformer.layers.18.self_attn.q_proj",
153
- "vision_model.transformer.layers.18.self_attn.k_proj",
154
- "vision_model.transformer.layers.18.self_attn.v_proj",
155
- "vision_model.transformer.layers.18.self_attn.o_proj",
156
- "vision_model.transformer.layers.18.mlp.fc1",
157
- "vision_model.transformer.layers.18.mlp.fc2",
158
- "vision_model.transformer.layers.19.self_attn.q_proj",
159
- "vision_model.transformer.layers.19.self_attn.k_proj",
160
- "vision_model.transformer.layers.19.self_attn.v_proj",
161
- "vision_model.transformer.layers.19.self_attn.o_proj",
162
- "vision_model.transformer.layers.19.mlp.fc1",
163
- "vision_model.transformer.layers.19.mlp.fc2",
164
- "vision_model.transformer.layers.20.self_attn.q_proj",
165
- "vision_model.transformer.layers.20.self_attn.k_proj",
166
- "vision_model.transformer.layers.20.self_attn.v_proj",
167
- "vision_model.transformer.layers.20.self_attn.o_proj",
168
- "vision_model.transformer.layers.20.mlp.fc1",
169
- "vision_model.transformer.layers.20.mlp.fc2",
170
- "vision_model.transformer.layers.21.self_attn.q_proj",
171
- "vision_model.transformer.layers.21.self_attn.k_proj",
172
- "vision_model.transformer.layers.21.self_attn.v_proj",
173
- "vision_model.transformer.layers.21.self_attn.o_proj",
174
- "vision_model.transformer.layers.21.mlp.fc1",
175
- "vision_model.transformer.layers.21.mlp.fc2",
176
- "vision_model.transformer.layers.22.self_attn.q_proj",
177
- "vision_model.transformer.layers.22.self_attn.k_proj",
178
- "vision_model.transformer.layers.22.self_attn.v_proj",
179
- "vision_model.transformer.layers.22.self_attn.o_proj",
180
- "vision_model.transformer.layers.22.mlp.fc1",
181
- "vision_model.transformer.layers.22.mlp.fc2",
182
- "vision_model.transformer.layers.23.self_attn.q_proj",
183
- "vision_model.transformer.layers.23.self_attn.k_proj",
184
- "vision_model.transformer.layers.23.self_attn.v_proj",
185
- "vision_model.transformer.layers.23.self_attn.o_proj",
186
- "vision_model.transformer.layers.23.mlp.fc1",
187
- "vision_model.transformer.layers.23.mlp.fc2",
188
- "vision_model.transformer.layers.24.self_attn.q_proj",
189
- "vision_model.transformer.layers.24.self_attn.k_proj",
190
- "vision_model.transformer.layers.24.self_attn.v_proj",
191
- "vision_model.transformer.layers.24.self_attn.o_proj",
192
- "vision_model.transformer.layers.24.mlp.fc1",
193
- "vision_model.transformer.layers.24.mlp.fc2",
194
- "vision_model.transformer.layers.25.self_attn.q_proj",
195
- "vision_model.transformer.layers.25.self_attn.k_proj",
196
- "vision_model.transformer.layers.25.self_attn.v_proj",
197
- "vision_model.transformer.layers.25.self_attn.o_proj",
198
- "vision_model.transformer.layers.25.mlp.fc1",
199
- "vision_model.transformer.layers.25.mlp.fc2",
200
- "vision_model.transformer.layers.26.self_attn.q_proj",
201
- "vision_model.transformer.layers.26.self_attn.k_proj",
202
- "vision_model.transformer.layers.26.self_attn.v_proj",
203
- "vision_model.transformer.layers.26.self_attn.o_proj",
204
- "vision_model.transformer.layers.26.mlp.fc1",
205
- "vision_model.transformer.layers.26.mlp.fc2",
206
- "vision_model.transformer.layers.27.self_attn.q_proj",
207
- "vision_model.transformer.layers.27.self_attn.k_proj",
208
- "vision_model.transformer.layers.27.self_attn.v_proj",
209
- "vision_model.transformer.layers.27.self_attn.o_proj",
210
- "vision_model.transformer.layers.27.mlp.fc1",
211
- "vision_model.transformer.layers.27.mlp.fc2",
212
- "vision_model.transformer.layers.28.self_attn.q_proj",
213
- "vision_model.transformer.layers.28.self_attn.k_proj",
214
- "vision_model.transformer.layers.28.self_attn.v_proj",
215
- "vision_model.transformer.layers.28.self_attn.o_proj",
216
- "vision_model.transformer.layers.28.mlp.fc1",
217
- "vision_model.transformer.layers.28.mlp.fc2",
218
- "vision_model.transformer.layers.29.self_attn.q_proj",
219
- "vision_model.transformer.layers.29.self_attn.k_proj",
220
- "vision_model.transformer.layers.29.self_attn.v_proj",
221
- "vision_model.transformer.layers.29.self_attn.o_proj",
222
- "vision_model.transformer.layers.29.mlp.fc1",
223
- "vision_model.transformer.layers.29.mlp.fc2",
224
- "vision_model.transformer.layers.30.self_attn.q_proj",
225
- "vision_model.transformer.layers.30.self_attn.k_proj",
226
- "vision_model.transformer.layers.30.self_attn.v_proj",
227
- "vision_model.transformer.layers.30.self_attn.o_proj",
228
- "vision_model.transformer.layers.30.mlp.fc1",
229
- "vision_model.transformer.layers.30.mlp.fc2",
230
- "vision_model.transformer.layers.31.self_attn.q_proj",
231
- "vision_model.transformer.layers.31.self_attn.k_proj",
232
- "vision_model.transformer.layers.31.self_attn.v_proj",
233
- "vision_model.transformer.layers.31.self_attn.o_proj",
234
- "vision_model.transformer.layers.31.mlp.fc1",
235
- "vision_model.transformer.layers.31.mlp.fc2",
236
- "vision_model.global_transformer.layers.0.self_attn.q_proj",
237
- "vision_model.global_transformer.layers.0.self_attn.k_proj",
238
- "vision_model.global_transformer.layers.0.self_attn.v_proj",
239
- "vision_model.global_transformer.layers.0.self_attn.o_proj",
240
- "vision_model.global_transformer.layers.0.mlp.fc1",
241
- "vision_model.global_transformer.layers.0.mlp.fc2",
242
- "vision_model.global_transformer.layers.1.self_attn.q_proj",
243
- "vision_model.global_transformer.layers.1.self_attn.k_proj",
244
- "vision_model.global_transformer.layers.1.self_attn.v_proj",
245
- "vision_model.global_transformer.layers.1.self_attn.o_proj",
246
- "vision_model.global_transformer.layers.1.mlp.fc1",
247
- "vision_model.global_transformer.layers.1.mlp.fc2",
248
- "vision_model.global_transformer.layers.2.self_attn.q_proj",
249
- "vision_model.global_transformer.layers.2.self_attn.k_proj",
250
- "vision_model.global_transformer.layers.2.self_attn.v_proj",
251
- "vision_model.global_transformer.layers.2.self_attn.o_proj",
252
- "vision_model.global_transformer.layers.2.mlp.fc1",
253
- "vision_model.global_transformer.layers.2.mlp.fc2",
254
- "vision_model.global_transformer.layers.3.self_attn.q_proj",
255
- "vision_model.global_transformer.layers.3.self_attn.k_proj",
256
- "vision_model.global_transformer.layers.3.self_attn.v_proj",
257
- "vision_model.global_transformer.layers.3.self_attn.o_proj",
258
- "vision_model.global_transformer.layers.3.mlp.fc1",
259
- "vision_model.global_transformer.layers.3.mlp.fc2",
260
- "vision_model.global_transformer.layers.4.self_attn.q_proj",
261
- "vision_model.global_transformer.layers.4.self_attn.k_proj",
262
- "vision_model.global_transformer.layers.4.self_attn.v_proj",
263
- "vision_model.global_transformer.layers.4.self_attn.o_proj",
264
- "vision_model.global_transformer.layers.4.mlp.fc1",
265
- "vision_model.global_transformer.layers.4.mlp.fc2",
266
- "vision_model.global_transformer.layers.5.self_attn.q_proj",
267
- "vision_model.global_transformer.layers.5.self_attn.k_proj",
268
- "vision_model.global_transformer.layers.5.self_attn.v_proj",
269
- "vision_model.global_transformer.layers.5.self_attn.o_proj",
270
- "vision_model.global_transformer.layers.5.mlp.fc1",
271
- "vision_model.global_transformer.layers.5.mlp.fc2",
272
- "vision_model.global_transformer.layers.6.self_attn.q_proj",
273
- "vision_model.global_transformer.layers.6.self_attn.k_proj",
274
- "vision_model.global_transformer.layers.6.self_attn.v_proj",
275
- "vision_model.global_transformer.layers.6.self_attn.o_proj",
276
- "vision_model.global_transformer.layers.6.mlp.fc1",
277
- "vision_model.global_transformer.layers.6.mlp.fc2",
278
- "vision_model.global_transformer.layers.7.self_attn.q_proj",
279
- "vision_model.global_transformer.layers.7.self_attn.k_proj",
280
- "vision_model.global_transformer.layers.7.self_attn.v_proj",
281
- "vision_model.global_transformer.layers.7.self_attn.o_proj",
282
- "vision_model.global_transformer.layers.7.mlp.fc1",
283
- "vision_model.global_transformer.layers.7.mlp.fc2",
284
- "language_model.lm_head",
285
- "multi_modal_projector"
286
- ],
287
- "kv_cache_scheme": null,
288
- "quant_method": "compressed-tensors",
289
- "quantization_status": "compressed"
290
- },
291
  "text_config": {
292
  "_name_or_path": "",
293
  "add_cross_attention": false,
@@ -504,4 +221,4 @@
504
  "use_bfloat16": false,
505
  "vision_output_dim": 7680
506
  }
507
- }
 
1
  {
2
+ "_name_or_path": "meta-llama/Llama-3.2-11B-Vision-Instruct",
3
  "architectures": [
4
  "MllamaForConditionalGeneration"
5
  ],
6
  "image_token_index": 128256,
7
  "model_type": "mllama",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8
  "text_config": {
9
  "_name_or_path": "",
10
  "add_cross_attention": false,
 
221
  "use_bfloat16": false,
222
  "vision_output_dim": 7680
223
  }
224
+ }
model-00001-of-00009.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52afbb29bfe008fa22a7d707eb4167ac76b872054de14a664f20b0f755b66368
3
+ size 3454336036
model-00002-of-00009.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c824e075243363e5ccaf8af15c90a939f9f07c3bd3649d0b29ef326160c45db
3
+ size 4886615752
model-00003-of-00009.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b8a3acb48223e6d7466c318db5fdcac09f8c94144fc02574f6ba48e502e3d04
3
+ size 4832009696
model-00004-of-00009.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d62ae738a977fc5294c5a36d731a08d1c0270bc0aeee49ccfff92c2cf8400022
3
+ size 4999798928
model-00005-of-00009.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eecf2fc2fd34ed9f9ddb7c61750691eb294d83000a031e89c093ddbabaaf01cc
3
+ size 4999815448
model-00006-of-00009.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76507f859b0f34afc37471cd706d46f2af915c5d92dc92a4cf3c374292483b19
3
+ size 4832009736
model-00007-of-00009.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b45ea0558d1a8cb6df9c32e8368c95f5e063f13d547c7493ab0fe1541c8ae47
3
+ size 4999815448
model-00008-of-00009.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03352956bb59ec1bd19dd02794af121262427f6257285d736e97029055962df1
3
+ size 4999815448
model-00009-of-00009.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f2a33560433b818a6ef8af701a181f850a0828bb4bc65670df5a40447a229fc
3
+ size 4676785016
model.safetensors.index.json CHANGED
The diff for this file is too large to render. See raw diff