michalk8 committed on
Commit
0d704ad
·
verified ·
1 Parent(s): 70810b6

Add HF compatible checkpoints (#3)

Browse files

- Upload folder using huggingface_hub (545cedc82d1e8c090dfab9c189334960e3e34f33)
- Remove old file (fb256d38b0379522815acaef3afcce8c3491a913)

config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "architectures": [
3
- "AIMv2Model"
4
  ],
5
  "attention_dropout": 0.0,
6
  "auto_map": {
@@ -8,10 +8,14 @@
8
  "AutoModel": "modeling_aimv2.AIMv2Model",
9
  "FlaxAutoModel": "modeling_flax_aimv2.FlaxAIMv2Model"
10
  },
 
11
  "hidden_size": 3072,
12
  "image_size": 448,
 
13
  "intermediate_size": 8192,
14
- "model_type": "aimv2",
 
 
15
  "num_attention_heads": 24,
16
  "num_channels": 3,
17
  "num_hidden_layers": 24,
@@ -20,6 +24,7 @@
20
  "qkv_bias": false,
21
  "rms_norm_eps": 1e-05,
22
  "torch_dtype": "float32",
23
- "transformers_version": "4.46.3",
24
- "use_bias": false
25
- }
 
 
1
  {
2
  "architectures": [
3
+ "Aimv2VisionModel"
4
  ],
5
  "attention_dropout": 0.0,
6
  "auto_map": {
 
8
  "AutoModel": "modeling_aimv2.AIMv2Model",
9
  "FlaxAutoModel": "modeling_flax_aimv2.FlaxAIMv2Model"
10
  },
11
+ "hidden_act": "silu",
12
  "hidden_size": 3072,
13
  "image_size": 448,
14
+ "initializer_range": 0.02,
15
  "intermediate_size": 8192,
16
+ "is_native": false,
17
+ "mlp_bias": false,
18
+ "model_type": "aimv2_vision_model",
19
  "num_attention_heads": 24,
20
  "num_channels": 3,
21
  "num_hidden_layers": 24,
 
24
  "qkv_bias": false,
25
  "rms_norm_eps": 1e-05,
26
  "torch_dtype": "float32",
27
+ "transformers_version": "4.54.0.dev0",
28
+ "use_bias": false,
29
+ "use_head": false
30
+ }
model.safetensors → model-00001-of-00003.safetensors RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2663c7027af21885e56160748f449343be0dabe9e3cc8d447d18e1f7b814cdc0
3
- size 10892089304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd819ea84275237a07324447ef4e300e816f66219ef7e6f68c03429ece33058e
3
+ size 4902259840
model-00002-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fbcf46425d1e93cd74f55744d819de39d29ee184ee6ad6ab4216fbf90f11bde
3
+ size 4983114904
model-00003-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d480a95d8c05261a74af6b500902af63b62e446beae3379277f6dd7f8f10daab
3
+ size 1006721472
model.safetensors.index.json ADDED
@@ -0,0 +1,229 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "metadata": {
3
+ "total_parameters": 2723017728,
4
+ "total_size": 10892070912
5
+ },
6
+ "weight_map": {
7
+ "embeddings.patch_embed.bias": "model-00001-of-00003.safetensors",
8
+ "embeddings.patch_embed.weight": "model-00001-of-00003.safetensors",
9
+ "embeddings.position_embedding.weight": "model-00001-of-00003.safetensors",
10
+ "embeddings.rms_norm.weight": "model-00001-of-00003.safetensors",
11
+ "encoder.layers.0.attention.k_proj.weight": "model-00001-of-00003.safetensors",
12
+ "encoder.layers.0.attention.out_proj.weight": "model-00001-of-00003.safetensors",
13
+ "encoder.layers.0.attention.q_proj.weight": "model-00001-of-00003.safetensors",
14
+ "encoder.layers.0.attention.v_proj.weight": "model-00001-of-00003.safetensors",
15
+ "encoder.layers.0.ffn.down_proj.weight": "model-00001-of-00003.safetensors",
16
+ "encoder.layers.0.ffn.gate_proj.weight": "model-00001-of-00003.safetensors",
17
+ "encoder.layers.0.ffn.up_proj.weight": "model-00001-of-00003.safetensors",
18
+ "encoder.layers.0.rms_norm1.weight": "model-00001-of-00003.safetensors",
19
+ "encoder.layers.0.rms_norm2.weight": "model-00001-of-00003.safetensors",
20
+ "encoder.layers.1.attention.k_proj.weight": "model-00001-of-00003.safetensors",
21
+ "encoder.layers.1.attention.out_proj.weight": "model-00001-of-00003.safetensors",
22
+ "encoder.layers.1.attention.q_proj.weight": "model-00001-of-00003.safetensors",
23
+ "encoder.layers.1.attention.v_proj.weight": "model-00001-of-00003.safetensors",
24
+ "encoder.layers.1.ffn.down_proj.weight": "model-00001-of-00003.safetensors",
25
+ "encoder.layers.1.ffn.gate_proj.weight": "model-00001-of-00003.safetensors",
26
+ "encoder.layers.1.ffn.up_proj.weight": "model-00001-of-00003.safetensors",
27
+ "encoder.layers.1.rms_norm1.weight": "model-00001-of-00003.safetensors",
28
+ "encoder.layers.1.rms_norm2.weight": "model-00001-of-00003.safetensors",
29
+ "encoder.layers.10.attention.k_proj.weight": "model-00001-of-00003.safetensors",
30
+ "encoder.layers.10.attention.out_proj.weight": "model-00001-of-00003.safetensors",
31
+ "encoder.layers.10.attention.q_proj.weight": "model-00001-of-00003.safetensors",
32
+ "encoder.layers.10.attention.v_proj.weight": "model-00001-of-00003.safetensors",
33
+ "encoder.layers.10.ffn.down_proj.weight": "model-00002-of-00003.safetensors",
34
+ "encoder.layers.10.ffn.gate_proj.weight": "model-00001-of-00003.safetensors",
35
+ "encoder.layers.10.ffn.up_proj.weight": "model-00001-of-00003.safetensors",
36
+ "encoder.layers.10.rms_norm1.weight": "model-00002-of-00003.safetensors",
37
+ "encoder.layers.10.rms_norm2.weight": "model-00002-of-00003.safetensors",
38
+ "encoder.layers.11.attention.k_proj.weight": "model-00002-of-00003.safetensors",
39
+ "encoder.layers.11.attention.out_proj.weight": "model-00002-of-00003.safetensors",
40
+ "encoder.layers.11.attention.q_proj.weight": "model-00002-of-00003.safetensors",
41
+ "encoder.layers.11.attention.v_proj.weight": "model-00002-of-00003.safetensors",
42
+ "encoder.layers.11.ffn.down_proj.weight": "model-00002-of-00003.safetensors",
43
+ "encoder.layers.11.ffn.gate_proj.weight": "model-00002-of-00003.safetensors",
44
+ "encoder.layers.11.ffn.up_proj.weight": "model-00002-of-00003.safetensors",
45
+ "encoder.layers.11.rms_norm1.weight": "model-00002-of-00003.safetensors",
46
+ "encoder.layers.11.rms_norm2.weight": "model-00002-of-00003.safetensors",
47
+ "encoder.layers.12.attention.k_proj.weight": "model-00002-of-00003.safetensors",
48
+ "encoder.layers.12.attention.out_proj.weight": "model-00002-of-00003.safetensors",
49
+ "encoder.layers.12.attention.q_proj.weight": "model-00002-of-00003.safetensors",
50
+ "encoder.layers.12.attention.v_proj.weight": "model-00002-of-00003.safetensors",
51
+ "encoder.layers.12.ffn.down_proj.weight": "model-00002-of-00003.safetensors",
52
+ "encoder.layers.12.ffn.gate_proj.weight": "model-00002-of-00003.safetensors",
53
+ "encoder.layers.12.ffn.up_proj.weight": "model-00002-of-00003.safetensors",
54
+ "encoder.layers.12.rms_norm1.weight": "model-00002-of-00003.safetensors",
55
+ "encoder.layers.12.rms_norm2.weight": "model-00002-of-00003.safetensors",
56
+ "encoder.layers.13.attention.k_proj.weight": "model-00002-of-00003.safetensors",
57
+ "encoder.layers.13.attention.out_proj.weight": "model-00002-of-00003.safetensors",
58
+ "encoder.layers.13.attention.q_proj.weight": "model-00002-of-00003.safetensors",
59
+ "encoder.layers.13.attention.v_proj.weight": "model-00002-of-00003.safetensors",
60
+ "encoder.layers.13.ffn.down_proj.weight": "model-00002-of-00003.safetensors",
61
+ "encoder.layers.13.ffn.gate_proj.weight": "model-00002-of-00003.safetensors",
62
+ "encoder.layers.13.ffn.up_proj.weight": "model-00002-of-00003.safetensors",
63
+ "encoder.layers.13.rms_norm1.weight": "model-00002-of-00003.safetensors",
64
+ "encoder.layers.13.rms_norm2.weight": "model-00002-of-00003.safetensors",
65
+ "encoder.layers.14.attention.k_proj.weight": "model-00002-of-00003.safetensors",
66
+ "encoder.layers.14.attention.out_proj.weight": "model-00002-of-00003.safetensors",
67
+ "encoder.layers.14.attention.q_proj.weight": "model-00002-of-00003.safetensors",
68
+ "encoder.layers.14.attention.v_proj.weight": "model-00002-of-00003.safetensors",
69
+ "encoder.layers.14.ffn.down_proj.weight": "model-00002-of-00003.safetensors",
70
+ "encoder.layers.14.ffn.gate_proj.weight": "model-00002-of-00003.safetensors",
71
+ "encoder.layers.14.ffn.up_proj.weight": "model-00002-of-00003.safetensors",
72
+ "encoder.layers.14.rms_norm1.weight": "model-00002-of-00003.safetensors",
73
+ "encoder.layers.14.rms_norm2.weight": "model-00002-of-00003.safetensors",
74
+ "encoder.layers.15.attention.k_proj.weight": "model-00002-of-00003.safetensors",
75
+ "encoder.layers.15.attention.out_proj.weight": "model-00002-of-00003.safetensors",
76
+ "encoder.layers.15.attention.q_proj.weight": "model-00002-of-00003.safetensors",
77
+ "encoder.layers.15.attention.v_proj.weight": "model-00002-of-00003.safetensors",
78
+ "encoder.layers.15.ffn.down_proj.weight": "model-00002-of-00003.safetensors",
79
+ "encoder.layers.15.ffn.gate_proj.weight": "model-00002-of-00003.safetensors",
80
+ "encoder.layers.15.ffn.up_proj.weight": "model-00002-of-00003.safetensors",
81
+ "encoder.layers.15.rms_norm1.weight": "model-00002-of-00003.safetensors",
82
+ "encoder.layers.15.rms_norm2.weight": "model-00002-of-00003.safetensors",
83
+ "encoder.layers.16.attention.k_proj.weight": "model-00002-of-00003.safetensors",
84
+ "encoder.layers.16.attention.out_proj.weight": "model-00002-of-00003.safetensors",
85
+ "encoder.layers.16.attention.q_proj.weight": "model-00002-of-00003.safetensors",
86
+ "encoder.layers.16.attention.v_proj.weight": "model-00002-of-00003.safetensors",
87
+ "encoder.layers.16.ffn.down_proj.weight": "model-00002-of-00003.safetensors",
88
+ "encoder.layers.16.ffn.gate_proj.weight": "model-00002-of-00003.safetensors",
89
+ "encoder.layers.16.ffn.up_proj.weight": "model-00002-of-00003.safetensors",
90
+ "encoder.layers.16.rms_norm1.weight": "model-00002-of-00003.safetensors",
91
+ "encoder.layers.16.rms_norm2.weight": "model-00002-of-00003.safetensors",
92
+ "encoder.layers.17.attention.k_proj.weight": "model-00002-of-00003.safetensors",
93
+ "encoder.layers.17.attention.out_proj.weight": "model-00002-of-00003.safetensors",
94
+ "encoder.layers.17.attention.q_proj.weight": "model-00002-of-00003.safetensors",
95
+ "encoder.layers.17.attention.v_proj.weight": "model-00002-of-00003.safetensors",
96
+ "encoder.layers.17.ffn.down_proj.weight": "model-00002-of-00003.safetensors",
97
+ "encoder.layers.17.ffn.gate_proj.weight": "model-00002-of-00003.safetensors",
98
+ "encoder.layers.17.ffn.up_proj.weight": "model-00002-of-00003.safetensors",
99
+ "encoder.layers.17.rms_norm1.weight": "model-00002-of-00003.safetensors",
100
+ "encoder.layers.17.rms_norm2.weight": "model-00002-of-00003.safetensors",
101
+ "encoder.layers.18.attention.k_proj.weight": "model-00002-of-00003.safetensors",
102
+ "encoder.layers.18.attention.out_proj.weight": "model-00002-of-00003.safetensors",
103
+ "encoder.layers.18.attention.q_proj.weight": "model-00002-of-00003.safetensors",
104
+ "encoder.layers.18.attention.v_proj.weight": "model-00002-of-00003.safetensors",
105
+ "encoder.layers.18.ffn.down_proj.weight": "model-00002-of-00003.safetensors",
106
+ "encoder.layers.18.ffn.gate_proj.weight": "model-00002-of-00003.safetensors",
107
+ "encoder.layers.18.ffn.up_proj.weight": "model-00002-of-00003.safetensors",
108
+ "encoder.layers.18.rms_norm1.weight": "model-00002-of-00003.safetensors",
109
+ "encoder.layers.18.rms_norm2.weight": "model-00002-of-00003.safetensors",
110
+ "encoder.layers.19.attention.k_proj.weight": "model-00002-of-00003.safetensors",
111
+ "encoder.layers.19.attention.out_proj.weight": "model-00002-of-00003.safetensors",
112
+ "encoder.layers.19.attention.q_proj.weight": "model-00002-of-00003.safetensors",
113
+ "encoder.layers.19.attention.v_proj.weight": "model-00002-of-00003.safetensors",
114
+ "encoder.layers.19.ffn.down_proj.weight": "model-00002-of-00003.safetensors",
115
+ "encoder.layers.19.ffn.gate_proj.weight": "model-00002-of-00003.safetensors",
116
+ "encoder.layers.19.ffn.up_proj.weight": "model-00002-of-00003.safetensors",
117
+ "encoder.layers.19.rms_norm1.weight": "model-00002-of-00003.safetensors",
118
+ "encoder.layers.19.rms_norm2.weight": "model-00002-of-00003.safetensors",
119
+ "encoder.layers.2.attention.k_proj.weight": "model-00001-of-00003.safetensors",
120
+ "encoder.layers.2.attention.out_proj.weight": "model-00001-of-00003.safetensors",
121
+ "encoder.layers.2.attention.q_proj.weight": "model-00001-of-00003.safetensors",
122
+ "encoder.layers.2.attention.v_proj.weight": "model-00001-of-00003.safetensors",
123
+ "encoder.layers.2.ffn.down_proj.weight": "model-00001-of-00003.safetensors",
124
+ "encoder.layers.2.ffn.gate_proj.weight": "model-00001-of-00003.safetensors",
125
+ "encoder.layers.2.ffn.up_proj.weight": "model-00001-of-00003.safetensors",
126
+ "encoder.layers.2.rms_norm1.weight": "model-00001-of-00003.safetensors",
127
+ "encoder.layers.2.rms_norm2.weight": "model-00001-of-00003.safetensors",
128
+ "encoder.layers.20.attention.k_proj.weight": "model-00002-of-00003.safetensors",
129
+ "encoder.layers.20.attention.out_proj.weight": "model-00002-of-00003.safetensors",
130
+ "encoder.layers.20.attention.q_proj.weight": "model-00002-of-00003.safetensors",
131
+ "encoder.layers.20.attention.v_proj.weight": "model-00002-of-00003.safetensors",
132
+ "encoder.layers.20.ffn.down_proj.weight": "model-00002-of-00003.safetensors",
133
+ "encoder.layers.20.ffn.gate_proj.weight": "model-00002-of-00003.safetensors",
134
+ "encoder.layers.20.ffn.up_proj.weight": "model-00002-of-00003.safetensors",
135
+ "encoder.layers.20.rms_norm1.weight": "model-00002-of-00003.safetensors",
136
+ "encoder.layers.20.rms_norm2.weight": "model-00002-of-00003.safetensors",
137
+ "encoder.layers.21.attention.k_proj.weight": "model-00002-of-00003.safetensors",
138
+ "encoder.layers.21.attention.out_proj.weight": "model-00002-of-00003.safetensors",
139
+ "encoder.layers.21.attention.q_proj.weight": "model-00002-of-00003.safetensors",
140
+ "encoder.layers.21.attention.v_proj.weight": "model-00002-of-00003.safetensors",
141
+ "encoder.layers.21.ffn.down_proj.weight": "model-00003-of-00003.safetensors",
142
+ "encoder.layers.21.ffn.gate_proj.weight": "model-00002-of-00003.safetensors",
143
+ "encoder.layers.21.ffn.up_proj.weight": "model-00002-of-00003.safetensors",
144
+ "encoder.layers.21.rms_norm1.weight": "model-00003-of-00003.safetensors",
145
+ "encoder.layers.21.rms_norm2.weight": "model-00003-of-00003.safetensors",
146
+ "encoder.layers.22.attention.k_proj.weight": "model-00003-of-00003.safetensors",
147
+ "encoder.layers.22.attention.out_proj.weight": "model-00003-of-00003.safetensors",
148
+ "encoder.layers.22.attention.q_proj.weight": "model-00003-of-00003.safetensors",
149
+ "encoder.layers.22.attention.v_proj.weight": "model-00003-of-00003.safetensors",
150
+ "encoder.layers.22.ffn.down_proj.weight": "model-00003-of-00003.safetensors",
151
+ "encoder.layers.22.ffn.gate_proj.weight": "model-00003-of-00003.safetensors",
152
+ "encoder.layers.22.ffn.up_proj.weight": "model-00003-of-00003.safetensors",
153
+ "encoder.layers.22.rms_norm1.weight": "model-00003-of-00003.safetensors",
154
+ "encoder.layers.22.rms_norm2.weight": "model-00003-of-00003.safetensors",
155
+ "encoder.layers.23.attention.k_proj.weight": "model-00003-of-00003.safetensors",
156
+ "encoder.layers.23.attention.out_proj.weight": "model-00003-of-00003.safetensors",
157
+ "encoder.layers.23.attention.q_proj.weight": "model-00003-of-00003.safetensors",
158
+ "encoder.layers.23.attention.v_proj.weight": "model-00003-of-00003.safetensors",
159
+ "encoder.layers.23.ffn.down_proj.weight": "model-00003-of-00003.safetensors",
160
+ "encoder.layers.23.ffn.gate_proj.weight": "model-00003-of-00003.safetensors",
161
+ "encoder.layers.23.ffn.up_proj.weight": "model-00003-of-00003.safetensors",
162
+ "encoder.layers.23.rms_norm1.weight": "model-00003-of-00003.safetensors",
163
+ "encoder.layers.23.rms_norm2.weight": "model-00003-of-00003.safetensors",
164
+ "encoder.layers.3.attention.k_proj.weight": "model-00001-of-00003.safetensors",
165
+ "encoder.layers.3.attention.out_proj.weight": "model-00001-of-00003.safetensors",
166
+ "encoder.layers.3.attention.q_proj.weight": "model-00001-of-00003.safetensors",
167
+ "encoder.layers.3.attention.v_proj.weight": "model-00001-of-00003.safetensors",
168
+ "encoder.layers.3.ffn.down_proj.weight": "model-00001-of-00003.safetensors",
169
+ "encoder.layers.3.ffn.gate_proj.weight": "model-00001-of-00003.safetensors",
170
+ "encoder.layers.3.ffn.up_proj.weight": "model-00001-of-00003.safetensors",
171
+ "encoder.layers.3.rms_norm1.weight": "model-00001-of-00003.safetensors",
172
+ "encoder.layers.3.rms_norm2.weight": "model-00001-of-00003.safetensors",
173
+ "encoder.layers.4.attention.k_proj.weight": "model-00001-of-00003.safetensors",
174
+ "encoder.layers.4.attention.out_proj.weight": "model-00001-of-00003.safetensors",
175
+ "encoder.layers.4.attention.q_proj.weight": "model-00001-of-00003.safetensors",
176
+ "encoder.layers.4.attention.v_proj.weight": "model-00001-of-00003.safetensors",
177
+ "encoder.layers.4.ffn.down_proj.weight": "model-00001-of-00003.safetensors",
178
+ "encoder.layers.4.ffn.gate_proj.weight": "model-00001-of-00003.safetensors",
179
+ "encoder.layers.4.ffn.up_proj.weight": "model-00001-of-00003.safetensors",
180
+ "encoder.layers.4.rms_norm1.weight": "model-00001-of-00003.safetensors",
181
+ "encoder.layers.4.rms_norm2.weight": "model-00001-of-00003.safetensors",
182
+ "encoder.layers.5.attention.k_proj.weight": "model-00001-of-00003.safetensors",
183
+ "encoder.layers.5.attention.out_proj.weight": "model-00001-of-00003.safetensors",
184
+ "encoder.layers.5.attention.q_proj.weight": "model-00001-of-00003.safetensors",
185
+ "encoder.layers.5.attention.v_proj.weight": "model-00001-of-00003.safetensors",
186
+ "encoder.layers.5.ffn.down_proj.weight": "model-00001-of-00003.safetensors",
187
+ "encoder.layers.5.ffn.gate_proj.weight": "model-00001-of-00003.safetensors",
188
+ "encoder.layers.5.ffn.up_proj.weight": "model-00001-of-00003.safetensors",
189
+ "encoder.layers.5.rms_norm1.weight": "model-00001-of-00003.safetensors",
190
+ "encoder.layers.5.rms_norm2.weight": "model-00001-of-00003.safetensors",
191
+ "encoder.layers.6.attention.k_proj.weight": "model-00001-of-00003.safetensors",
192
+ "encoder.layers.6.attention.out_proj.weight": "model-00001-of-00003.safetensors",
193
+ "encoder.layers.6.attention.q_proj.weight": "model-00001-of-00003.safetensors",
194
+ "encoder.layers.6.attention.v_proj.weight": "model-00001-of-00003.safetensors",
195
+ "encoder.layers.6.ffn.down_proj.weight": "model-00001-of-00003.safetensors",
196
+ "encoder.layers.6.ffn.gate_proj.weight": "model-00001-of-00003.safetensors",
197
+ "encoder.layers.6.ffn.up_proj.weight": "model-00001-of-00003.safetensors",
198
+ "encoder.layers.6.rms_norm1.weight": "model-00001-of-00003.safetensors",
199
+ "encoder.layers.6.rms_norm2.weight": "model-00001-of-00003.safetensors",
200
+ "encoder.layers.7.attention.k_proj.weight": "model-00001-of-00003.safetensors",
201
+ "encoder.layers.7.attention.out_proj.weight": "model-00001-of-00003.safetensors",
202
+ "encoder.layers.7.attention.q_proj.weight": "model-00001-of-00003.safetensors",
203
+ "encoder.layers.7.attention.v_proj.weight": "model-00001-of-00003.safetensors",
204
+ "encoder.layers.7.ffn.down_proj.weight": "model-00001-of-00003.safetensors",
205
+ "encoder.layers.7.ffn.gate_proj.weight": "model-00001-of-00003.safetensors",
206
+ "encoder.layers.7.ffn.up_proj.weight": "model-00001-of-00003.safetensors",
207
+ "encoder.layers.7.rms_norm1.weight": "model-00001-of-00003.safetensors",
208
+ "encoder.layers.7.rms_norm2.weight": "model-00001-of-00003.safetensors",
209
+ "encoder.layers.8.attention.k_proj.weight": "model-00001-of-00003.safetensors",
210
+ "encoder.layers.8.attention.out_proj.weight": "model-00001-of-00003.safetensors",
211
+ "encoder.layers.8.attention.q_proj.weight": "model-00001-of-00003.safetensors",
212
+ "encoder.layers.8.attention.v_proj.weight": "model-00001-of-00003.safetensors",
213
+ "encoder.layers.8.ffn.down_proj.weight": "model-00001-of-00003.safetensors",
214
+ "encoder.layers.8.ffn.gate_proj.weight": "model-00001-of-00003.safetensors",
215
+ "encoder.layers.8.ffn.up_proj.weight": "model-00001-of-00003.safetensors",
216
+ "encoder.layers.8.rms_norm1.weight": "model-00001-of-00003.safetensors",
217
+ "encoder.layers.8.rms_norm2.weight": "model-00001-of-00003.safetensors",
218
+ "encoder.layers.9.attention.k_proj.weight": "model-00001-of-00003.safetensors",
219
+ "encoder.layers.9.attention.out_proj.weight": "model-00001-of-00003.safetensors",
220
+ "encoder.layers.9.attention.q_proj.weight": "model-00001-of-00003.safetensors",
221
+ "encoder.layers.9.attention.v_proj.weight": "model-00001-of-00003.safetensors",
222
+ "encoder.layers.9.ffn.down_proj.weight": "model-00001-of-00003.safetensors",
223
+ "encoder.layers.9.ffn.gate_proj.weight": "model-00001-of-00003.safetensors",
224
+ "encoder.layers.9.ffn.up_proj.weight": "model-00001-of-00003.safetensors",
225
+ "encoder.layers.9.rms_norm1.weight": "model-00001-of-00003.safetensors",
226
+ "encoder.layers.9.rms_norm2.weight": "model-00001-of-00003.safetensors",
227
+ "rms_norm.weight": "model-00003-of-00003.safetensors"
228
+ }
229
+ }
preprocessor_config.json CHANGED
@@ -3,6 +3,10 @@
3
  "height": 448,
4
  "width": 448
5
  },
 
 
 
 
6
  "do_center_crop": true,
7
  "do_convert_rgb": true,
8
  "do_normalize": true,
@@ -13,14 +17,16 @@
13
  0.4578275,
14
  0.40821073
15
  ],
16
- "image_processor_type": "CLIPImageProcessor",
17
  "image_std": [
18
  0.26862954,
19
  0.26130258,
20
  0.27577711
21
  ],
 
22
  "resample": 3,
23
  "rescale_factor": 0.00392156862745098,
 
24
  "size": {
25
  "shortest_edge": 448
26
  }
 
3
  "height": 448,
4
  "width": 448
5
  },
6
+ "data_format": "channels_first",
7
+ "default_to_square": false,
8
+ "device": null,
9
+ "disable_grouping": null,
10
  "do_center_crop": true,
11
  "do_convert_rgb": true,
12
  "do_normalize": true,
 
17
  0.4578275,
18
  0.40821073
19
  ],
20
+ "image_processor_type": "CLIPImageProcessorFast",
21
  "image_std": [
22
  0.26862954,
23
  0.26130258,
24
  0.27577711
25
  ],
26
+ "input_data_format": null,
27
  "resample": 3,
28
  "rescale_factor": 0.00392156862745098,
29
+ "return_tensors": null,
30
  "size": {
31
  "shortest_edge": 448
32
  }