danielhanchen committed on
Commit
eabca91
·
verified ·
1 Parent(s): 813fad8

Add files using upload-large-folder tool

Browse files
Files changed (22) hide show
  1. .gitattributes +2 -0
  2. Q4_K_M/Llama-4-Maverick-17B-128E-Instruct-Q4_K_M-00001-of-00005.gguf +1 -1
  3. Q4_K_M/Llama-4-Maverick-17B-128E-Instruct-Q4_K_M-00002-of-00005.gguf +1 -1
  4. Q4_K_M/Llama-4-Maverick-17B-128E-Instruct-Q4_K_M-00003-of-00005.gguf +1 -1
  5. Q4_K_M/Llama-4-Maverick-17B-128E-Instruct-Q4_K_M-00004-of-00005.gguf +1 -1
  6. Q4_K_M/Llama-4-Maverick-17B-128E-Instruct-Q4_K_M-00005-of-00005.gguf +1 -1
  7. UD-Q2_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q2_K_XL-00001-of-00004.gguf +2 -2
  8. UD-Q2_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q2_K_XL-00002-of-00004.gguf +1 -1
  9. UD-Q2_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q2_K_XL-00003-of-00004.gguf +2 -2
  10. UD-Q2_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q2_K_XL-00004-of-00004.gguf +1 -1
  11. UD-Q3_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q3_K_XL-00001-of-00004.gguf +1 -1
  12. UD-Q3_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q3_K_XL-00002-of-00004.gguf +1 -1
  13. UD-Q3_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q3_K_XL-00003-of-00004.gguf +1 -1
  14. UD-Q3_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q3_K_XL-00004-of-00004.gguf +1 -1
  15. UD-Q4_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q4_K_XL-00001-of-00005.gguf +2 -2
  16. UD-Q4_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q4_K_XL-00002-of-00005.gguf +1 -1
  17. UD-Q4_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q4_K_XL-00003-of-00005.gguf +1 -1
  18. UD-Q4_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q4_K_XL-00004-of-00005.gguf +1 -1
  19. UD-Q4_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q4_K_XL-00005-of-00005.gguf +1 -1
  20. config.json +84 -3
  21. mmproj-F16.gguf +3 -0
  22. mmproj-F32.gguf +3 -0
.gitattributes CHANGED
@@ -139,3 +139,5 @@ BF16/Llama-4-Maverick-17B-128E-Instruct-BF16-00012-of-00018.gguf filter=lfs diff
139
  BF16/Llama-4-Maverick-17B-128E-Instruct-BF16-00009-of-00018.gguf filter=lfs diff=lfs merge=lfs -text
140
  BF16/Llama-4-Maverick-17B-128E-Instruct-BF16-00005-of-00018.gguf filter=lfs diff=lfs merge=lfs -text
141
  BF16/Llama-4-Maverick-17B-128E-Instruct-BF16-00018-of-00018.gguf filter=lfs diff=lfs merge=lfs -text
 
 
 
139
  BF16/Llama-4-Maverick-17B-128E-Instruct-BF16-00009-of-00018.gguf filter=lfs diff=lfs merge=lfs -text
140
  BF16/Llama-4-Maverick-17B-128E-Instruct-BF16-00005-of-00018.gguf filter=lfs diff=lfs merge=lfs -text
141
  BF16/Llama-4-Maverick-17B-128E-Instruct-BF16-00018-of-00018.gguf filter=lfs diff=lfs merge=lfs -text
142
+ mmproj-F16.gguf filter=lfs diff=lfs merge=lfs -text
143
+ mmproj-F32.gguf filter=lfs diff=lfs merge=lfs -text
Q4_K_M/Llama-4-Maverick-17B-128E-Instruct-Q4_K_M-00001-of-00005.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ebe6e63fdde81efb60c417b404834ade656854b5b48b1e9accf853e9ed2a2f2
3
  size 49408442368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16c923b64805ba340dc8c6edbd2b8a93f6a0206e5ee9c0569275548c3ba40634
3
  size 49408442368
Q4_K_M/Llama-4-Maverick-17B-128E-Instruct-Q4_K_M-00002-of-00005.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:61295c02a0d043f95abecfe36b61b36c32de40b275b06d55f49c922a7888e870
3
  size 49543134080
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f1b167907c322954c6e971271aa7426028149a979f2d23d56da409ab21a67e2
3
  size 49543134080
Q4_K_M/Llama-4-Maverick-17B-128E-Instruct-Q4_K_M-00003-of-00005.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f5c54f466c6ea0329dd63665aaf5e0a465de072196ffbe151cb3f76d93f9dfda
3
  size 49566112640
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8138c895fc95c32c04d6fdcb98f223467b68deb597f0f5c7e2a2661313d85771
3
  size 49566112640
Q4_K_M/Llama-4-Maverick-17B-128E-Instruct-Q4_K_M-00004-of-00005.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:52fc775e377ebd8aee2c64ad677c9876c86c971fb385e8e9e77d7356bdb86cfb
3
  size 48169827200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ade0af564d22825d7f273a4431d7d8d51aefeb18cbff93144f5469a9d5322afa
3
  size 48169827200
Q4_K_M/Llama-4-Maverick-17B-128E-Instruct-Q4_K_M-00005-of-00005.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b005819e9a02b3412c94dda926132c97a62a959c8a03a25e1d4441fb0d8f19ec
3
  size 46079637152
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6496072373d3c807078246679852e073a9c5a95296c4a39e9327b28af512398
3
  size 46079637152
UD-Q2_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q2_K_XL-00001-of-00004.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c826481d4953d69dcc45e9c621ad4d5e510b857c29387abce79d6b54d7ecae79
3
- size 49713025088
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d6a531a69e40e702fb32d504f41544959fb7f7e092cfb5a0fc7458388af471d
3
+ size 49713025056
UD-Q2_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q2_K_XL-00002-of-00004.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:abcb4c4d8cabb49b53f171ec3694e280b64cbef78a03c91cd01837c025e77b11
3
  size 48619408320
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d9ab3fcc9e7ba32a17fb99da3265590ac65f3512c6062f9fd7c3661673c5ac2
3
  size 48619408320
UD-Q2_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q2_K_XL-00003-of-00004.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1f897e138e2f8e79cc2227fdf5f5429ba78dd7f5583e5d0521a5a211796bf874
3
- size 49010432672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2117c66cb5d3c73f64678e763f0a114dc2dfab21aad78ed7d2374d8c251046c7
3
+ size 49728707232
UD-Q2_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q2_K_XL-00004-of-00004.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2e09abde501a9aada1e237bec9a1a5c708167b3a013f239959d293eae74c256c
3
  size 3573043712
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75ae4119df73ceaebf45e3924e5ff82e2570ecacc95efc2c236c2ebb84fd0551
3
  size 3573043712
UD-Q3_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q3_K_XL-00001-of-00004.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ec3290c56e681e0d9cd69f666404a8ad8d172d17ab96f35a1b0d800673f2be43
3
  size 48512096704
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50da970635d726ce090d8c9340124b49ce9f3d1477b495862fc752f73db29727
3
  size 48512096704
UD-Q3_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q3_K_XL-00002-of-00004.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e3ce8be6c94b4ae92c2232a4c2f1210cd96b031c9c6eadbc5f601cb3f3581a7b
3
  size 47965275584
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93e25048ee621011ce2fc791230177d4b26809c8e1bd4ffe9c520ff68e3cc154
3
  size 47965275584
UD-Q3_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q3_K_XL-00003-of-00004.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c6d8f34e668aeb150e6ca7c7b1f7820d01e97efae106bf648649a48881970cc
3
  size 48513708672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0875fab7930e8de98b5c21fb51d30a3a98413211ba5639c4e773cf924abbbe48
3
  size 48513708672
UD-Q3_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q3_K_XL-00004-of-00004.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:16ea579d77eba35496a0e2edab28ec1bb1d588f769b307a053b3952180f3fdfc
3
  size 33950643872
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c167afacfc35d68c15594a03de59af8b062bde2ead33d0cefef343f1e8918b56
3
  size 33950643872
UD-Q4_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q4_K_XL-00001-of-00005.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:43f22e8cfe70aef7c6c71bbf5a76632b914359aabfce16e4c494c1e24bd50a3f
3
- size 49807660000
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b74dc3628041a854c7963df322ccb5b6a7df75541246ed1b3cfd10a6f6ed9e2
3
+ size 49807659968
UD-Q4_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q4_K_XL-00002-of-00005.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ac87d0f2053cd3e26e13a5a37ee7d8c9c47eac6463290b19ea0eed89af204e44
3
  size 49830263808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8e9f010b88c8cea88753d90467431da241f997ff3cf2cc7d958cfd9e0c9f8ca
3
  size 49830263808
UD-Q4_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q4_K_XL-00003-of-00005.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dc255a254b30db8450de6cd49b6c06568b60c15c1d06508edc77226cb2263b1e
3
  size 49832905856
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f74972e1b1ea1fc28f370e87533a8e509a34febab7fa6afb0923118d50930df
3
  size 49832905856
UD-Q4_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q4_K_XL-00004-of-00005.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5fdb68b4b682fbc9c2f5823081449069e38a84d48c2eeb596e8ba4f40b3913c6
3
  size 49508645760
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5dbe3bdc6c29830655f7c71e9b05766cc161307eff405dc9875d8becaff21aa0
3
  size 49508645760
UD-Q4_K_XL/Llama-4-Maverick-17B-128E-Instruct-UD-Q4_K_XL-00005-of-00005.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3e97509c6ee34ccd6bab002fa3f0c28ccfb7c5fc677fbb19663174631c0626a6
3
  size 33155199296
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6cc2d32447eb4720c12a05011b18749b8f3f031bbfea6c931755ce298d8f3c1d
3
  size 33155199296
config.json CHANGED
@@ -6,17 +6,21 @@
6
  "eoi_token_index": 200081,
7
  "image_token_index": 200092,
8
  "model_type": "llama4",
 
9
  "text_config": {
10
- "_attn_implementation_autoset": true,
11
  "attention_bias": false,
12
  "attention_chunk_size": 8192,
13
  "attention_dropout": 0.0,
 
 
14
  "bos_token_id": 200000,
 
15
  "eos_token_id": [
16
  200001,
17
  200007,
18
  200008
19
  ],
 
20
  "for_llm_compressor": false,
21
  "head_dim": 128,
22
  "hidden_act": "silu",
@@ -27,6 +31,82 @@
27
  "intermediate_size_mlp": 16384,
28
  "max_position_embeddings": 1048576,
29
  "model_type": "llama4_text",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
30
  "num_attention_heads": 40,
31
  "num_experts_per_tok": 1,
32
  "num_hidden_layers": 48,
@@ -44,10 +124,11 @@
44
  "use_qk_norm": false,
45
  "vocab_size": 202048
46
  },
 
47
  "torch_dtype": "bfloat16",
48
- "transformers_version": "4.51.0.dev0",
 
49
  "vision_config": {
50
- "_attn_implementation_autoset": true,
51
  "attention_dropout": 0.0,
52
  "hidden_act": "gelu",
53
  "hidden_size": 1408,
 
6
  "eoi_token_index": 200081,
7
  "image_token_index": 200092,
8
  "model_type": "llama4",
9
+ "pad_token_id": 200018,
10
  "text_config": {
 
11
  "attention_bias": false,
12
  "attention_chunk_size": 8192,
13
  "attention_dropout": 0.0,
14
+ "attn_scale": 0.1,
15
+ "attn_temperature_tuning": true,
16
  "bos_token_id": 200000,
17
+ "cache_implementation": "hybrid",
18
  "eos_token_id": [
19
  200001,
20
  200007,
21
  200008
22
  ],
23
+ "floor_scale": 8192,
24
  "for_llm_compressor": false,
25
  "head_dim": 128,
26
  "hidden_act": "silu",
 
31
  "intermediate_size_mlp": 16384,
32
  "max_position_embeddings": 1048576,
33
  "model_type": "llama4_text",
34
+ "moe_layers": [
35
+ 1,
36
+ 3,
37
+ 5,
38
+ 7,
39
+ 9,
40
+ 11,
41
+ 13,
42
+ 15,
43
+ 17,
44
+ 19,
45
+ 21,
46
+ 23,
47
+ 25,
48
+ 27,
49
+ 29,
50
+ 31,
51
+ 33,
52
+ 35,
53
+ 37,
54
+ 39,
55
+ 41,
56
+ 43,
57
+ 45,
58
+ 47
59
+ ],
60
+ "no_rope_layers": [
61
+ 1,
62
+ 1,
63
+ 1,
64
+ 0,
65
+ 1,
66
+ 1,
67
+ 1,
68
+ 0,
69
+ 1,
70
+ 1,
71
+ 1,
72
+ 0,
73
+ 1,
74
+ 1,
75
+ 1,
76
+ 0,
77
+ 1,
78
+ 1,
79
+ 1,
80
+ 0,
81
+ 1,
82
+ 1,
83
+ 1,
84
+ 0,
85
+ 1,
86
+ 1,
87
+ 1,
88
+ 0,
89
+ 1,
90
+ 1,
91
+ 1,
92
+ 0,
93
+ 1,
94
+ 1,
95
+ 1,
96
+ 0,
97
+ 1,
98
+ 1,
99
+ 1,
100
+ 0,
101
+ 1,
102
+ 1,
103
+ 1,
104
+ 0,
105
+ 1,
106
+ 1,
107
+ 1,
108
+ 0
109
+ ],
110
  "num_attention_heads": 40,
111
  "num_experts_per_tok": 1,
112
  "num_hidden_layers": 48,
 
124
  "use_qk_norm": false,
125
  "vocab_size": 202048
126
  },
127
+ "tie_word_embeddings": false,
128
  "torch_dtype": "bfloat16",
129
+ "transformers_version": "4.52.1",
130
+ "unsloth_fixed": true,
131
  "vision_config": {
 
132
  "attention_dropout": 0.0,
133
  "hidden_act": "gelu",
134
  "hidden_size": 1408,
mmproj-F16.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26997cbf220cd74202e6630da16d357e9bf05f627367d4e2639b62182758399e
3
+ size 1746780960
mmproj-F32.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0441883528df7f707547c3ee3fce8ea5a07e0a52d7ff49bc94edd443e6af4261
3
+ size 3487762208