SekoiaTree committed on
Commit
d726661
·
verified ·
1 Parent(s): a00832f

Upload Qwen3ForCausalLM

Browse files
Files changed (2) hide show
  1. config.json +41 -13
  2. model.safetensors +2 -2
config.json CHANGED
@@ -48,19 +48,47 @@
48
  "num_hidden_layers": 28,
49
  "num_key_value_heads": 8,
50
  "quantization_config": {
51
- "_load_in_4bit": false,
52
- "_load_in_8bit": true,
53
- "bnb_4bit_compute_dtype": "float32",
54
- "bnb_4bit_quant_storage": "uint8",
55
- "bnb_4bit_quant_type": "fp4",
56
- "bnb_4bit_use_double_quant": false,
57
- "llm_int8_enable_fp32_cpu_offload": false,
58
- "llm_int8_has_fp16_weight": false,
59
- "llm_int8_skip_modules": null,
60
- "llm_int8_threshold": 6.0,
61
- "load_in_4bit": false,
62
- "load_in_8bit": true,
63
- "quant_method": "bitsandbytes"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
64
  },
65
  "rms_norm_eps": 1e-06,
66
  "rope_scaling": null,
 
48
  "num_hidden_layers": 28,
49
  "num_key_value_heads": 8,
50
  "quantization_config": {
51
+ "config_groups": {
52
+ "group_0": {
53
+ "input_activations": {
54
+ "actorder": null,
55
+ "block_structure": null,
56
+ "dynamic": true,
57
+ "group_size": null,
58
+ "num_bits": 8,
59
+ "observer": null,
60
+ "observer_kwargs": {},
61
+ "strategy": "token",
62
+ "symmetric": true,
63
+ "type": "int"
64
+ },
65
+ "output_activations": null,
66
+ "targets": [
67
+ "Linear"
68
+ ],
69
+ "weights": {
70
+ "actorder": null,
71
+ "block_structure": null,
72
+ "dynamic": false,
73
+ "group_size": 128,
74
+ "num_bits": 4,
75
+ "observer": "minmax",
76
+ "observer_kwargs": {},
77
+ "strategy": "group",
78
+ "symmetric": true,
79
+ "type": "int"
80
+ }
81
+ }
82
+ },
83
+ "format": "int-quantized",
84
+ "global_compression_ratio": null,
85
+ "ignore": [
86
+ "lm_head"
87
+ ],
88
+ "kv_cache_scheme": null,
89
+ "quant_method": "compressed-tensors",
90
+ "quantization_status": "compressed",
91
+ "sparsity_config": {}
92
  },
93
  "rms_norm_eps": 1e-06,
94
  "rope_scaling": null,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:30df4133101af2c245680289f4f1d5cf7d2ed5a6e817af40e8fbd90cb0454426
3
- size 753150052
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b21d16025170d7668261760c174173b5ea50c5014c1768eed6b40878b676302
3
+ size 758636616