sadkins65 committed on
Commit
172e719
·
verified ·
1 Parent(s): ad04724

Upload folder using huggingface_hub

Browse files
Files changed (3) hide show
  1. config.json +3 -3
  2. model.safetensors +2 -2
  3. recipe.yaml +1 -1
config.json CHANGED
@@ -31,14 +31,14 @@
31
  "num_bits": 8,
32
  "observer": "minmax",
33
  "observer_kwargs": {},
34
- "strategy": "channel",
35
  "symmetric": true,
36
  "type": "int"
37
  }
38
  }
39
  },
40
  "format": "int-quantized",
41
- "global_compression_ratio": 1.2390773684863086,
42
  "ignore": [
43
  "lm_head"
44
  ],
@@ -46,7 +46,7 @@
46
  "quantization_status": "frozen",
47
  "sparsity_config": {
48
  "format": "dense",
49
- "global_sparsity": 1.1879092038191659,
50
  "registry_requires_subclass": false,
51
  "sparsity_structure": "unstructured"
52
  }
 
31
  "num_bits": 8,
32
  "observer": "minmax",
33
  "observer_kwargs": {},
34
+ "strategy": "tensor",
35
  "symmetric": true,
36
  "type": "int"
37
  }
38
  }
39
  },
40
  "format": "int-quantized",
41
+ "global_compression_ratio": 1.2391304140415598,
42
  "ignore": [
43
  "lm_head"
44
  ],
 
46
  "quantization_status": "frozen",
47
  "sparsity_config": {
48
  "format": "dense",
49
+ "global_sparsity": 7.816310105138066,
50
  "registry_requires_subclass": false,
51
  "sparsity_structure": "unstructured"
52
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aa0a2b2eacbec0d3252875883400855a36e72eda3d6fc21d8d016e7961468748
3
- size 1232041608
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac67b97b962f72184b81cf65dbbf4551d7e238a96611de7f17a73960552d46dc
3
+ size 1231252556
recipe.yaml CHANGED
@@ -5,6 +5,6 @@ quant_stage:
5
  ignore: [lm_head]
6
  config_groups:
7
  group_0:
8
- weights: {num_bits: 8, type: int, symmetric: true, strategy: channel}
9
  input_activations: {num_bits: 8, type: int, symmetric: true, dynamic: true, strategy: token}
10
  targets: [Linear]
 
5
  ignore: [lm_head]
6
  config_groups:
7
  group_0:
8
+ weights: {num_bits: 8, type: int, symmetric: true, strategy: tensor}
9
  input_activations: {num_bits: 8, type: int, symmetric: true, dynamic: true, strategy: token}
10
  targets: [Linear]