dsikka committed on
Commit
8db253e
1 Parent(s): 0f24a3f

Upload folder using huggingface_hub

Browse files
Files changed (3) hide show
  1. config.json +3 -3
  2. model.safetensors +2 -2
  3. recipe.yaml +7 -4
config.json CHANGED
@@ -28,7 +28,7 @@
28
  "Linear"
29
  ],
30
  "weights": {
31
- "actorder": null,
32
  "block_structure": null,
33
  "dynamic": false,
34
  "group_size": 128,
@@ -42,7 +42,7 @@
42
  }
43
  },
44
  "format": "pack-quantized",
45
- "global_compression_ratio": 1.883165566487463,
46
  "ignore": [
47
  "lm_head"
48
  ],
@@ -51,7 +51,7 @@
51
  "quantization_status": "compressed",
52
  "sparsity_config": {
53
  "format": "dense",
54
- "global_sparsity": 0.14375328644374685,
55
  "ignore": [],
56
  "registry_requires_subclass": false,
57
  "sparsity_structure": "unstructured",
 
28
  "Linear"
29
  ],
30
  "weights": {
31
+ "actorder": "group",
32
  "block_structure": null,
33
  "dynamic": false,
34
  "group_size": 128,
 
42
  }
43
  },
44
  "format": "pack-quantized",
45
+ "global_compression_ratio": 1.8833636632816793,
46
  "ignore": [
47
  "lm_head"
48
  ],
 
51
  "quantization_status": "compressed",
52
  "sparsity_config": {
53
  "format": "dense",
54
+ "global_sparsity": 0.1407252015594666,
55
  "ignore": [],
56
  "registry_requires_subclass": false,
57
  "sparsity_structure": "unstructured",
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:892873b79abcf66508b526a74179177e303de9b4b1464a6177096348faa7fd76
3
- size 761968800
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a526374315ca3ab080a4c930dac9144a8a2a738a69ba9446ef6027e9fd2ab1e9
3
+ size 763563248
recipe.yaml CHANGED
@@ -1,6 +1,9 @@
1
- DEFAULT_stage:
2
- DEFAULT_modifiers:
3
  GPTQModifier:
4
- targets: Linear
5
  ignore: [lm_head]
6
- scheme: W4A16
 
 
 
 
 
1
+ quant_stage:
2
+ quant_modifiers:
3
  GPTQModifier:
 
4
  ignore: [lm_head]
5
+ config_groups:
6
+ group_0:
7
+ weights: {num_bits: 4, type: int, symmetric: true, strategy: group, group_size: 128,
8
+ actorder: group}
9
+ targets: [Linear]