nm-autobot
committed on
Upload folder using huggingface_hub
Browse files
- recipe.yaml +7 -0
recipe.yaml
CHANGED
@@ -2,3 +2,10 @@ quant_stage:
   quant_modifiers:
     QuantizationModifier:
       kv_cache_scheme: {num_bits: 8, type: float, symmetric: true, strategy: tensor}
+    GPTQModifier:
+      sequential_update: false
+      ignore: [lm_head]
+      config_groups:
+        group_0:
+          weights: {num_bits: 4, type: int, symmetric: true, strategy: channel, actorder: false}
+          targets: [Linear]