nm-autobot
committed on
Upload folder using huggingface_hub
Browse files
- recipe.yaml +0 -7
recipe.yaml
CHANGED
@@ -2,10 +2,3 @@ quant_stage:
|
|
2 |
quant_modifiers:
|
3 |
QuantizationModifier:
|
4 |
kv_cache_scheme: {num_bits: 8, type: float, symmetric: true, strategy: tensor}
|
5 |
-
GPTQModifier:
|
6 |
-
sequential_update: false
|
7 |
-
ignore: [lm_head]
|
8 |
-
config_groups:
|
9 |
-
group_0:
|
10 |
-
weights: {num_bits: 4, type: int, symmetric: true, strategy: channel, actorder: false}
|
11 |
-
targets: [Linear]
|
|
|
2 |
quant_modifiers:
|
3 |
QuantizationModifier:
|
4 |
kv_cache_scheme: {num_bits: 8, type: float, symmetric: true, strategy: tensor}
|
|
|
|
|
|
|
|
|
|
|
|
|
|