Upload folder using huggingface_hub
Browse files
- config.json +3 -3
- model.safetensors +2 -2
- recipe.yaml +1 -1
config.json
CHANGED
|
@@ -32,14 +32,14 @@
|
|
| 32 |
"num_bits": 8,
|
| 33 |
"observer": "minmax",
|
| 34 |
"observer_kwargs": {},
|
| 35 |
-
"strategy": "
|
| 36 |
"symmetric": true,
|
| 37 |
"type": "int"
|
| 38 |
}
|
| 39 |
}
|
| 40 |
},
|
| 41 |
"format": "int-quantized",
|
| 42 |
-
"global_compression_ratio": 1.
|
| 43 |
"ignore": [
|
| 44 |
"lm_head"
|
| 45 |
],
|
|
@@ -48,7 +48,7 @@
|
|
| 48 |
},
|
| 49 |
"sparsity_config": {
|
| 50 |
"format": "dense",
|
| 51 |
-
"global_sparsity":
|
| 52 |
"registry_requires_subclass": false,
|
| 53 |
"sparsity_structure": "unstructured"
|
| 54 |
}
|
|
|
|
| 32 |
"num_bits": 8,
|
| 33 |
"observer": "minmax",
|
| 34 |
"observer_kwargs": {},
|
| 35 |
+
"strategy": "tensor",
|
| 36 |
"symmetric": true,
|
| 37 |
"type": "int"
|
| 38 |
}
|
| 39 |
}
|
| 40 |
},
|
| 41 |
"format": "int-quantized",
|
| 42 |
+
"global_compression_ratio": 1.2391304140415598,
|
| 43 |
"ignore": [
|
| 44 |
"lm_head"
|
| 45 |
],
|
|
|
|
| 48 |
},
|
| 49 |
"sparsity_config": {
|
| 50 |
"format": "dense",
|
| 51 |
+
"global_sparsity": 7.819650685473849,
|
| 52 |
"registry_requires_subclass": false,
|
| 53 |
"sparsity_structure": "unstructured"
|
| 54 |
}
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:68c532b04501830ec5a92b14272c2cb59b8b419a2c521e57152457fb88243d5c
|
| 3 |
+
size 1231252556
|
recipe.yaml
CHANGED
|
@@ -5,6 +5,6 @@ quant_stage:
|
|
| 5 |
ignore: [lm_head]
|
| 6 |
config_groups:
|
| 7 |
group_0:
|
| 8 |
-
weights: {num_bits: 8, type: int, symmetric: true, strategy:
|
| 9 |
input_activations: {num_bits: 8, type: int, symmetric: true, dynamic: true, strategy: token}
|
| 10 |
targets: [Linear]
|
|
|
|
| 5 |
ignore: [lm_head]
|
| 6 |
config_groups:
|
| 7 |
group_0:
|
| 8 |
+
weights: {num_bits: 8, type: int, symmetric: true, strategy: tensor}
|
| 9 |
input_activations: {num_bits: 8, type: int, symmetric: true, dynamic: true, strategy: token}
|
| 10 |
targets: [Linear]
|