fxmarty
/

llama-tiny-int4-per-group-sym

fxmarty committed on Oct 10

Commit

7c13bfb

•

1 Parent(s): 275cfae

Upload folder using huggingface_hub

Files changed (1) hide show

config.json CHANGED Viewed

@@ -21,42 +21,38 @@
   "pad_token_id": -1,
   "pretraining_tp": 1,
   "quantization_config": {
-    "library": "quark",
-    "quant_method": "quark",
-    "quark_config": {
-      "algo_config": null,
-      "exclude": [
-        "lm_head"
-      ],
-      "export": {
-        "kv_cache_group": [],
-        "pack_method": "reorder",
-        "weight_format": "real_quantized",
-        "weight_merge_groups": null
-      },
-      "global_quant_config": {
-        "bias": null,
-        "input_tensors": null,
-        "output_tensors": null,
-        "target_device": null,
-        "weight": {
-          "ch_axis": 1,
-          "dtype": "int4",
-          "group_size": 4,
-          "is_dynamic": false,
-          "observer_cls": "PerGroupMinMaxObserver",
-          "qscheme": "per_group",
-          "round_method": "half_even",
-          "scale_type": "float",
-          "symmetric": true
-        }
-      },
-      "layer_quant_config": {},
-      "layer_type_quant_config": {},
       "pack_method": "reorder",
-      "quant_method": "quark",
-      "quant_mode": 1
-    }
   },
   "rms_norm_eps": 1e-06,
   "rope_scaling": null,

   "pad_token_id": -1,
   "pretraining_tp": 1,
   "quantization_config": {
+    "algo_config": null,
+    "exclude": [
+      "lm_head"
+    ],
+    "export": {
+      "kv_cache_group": [],
       "pack_method": "reorder",
+      "weight_format": "real_quantized",
+      "weight_merge_groups": null
+    },
+    "global_quant_config": {
+      "bias": null,
+      "input_tensors": null,
+      "output_tensors": null,
+      "target_device": null,
+      "weight": {
+        "ch_axis": 1,
+        "dtype": "int4",
+        "group_size": 4,
+        "is_dynamic": false,
+        "observer_cls": "PerGroupMinMaxObserver",
+        "qscheme": "per_group",
+        "round_method": "half_even",
+        "scale_type": "float",
+        "symmetric": true
+      }
+    },
+    "layer_quant_config": {},
+    "layer_type_quant_config": {},
+    "pack_method": "reorder",
+    "quant_method": "quark",
+    "quant_mode": 1
   },
   "rms_norm_eps": 1e-06,
   "rope_scaling": null,