wenhuach committed on
Commit
fc1640b
·
1 Parent(s): f769926

update to gptq format

Browse files

Signed-off-by: wenhuach <wenhuach87@gmail.com>

Files changed (1) hide show
  1. config.json +1 -2
config.json CHANGED
@@ -38,7 +38,6 @@
38
  "qk_nope_head_dim": 128,
39
  "qk_rope_head_dim": 64,
40
  "quantization_config": {
41
- "backend": "auto_round:gptq:exllamav2",
42
  "amp": true,
43
  "autoround_version": "0.4.3",
44
  "batch_size": 8,
@@ -56,7 +55,7 @@
56
  "lr": 0.005,
57
  "minmax_lr": 0.005,
58
  "nsamples": 512,
59
- "quant_method": "intel/auto-round",
60
  "scale_dtype": "torch.float16",
61
  "seqlen": 512,
62
  "sym": true,
 
38
  "qk_nope_head_dim": 128,
39
  "qk_rope_head_dim": 64,
40
  "quantization_config": {
 
41
  "amp": true,
42
  "autoround_version": "0.4.3",
43
  "batch_size": 8,
 
55
  "lr": 0.005,
56
  "minmax_lr": 0.005,
57
  "nsamples": 512,
58
+ "quant_method": "gptq",
59
  "scale_dtype": "torch.float16",
60
  "seqlen": 512,
61
  "sym": true,