AutoGPTQ model for Alibaba-NLP/gte-Qwen2-1.5B-instruct: 8bits, gr128, desc_act=True
4e1b0bb
verified
{
  "bits": 8,
  "group_size": 128,
  "damp_percent": 0.01,
  "desc_act": true,
  "static_groups": false,
  "sym": true,
  "true_sequential": true,
  "model_name_or_path": null,
  "model_file_base_name": null,
  "is_marlin_format": false,
  "quant_method": "gptq"
}