Set `half` from `cfg.fp16` when loading 4-bit models
Browse files
src/axolotl/utils/models.py
CHANGED
@@ -112,6 +112,7 @@ def load_model(
|
|
112 |
base_model_config if base_model_config else base_model,
|
113 |
model_path,
|
114 |
device_map=cfg.device_map,
|
|
|
115 |
groupsize=cfg.gptq_groupsize if cfg.gptq_groupsize else -1,
|
116 |
is_v1_model=cfg.gptq_model_v1
|
117 |
if cfg.gptq_model_v1 is not None
|
|
|
112 |
base_model_config if base_model_config else base_model,
|
113 |
model_path,
|
114 |
device_map=cfg.device_map,
|
115 |
+
half=cfg.fp16,
|
116 |
groupsize=cfg.gptq_groupsize if cfg.gptq_groupsize else -1,
|
117 |
is_v1_model=cfg.gptq_model_v1
|
118 |
if cfg.gptq_model_v1 is not None
|