abhinavkulkarni
committed on
Commit
•
8f8f68c
1
Parent(s):
c0eee97
Update README.md
Browse files
README.md
CHANGED
@@ -63,7 +63,7 @@ q_config = {
|
|
63 |
load_quant = hf_hub_download('abhinavkulkarni/falcon-7b-instruct-w4-g64-awq', 'pytorch_model.bin')
|
64 |
|
65 |
with init_empty_weights():
|
66 |
-
model = AutoModelForCausalLM.
|
67 |
torch_dtype=torch.float16, trust_remote_code=True)
|
68 |
|
69 |
real_quantize_model_weight(model, w_bit=w_bit, q_config=q_config, init_only=True)
|
|
|
63 |
load_quant = hf_hub_download('abhinavkulkarni/falcon-7b-instruct-w4-g64-awq', 'pytorch_model.bin')
|
64 |
|
65 |
with init_empty_weights():
|
66 |
+
model = AutoModelForCausalLM.from_config(config=config,
|
67 |
torch_dtype=torch.float16, trust_remote_code=True)
|
68 |
|
69 |
real_quantize_model_weight(model, w_bit=w_bit, q_config=q_config, init_only=True)
|