mike-ravkine
committed on
Commit
•
3cb2c18
1
Parent(s):
4201307
Fix q_group_size
Browse files
README.md
CHANGED
@@ -54,7 +54,7 @@ tokenizer = AutoTokenizer.from_pretrained(config.tokenizer_name)
|
|
54 |
w_bit = 4
|
55 |
q_config = {
|
56 |
"zero_point": True,
|
57 |
-
"q_group_size":
|
58 |
}
|
59 |
|
60 |
load_quant = snapshot_download('abhinavkulkarni/tiiuae-falcon-40b-instruct-w4-g128-awq')
|
|
|
54 |
w_bit = 4
|
55 |
q_config = {
|
56 |
"zero_point": True,
|
57 |
+
"q_group_size": 128,
|
58 |
}
|
59 |
|
60 |
load_quant = snapshot_download('abhinavkulkarni/tiiuae-falcon-40b-instruct-w4-g128-awq')
|