Spaces:
Running
Running
localghostx
committed on
Commit
•
6c86eb4
1
Parent(s):
345fe11
Add q2
Browse files
Adds 2-bit quantization to dropdown.
app.py
CHANGED
@@ -23,6 +23,7 @@ HF_TOKEN = os.environ.get("HF_TOKEN")
|
|
23 |
|
24 |
# I'm not sure if we need to add more stuff here
|
25 |
QUANT_PARAMS = {
|
|
|
26 |
"Q4": 4,
|
27 |
"Q8": 8,
|
28 |
}
|
@@ -139,7 +140,7 @@ with gr.Blocks(css=css) as demo:
|
|
139 |
)
|
140 |
|
141 |
q_method = gr.Dropdown(
|
142 |
-
["Q4", "Q8"],
|
143 |
label="Quantization Method",
|
144 |
info="MLX quantization type",
|
145 |
value="Q4",
|
|
|
23 |
|
24 |
# I'm not sure if we need to add more stuff here
|
25 |
QUANT_PARAMS = {
|
26 |
+
"Q2": 2,
|
27 |
"Q4": 4,
|
28 |
"Q8": 8,
|
29 |
}
|
|
|
140 |
)
|
141 |
|
142 |
q_method = gr.Dropdown(
|
143 |
+
["Q2", "Q4", "Q8"],
|
144 |
label="Quantization Method",
|
145 |
info="MLX quantization type",
|
146 |
value="Q4",
|