mlx-my-repo

Running

localghostx committed 5 days ago

Commit

6c86eb4

•

1 Parent(s): 345fe11

Add q2

Adds 2-bit quantization to dropdown.

Files changed (1) hide show

app.py CHANGED Viewed

@@ -23,6 +23,7 @@ HF_TOKEN = os.environ.get("HF_TOKEN")
 # I'm not sure if we need to add more stuff here
 QUANT_PARAMS = {
     "Q4": 4,
     "Q8": 8,
 }
@@ -139,7 +140,7 @@ with gr.Blocks(css=css) as demo:
     )
     q_method = gr.Dropdown(
-        ["Q4", "Q8"],
         label="Quantization Method",
         info="MLX quantization type",
         value="Q4",

 # I'm not sure if we need to add more stuff here
 QUANT_PARAMS = {
+    "Q2": 2,
     "Q4": 4,
     "Q8": 8,
 }
     )
     q_method = gr.Dropdown(
+        ["Q2", "Q4", "Q8"],
         label="Quantization Method",
         info="MLX quantization type",
         value="Q4",