mlx-my-repo

Running

AGCobra commited on 15 days ago

Commit

5a78369

•

1 Parent(s): 345fe11

Add Q3 and Q6

Files changed (1) hide show

app.py CHANGED Viewed

@@ -23,7 +23,9 @@ HF_TOKEN = os.environ.get("HF_TOKEN")
 # I'm not sure if we need to add more stuff here
 QUANT_PARAMS = {
     "Q4": 4,
     "Q8": 8,
 }
@@ -139,7 +141,7 @@ with gr.Blocks(css=css) as demo:
     )
     q_method = gr.Dropdown(
-        ["Q4", "Q8"],
         label="Quantization Method",
         info="MLX quantization type",
         value="Q4",

 # I'm not sure if we need to add more stuff here
 QUANT_PARAMS = {
+    "Q3": 3,
     "Q4": 4,
+    "Q6": 6,
     "Q8": 8,
 }
     )
     q_method = gr.Dropdown(
+        ["Q3", "Q4", "Q6", "Q8"],
         label="Quantization Method",
         info="MLX quantization type",
         value="Q4",