Spaces:
Running
Running
Add Q3 and Q6
Browse files
app.py
CHANGED
@@ -23,7 +23,9 @@ HF_TOKEN = os.environ.get("HF_TOKEN")
 23 |
 24 |   # I'm not sure if we need to add more stuff here
 25 |   QUANT_PARAMS = {
    |
 26 |       "Q4": 4,
    |
 27 |       "Q8": 8,
 28 |   }
 29 |
@@ -139,7 +141,7 @@ with gr.Blocks(css=css) as demo:
139 |   )
140 |
141 |   q_method = gr.Dropdown(
142 | -     ["Q4", "Q8"],
143 |       label="Quantization Method",
144 |       info="MLX quantization type",
145 |       value="Q4",
 23 |
 24 |   # I'm not sure if we need to add more stuff here
 25 |   QUANT_PARAMS = {
 26 | +     "Q3": 3,
 27 |       "Q4": 4,
 28 | +     "Q6": 6,
 29 |       "Q8": 8,
 30 |   }
 31 |
141 |   )
142 |
143 |   q_method = gr.Dropdown(
144 | +     ["Q3", "Q4", "Q6", "Q8"],
145 |       label="Quantization Method",
146 |       info="MLX quantization type",
147 |       value="Q4",