Spaces:
Running
Running
Add Q3 and Q6
Browse files
app.py
CHANGED
|
@@ -23,7 +23,9 @@ HF_TOKEN = os.environ.get("HF_TOKEN")
|
|
| 23 |
|
| 24 |
# I'm not sure if we need to add more stuff here
|
| 25 |
QUANT_PARAMS = {
|
|
|
|
| 26 |
"Q4": 4,
|
|
|
|
| 27 |
"Q8": 8,
|
| 28 |
}
|
| 29 |
|
|
@@ -139,7 +141,7 @@ with gr.Blocks(css=css) as demo:
|
|
| 139 |
)
|
| 140 |
|
| 141 |
q_method = gr.Dropdown(
|
| 142 |
-
["Q4", "Q8"],
|
| 143 |
label="Quantization Method",
|
| 144 |
info="MLX quantization type",
|
| 145 |
value="Q4",
|
|
|
|
| 23 |
|
| 24 |
# I'm not sure if we need to add more stuff here
|
| 25 |
QUANT_PARAMS = {
|
| 26 |
+
"Q3": 3,
|
| 27 |
"Q4": 4,
|
| 28 |
+
"Q6": 6,
|
| 29 |
"Q8": 8,
|
| 30 |
}
|
| 31 |
|
|
|
|
| 141 |
)
|
| 142 |
|
| 143 |
q_method = gr.Dropdown(
|
| 144 |
+
["Q3", "Q4", "Q6", "Q8"],
|
| 145 |
label="Quantization Method",
|
| 146 |
info="MLX quantization type",
|
| 147 |
value="Q4",
|