Spaces:
Running
on
A10G
Running
on
A10G
Add F16 and BF16 quantization
Browse files
app.py
CHANGED
@@ -274,7 +274,7 @@ with gr.Blocks(css=css) as demo:
|
|
274 |
)
|
275 |
|
276 |
q_method = gr.Dropdown(
|
277 |
-
["Q2_K", "Q3_K_S", "Q3_K_M", "Q3_K_L", "Q4_0", "Q4_K_S", "Q4_K_M", "Q5_0", "Q5_K_S", "Q5_K_M", "Q6_K", "Q8_0"],
|
278 |
label="Quantization Method",
|
279 |
info="GGML quantization type",
|
280 |
value="Q4_K_M",
|
|
|
274 |
)
|
275 |
|
276 |
q_method = gr.Dropdown(
|
277 |
+
["Q2_K", "Q3_K_S", "Q3_K_M", "Q3_K_L", "Q4_0", "Q4_K_S", "Q4_K_M", "Q5_0", "Q5_K_S", "Q5_K_M", "Q6_K", "Q8_0", "F16", "BF16"],
|
278 |
label="Quantization Method",
|
279 |
info="GGML quantization type",
|
280 |
value="Q4_K_M",
|