Spaces:
Paused
Paused
Update app.py
Browse files
app.py
CHANGED
@@ -118,7 +118,7 @@ def process_model(model_id, q_method, use_imatrix, imatrix_q_method, private_rep
|
|
118 |
print(f"Model directory contents: {os.listdir(local_dir)}")
|
119 |
|
120 |
conversion_script = "convert_hf_to_gguf.py"
|
121 |
-
fp16_conversion = f"python llama.cpp/{conversion_script} {local_dir} --outtype f16 --outfile {fp16}"
|
122 |
result = subprocess.run(fp16_conversion, shell=True, capture_output=True)
|
123 |
print(result)
|
124 |
if result.returncode != 0:
|
@@ -274,7 +274,7 @@ with gr.Blocks(css=css) as demo:
|
|
274 |
)
|
275 |
|
276 |
q_method = gr.Dropdown(
|
277 |
-
["Q2_K", "Q3_K_S", "Q3_K_M", "Q3_K_L", "Q4_0", "Q4_K_S", "Q4_K_M", "Q5_0", "Q5_K_S", "Q5_K_M", "Q6_K", "Q8_0", "F16", "BF16"],
|
278 |
label="Quantization Method",
|
279 |
info="GGML quantization type",
|
280 |
value="Q4_K_M",
|
|
|
118 |
print(f"Model directory contents: {os.listdir(local_dir)}")
|
119 |
|
120 |
conversion_script = "convert_hf_to_gguf.py"
|
121 |
+
fp16_conversion = f"python llama.cpp/{conversion_script} {local_dir} --outtype f32 --outfile {fp16}"
|
122 |
result = subprocess.run(fp16_conversion, shell=True, capture_output=True)
|
123 |
print(result)
|
124 |
if result.returncode != 0:
|
|
|
274 |
)
|
275 |
|
276 |
q_method = gr.Dropdown(
|
277 |
+
["Q2_K", "Q3_K_S", "Q3_K_M", "Q3_K_L", "Q4_0", "Q4_K_S", "Q4_K_M", "Q5_0", "Q5_K_S", "Q5_K_M", "Q6_K", "Q8_0", "F16", "BF16", "F32"],
|
278 |
label="Quantization Method",
|
279 |
info="GGML quantization type",
|
280 |
value="Q4_K_M",
|