andito HF staff committed on
Commit
41f7529
1 Parent(s): c57b386

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -118,7 +118,7 @@ def process_model(model_id, q_method, use_imatrix, imatrix_q_method, private_rep
118
  print(f"Model directory contents: {os.listdir(local_dir)}")
119
 
120
  conversion_script = "convert_hf_to_gguf.py"
121
- fp16_conversion = f"python llama.cpp/{conversion_script} {local_dir} --outtype bf16 --outfile {fp16}"
122
  result = subprocess.run(fp16_conversion, shell=True, capture_output=True)
123
  print(result)
124
  if result.returncode != 0:
@@ -274,7 +274,7 @@ with gr.Blocks(css=css) as demo:
274
  )
275
 
276
  q_method = gr.Dropdown(
277
- ["Q2_K", "Q3_K_S", "Q3_K_M", "Q3_K_L", "Q4_0", "Q4_K_S", "Q4_K_M", "Q5_0", "Q5_K_S", "Q5_K_M", "Q6_K", "Q8_0", "F16", "BF16"],
278
  label="Quantization Method",
279
  info="GGML quantization type",
280
  value="Q4_K_M",
 
118
  print(f"Model directory contents: {os.listdir(local_dir)}")
119
 
120
  conversion_script = "convert_hf_to_gguf.py"
121
+ fp16_conversion = f"python llama.cpp/{conversion_script} {local_dir} --outtype f32 --outfile {fp16}"
122
  result = subprocess.run(fp16_conversion, shell=True, capture_output=True)
123
  print(result)
124
  if result.returncode != 0:
 
274
  )
275
 
276
  q_method = gr.Dropdown(
277
+ ["Q2_K", "Q3_K_S", "Q3_K_M", "Q3_K_L", "Q4_0", "Q4_K_S", "Q4_K_M", "Q5_0", "Q5_K_S", "Q5_K_M", "Q6_K", "Q8_0", "F16", "BF16", "F32"],
278
  label="Quantization Method",
279
  info="GGML quantization type",
280
  value="Q4_K_M",