File size: 1,207 Bytes
a9fdace |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 |
#!/usr/bin/env python3
"""
Quantize a GGUF model file to 8-bit (q8_0) by invoking llama.cpp's llama-quantize binary.
"""
import os
import subprocess
import sys
def quantize_8bit(
    *,
    input_path: str = "trained_models/isaac_sim_hf/gguf_final/isaac_sim_qwen2.5_coder.gguf",
    output_path: str = "trained_models/isaac_sim_hf/gguf_final/isaac_sim_qwen2.5_coder_q8_0.gguf",
    quantize_bin: str = "../../llama.cpp/build/bin/llama-quantize",
) -> bool:
    """Quantize a GGUF model file to 8-bit (``q8_0``) via ``llama-quantize``.

    Runs ``<quantize_bin> <input_path> <output_path> q8_0`` as a child
    process and reports progress on stdout.  The default paths are relative,
    so they are resolved against the current working directory.

    Args:
        input_path: Path of the source GGUF file; must already exist.
        output_path: Path the quantized file is written to by the tool.
        quantize_bin: Path of the ``llama-quantize`` executable.

    Returns:
        True when the tool exits with status 0.  False when the input file
        is missing, the executable cannot be launched, or the tool exits
        with a non-zero status.
    """
    if not os.path.exists(input_path):
        print(f"❌ Input file not found: {input_path}")
        return False

    print(f"🔢 Quantizing to 8-bit: {input_path} -> {output_path}")
    cmd = [quantize_bin, input_path, output_path, "q8_0"]

    # Keep the try body to the one call that can raise the handled errors.
    try:
        subprocess.run(cmd, capture_output=True, text=True, check=True)
    except subprocess.CalledProcessError as e:
        # The tool ran but exited non-zero; its captured stderr has the reason.
        print(f"❌ 8-bit quantization failed: {e.stderr}")
        return False
    except OSError as e:
        # The executable is missing or not runnable (FileNotFoundError,
        # PermissionError, ...): report it instead of crashing.
        print(f"❌ 8-bit quantization failed: {e}")
        return False

    print("✅ 8-bit quantization completed")
    if os.path.exists(output_path):
        size_mb = os.path.getsize(output_path) / (1024 * 1024)
        print(f"📊 8-bit file size: {size_mb:.1f} MB")
    return True
if __name__ == "__main__":
    # Map the boolean outcome to a process exit status: 0 on success, 1 on failure.
    exit_code = 0 if quantize_8bit() else 1
    sys.exit(exit_code)
|