ahmedaeb's picture
Upload All Files
b294e23
from onnxruntime import optimizer
# Specify the models you want to optimize
models = [
'onnx/decoder_model.onnx',
'onnx/decoder_model_merged.onnx',
'onnx/decoder_model_merged_quantized.onnx',
'onnx/decoder_model_quantized.onnx',
'onnx/decoder_with_past_model.onnx',
'onnx/decoder_with_past_model_quantized.onnx',
'onnx/encoder_model.onnx',
'onnx/encoder_model_quantized.onnx'
]
for model_path in models:
# Load and optimize the model
optimized_model = optimizer.optimize_model(model_path)
# Save the optimized model
optimized_model.save_model_to_file(model_path.replace('.onnx', '_optimized.onnx'))