# Build a TensorRT engine from model.onnx with trtexec and save it as model.plan.
#
# Flags, as described by the trtexec command-line help:
#   --fp16             permit FP16 precision when building the engine.
#   --minShapes /
#   --optShapes /
#   --maxShapes        dynamic-shape range for input_ids and attention_mask:
#                      first dimension 1..32 (optimised for 8), second
#                      dimension fixed at 128.
#   --saveEngine       path the serialized engine is written to.
#   --shapes           input shapes used for the inference run; set here to the
#                      same 8x128 as --optShapes.
#   --inputIOFormats   type:format for each input, one entry per input.
#                      NOTE(review): entries presumably follow the network's
#                      input order (input_ids, attention_mask), and int64 I/O
#                      is only accepted by newer TensorRT releases -- confirm
#                      against the installed version.
#   --onnx             ONNX model to parse.
#
# Every continued line must end in a bare backslash immediately before the
# newline; any trailing characters after it (e.g. table-cell "|" residue)
# break the continuation and make the shell reject the command.
trtexec \
  --fp16 \
  --minShapes=input_ids:1x128,attention_mask:1x128 \
  --optShapes=input_ids:8x128,attention_mask:8x128 \
  --maxShapes=input_ids:32x128,attention_mask:32x128 \
  --saveEngine=model.plan \
  --shapes=input_ids:8x128,attention_mask:8x128 \
  --inputIOFormats="int64:chw,int64:chw" \
  --onnx=model.onnx