"""Print a per-layer summary of a quantized checkpoint blob.

The blob is expected to be a mapping of layer name -> dict with the keys
``q_dtype``, ``original_shape`` and ``q_weight`` (an object exposing
``.shape``); those are the only fields this script reads.
"""

import torch

blob_path = "./llama-2-chat-7b_r0.8_g128.pth"


def format_layer_row(layer, attr):
    """Return one aligned summary line for a single layer entry.

    Args:
        layer: Layer name (the blob's key).
        attr: Mapping providing ``q_dtype``, ``original_shape`` and
            ``q_weight`` (only ``q_weight.shape`` is read).

    Returns:
        The formatted row as a string, without a trailing newline.
    """
    # Every value is passed through str() before the width spec is applied:
    # objects that do not implement __format__ (a dtype object, a shape
    # tuple) raise TypeError when given a non-empty format spec.
    q_dtype = str(attr["q_dtype"])
    original_shape = str(attr["original_shape"])
    quantized_shape = str(attr["q_weight"].shape)
    return (
        f"{layer:30} | q_dtype: {q_dtype:5} | "
        f"orig. shape: {original_shape:15} | "
        f"quantized_shape: {quantized_shape:15}"
    )


def main(path=blob_path):
    """Load the blob at *path* and print one summary row per layer."""
    # NOTE(security): torch.load unpickles the file; only point this at
    # checkpoints from a trusted source.
    # map_location="cpu" lets the summary run on machines without the device
    # the tensors were saved from; only shapes are printed, so the output is
    # unaffected.
    blob = torch.load(path, map_location="cpu")
    for layer, attr in blob.items():
        print(format_layer_row(layer, attr))
    print("done.")


if __name__ == "__main__":
    main()