8bit_agressive / quantization_info.json

Upload quantization_info.json with huggingface_hub

0af2a02 verified 7 months ago

667 Bytes

	{
	"model_name": "luca-deandrea/MNLP_M3_mcqa_model",
	"quantization_method": "bitsandbytes",
	"config_name": "bnb_8bit_aggressive",
	"description": "8-bit with aggressive quantization",
	"expected_compression": "~4x",
	"quantization_config": {
	"load_in_4bit": false,
	"load_in_8bit": true,
	"bnb_4bit_quant_type": "fp4",
	"bnb_4bit_use_double_quant": false,
	"bnb_4bit_compute_dtype": "torch.float32",
	"llm_int8_threshold": 0.0
	},
	"timestamp": "2025-06-10 21:32:18",
	"loading_time_seconds": 10.248082876205444,
	"memory_usage_gb": 0.7341856956481934,
	"test_generation": "Hello, I am a student who has been working on a project to"
	}