HunyuanImage-3.0-Instruct-Distil-INT8 / quantization_metadata.json
EricRollei's picture
Upload folder using huggingface_hub
c7c6837 verified
raw
history blame contribute delete
880 Bytes
{
"model_type": "HunyuanImage-3.0-Instruct-Distil",
"quantization_method": "bitsandbytes_int8",
"load_in_8bit": true,
"llm_int8_threshold": 6.0,
"expected_vram_gb": 18,
"expected_total_memory_gb": 20,
"total_params": "80B",
"active_params": "13B (MoE)",
"modules_kept_bf16": [
"vae",
"vision_model",
"vision_aligner",
"patch_embed",
"final_layer",
"time_embed",
"time_embed_2",
"timestep_emb",
"guidance_emb",
"timestep_r_emb",
"attention_projections"
],
"distil_features": {
"cfg_distilled": true,
"meanflow": true,
"description": "Single-step CFG-free generation with meanflow"
},
"notes": "Distilled Instruct model - fast inference, single-GPU friendly.",
"attention_layers_quantized": false,
"quality_vs_nf4": "Better quality than NF4 at a reasonable memory cost"
}