Add config
Browse files - config.json +131 -0
config.json
ADDED
|
@@ -0,0 +1,131 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"model_type": "z-anime",
|
| 3 |
+
"architecture": "S3-DiT",
|
| 4 |
+
"parameters": "6B",
|
| 5 |
+
"license": "apache-2.0",
|
| 6 |
+
"base_model": "Tongyi-MAI/Z-Image",
|
| 7 |
+
"base_model_relation": "finetune",
|
| 8 |
+
"author": "SeeSee21",
|
| 9 |
+
"pipeline_tag": "text-to-image",
|
| 10 |
+
"prompting": {
|
| 11 |
+
"style": "natural-language",
|
| 12 |
+
"negative_prompt_support": {
|
| 13 |
+
"base": "full",
|
| 14 |
+
"distill_8step": "limited",
|
| 15 |
+
"distill_4step": "limited"
|
| 16 |
+
}
|
| 17 |
+
},
|
| 18 |
+
"variants": {
|
| 19 |
+
"base": {
|
| 20 |
+
"bf16": "diffusion_models/z-anime-base-bf16.safetensors",
|
| 21 |
+
"fp8": "diffusion_models/z-anime-base-fp8.safetensors",
|
| 22 |
+
"aio_bf16": "aio/z-anime-base-aio-bf16.safetensors",
|
| 23 |
+
"aio_fp8": "aio/z-anime-base-aio-fp8.safetensors",
|
| 24 |
+
"recommended_settings": {
|
| 25 |
+
"steps": "28-50",
|
| 26 |
+
"cfg": "3.0-5.0",
|
| 27 |
+
"sampler": "euler_ancestral",
|
| 28 |
+
"scheduler": "beta"
|
| 29 |
+
}
|
| 30 |
+
},
|
| 31 |
+
"distill_8step": {
|
| 32 |
+
"bf16": "diffusion_models/z-anime-distill-8step-bf16.safetensors",
|
| 33 |
+
"fp8": "diffusion_models/z-anime-distill-8step-fp8.safetensors",
|
| 34 |
+
"aio_bf16": "aio/z-anime-distill-8step-aio-bf16.safetensors",
|
| 35 |
+
"aio_fp8": "aio/z-anime-distill-8step-aio-fp8.safetensors",
|
| 36 |
+
"recommended_settings": {
|
| 37 |
+
"steps": 8,
|
| 38 |
+
"cfg": 1.0,
|
| 39 |
+
"sampler": "euler_ancestral",
|
| 40 |
+
"scheduler": "beta"
|
| 41 |
+
}
|
| 42 |
+
},
|
| 43 |
+
"distill_4step": {
|
| 44 |
+
"bf16": "diffusion_models/z-anime-distill-4step-bf16.safetensors",
|
| 45 |
+
"fp8": "diffusion_models/z-anime-distill-4step-fp8.safetensors",
|
| 46 |
+
"aio_bf16": "aio/z-anime-distill-4step-aio-bf16.safetensors",
|
| 47 |
+
"aio_fp8": "aio/z-anime-distill-4step-aio-fp8.safetensors",
|
| 48 |
+
"recommended_settings": {
|
| 49 |
+
"steps": 4,
|
| 50 |
+
"cfg": 1.0,
|
| 51 |
+
"sampler": "euler_ancestral",
|
| 52 |
+
"scheduler": "beta"
|
| 53 |
+
}
|
| 54 |
+
},
|
| 55 |
+
"gguf": {
|
| 56 |
+
"q8_0": {
|
| 57 |
+
"file": "gguf/z-anime-base-q8_0.gguf",
|
| 58 |
+
"description": "Q8_0 quantization",
|
| 59 |
+
"size": "~6.73 GB"
|
| 60 |
+
},
|
| 61 |
+
"q4_k_s": {
|
| 62 |
+
"file": "gguf/z-anime-base-q4_k_s.gguf",
|
| 63 |
+
"description": "Q4_K_S quantization",
|
| 64 |
+
"size": "~4.2 GB"
|
| 65 |
+
}
|
| 66 |
+
}
|
| 67 |
+
},
|
| 68 |
+
"diffusers_folder": {
|
| 69 |
+
"path": "diffusers/",
|
| 70 |
+
"pipeline_class": "ZImagePipeline",
|
| 71 |
+
"usage": "ZImagePipeline.from_pretrained('SeeSee21/Z-Anime', subfolder='diffusers', torch_dtype=torch.bfloat16)",
|
| 72 |
+
"components": [
|
| 73 |
+
"model_index.json",
|
| 74 |
+
"scheduler/",
|
| 75 |
+
"tokenizer/",
|
| 76 |
+
"text_encoder/",
|
| 77 |
+
"transformer/",
|
| 78 |
+
"vae/"
|
| 79 |
+
]
|
| 80 |
+
},
|
| 81 |
+
"components": {
|
| 82 |
+
"text_encoders": {
|
| 83 |
+
"default": {
|
| 84 |
+
"bf16": "text_encoder/qwen_3_4b-bf16.safetensors",
|
| 85 |
+
"fp8": "text_encoder/qwen_3_4b-fp8.safetensors",
|
| 86 |
+
"description": "Standard Z-Image text encoder, repackaged as a single safetensors file",
|
| 87 |
+
"comfyui_path": "ComfyUI/models/clip/"
|
| 88 |
+
},
|
| 89 |
+
"engineer_v4": {
|
| 90 |
+
"bf16": "text_encoder/qwen_3_4b-engineer-v4-bf16.safetensors",
|
| 91 |
+
"fp8": "text_encoder/qwen_3_4b-engineer-v4-fp8.safetensors",
|
| 92 |
+
"description": "Alternative full fine-tune by BennyDaBall (SMART training, more varied outputs)",
|
| 93 |
+
"source": "https://huggingface.co/BennyDaBall/Qwen3-4b-Z-Image-Engineer-V4",
|
| 94 |
+
"comfyui_path": "ComfyUI/models/clip/"
|
| 95 |
+
}
|
| 96 |
+
},
|
| 97 |
+
"vae": {
|
| 98 |
+
"file": "vae/ae.safetensors",
|
| 99 |
+
"description": "Z-Image VAE (lightly fine-tuned alongside Z-Anime)",
|
| 100 |
+
"comfyui_path": "ComfyUI/models/vae/"
|
| 101 |
+
}
|
| 102 |
+
},
|
| 103 |
+
"comfyui_paths": {
|
| 104 |
+
"diffusion_models": "ComfyUI/models/diffusion_models/",
|
| 105 |
+
"unet": "ComfyUI/models/unet/",
|
| 106 |
+
"clip": "ComfyUI/models/clip/",
|
| 107 |
+
"vae": "ComfyUI/models/vae/",
|
| 108 |
+
"checkpoints": "ComfyUI/models/checkpoints/"
|
| 109 |
+
},
|
| 110 |
+
"requirements": {
|
| 111 |
+
"custom_nodes": [
|
| 112 |
+
"rgthree-comfy",
|
| 113 |
+
"ComfyUI-Lora-Manager",
|
| 114 |
+
"ComfyUI-SeedVR2_VideoUpscaler (optional)"
|
| 115 |
+
]
|
| 116 |
+
},
|
| 117 |
+
"supported_vram": "8GB+",
|
| 118 |
+
"links": {
|
| 119 |
+
"civitai": "https://civitai.red/models/2483351",
|
| 120 |
+
"base_model": "https://huggingface.co/Tongyi-MAI/Z-Image",
|
| 121 |
+
"engineer_v4": "https://huggingface.co/BennyDaBall/Qwen3-4b-Z-Image-Engineer-V4",
|
| 122 |
+
"author": "https://huggingface.co/SeeSee21"
|
| 123 |
+
},
|
| 124 |
+
"notes": [
|
| 125 |
+
"BF16 and FP8 are the main release formats.",
|
| 126 |
+
"GGUF variants are intended for lower-memory or alternative inference setups.",
|
| 127 |
+
"AIO (all-in-one) variants bundle the diffusion model, text encoder, and VAE in a single file; they are available for Base, 8-Step, and 4-Step.",
|
| 128 |
+
"Two text encoders are included: the standard Z-Image one (default) and BennyDaBall's Engineer V4 (alternative).",
|
| 129 |
+
"The diffusers/ subfolder is a full diffusers-format checkpoint loadable via ZImagePipeline.from_pretrained(repo, subfolder='diffusers')."
|
| 130 |
+
]
|
| 131 |
+
}
|