{
"model_type": "z-anime",
"architecture": "S3-DiT",
"parameters": "6B",
"license": "apache-2.0",
"base_model": "Tongyi-MAI/Z-Image",
"base_model_relation": "finetune",
"author": "SeeSee21",
"pipeline_tag": "text-to-image",
"prompting": {
"style": "natural-language",
"negative_prompt_support": {
"base": "full",
"distill_8step": "limited",
"distill_4step": "limited"
}
},
"variants": {
"base": {
"bf16": "diffusion_models/z-anime-base-bf16.safetensors",
"fp8": "diffusion_models/z-anime-base-fp8.safetensors",
"aio_bf16": "aio/z-anime-base-aio-bf16.safetensors",
"aio_fp8": "aio/z-anime-base-aio-fp8.safetensors",
"recommended_settings": {
"steps": "28-50",
"cfg": "3.0-5.0",
"sampler": "euler_ancestral",
"scheduler": "beta"
}
},
"distill_8step": {
"bf16": "diffusion_models/z-anime-distill-8step-bf16.safetensors",
"fp8": "diffusion_models/z-anime-distill-8step-fp8.safetensors",
"aio_bf16": "aio/z-anime-distill-8step-aio-bf16.safetensors",
"aio_fp8": "aio/z-anime-distill-8step-aio-fp8.safetensors",
"recommended_settings": {
"steps": 8,
"cfg": 1.0,
"sampler": "euler_ancestral",
"scheduler": "beta"
}
},
"distill_4step": {
"bf16": "diffusion_models/z-anime-distill-4step-bf16.safetensors",
"fp8": "diffusion_models/z-anime-distill-4step-fp8.safetensors",
"aio_bf16": "aio/z-anime-distill-4step-aio-bf16.safetensors",
"aio_fp8": "aio/z-anime-distill-4step-aio-fp8.safetensors",
"recommended_settings": {
"steps": 4,
"cfg": 1.0,
"sampler": "euler_ancestral",
"scheduler": "beta"
}
},
"gguf": {
"q8_0": {
"file": "gguf/z-anime-base-q8_0.gguf",
"description": "Q8_0 quantization",
"size": "~6.73 GB"
},
"q4_k_s": {
"file": "gguf/z-anime-base-q4_k_s.gguf",
"description": "Q4_K_S quantization",
"size": "~4.2 GB"
}
}
},
"diffusers_folder": {
"path": "diffusers/",
"pipeline_class": "ZImagePipeline",
"usage": "ZImagePipeline.from_pretrained('SeeSee21/Z-Anime', subfolder='diffusers', torch_dtype=torch.bfloat16)",
"components": [
"model_index.json",
"scheduler/",
"tokenizer/",
"text_encoder/",
"transformer/",
"vae/"
]
},
"components": {
"text_encoders": {
"default": {
"bf16": "text_encoder/qwen_3_4b-bf16.safetensors",
"fp8": "text_encoder/qwen_3_4b-fp8.safetensors",
"description": "Standard Z-Image text encoder, repackaged as a single safetensors file",
"comfyui_path": "ComfyUI/models/clip/"
},
"engineer_v4": {
"bf16": "text_encoder/qwen_3_4b-engineer-v4-bf16.safetensors",
"fp8": "text_encoder/qwen_3_4b-engineer-v4-fp8.safetensors",
"description": "Alternative full fine-tune by BennyDaBall (SMART training, more varied outputs)",
"source": "https://huggingface.co/BennyDaBall/Qwen3-4b-Z-Image-Engineer-V4",
"comfyui_path": "ComfyUI/models/clip/"
}
},
"vae": {
"file": "vae/ae.safetensors",
"description": "Z-Image VAE (lightly fine-tuned alongside Z-Anime)",
"comfyui_path": "ComfyUI/models/vae/"
}
},
"comfyui_paths": {
"diffusion_models": "ComfyUI/models/diffusion_models/",
"unet": "ComfyUI/models/unet/",
"clip": "ComfyUI/models/clip/",
"vae": "ComfyUI/models/vae/",
"checkpoints": "ComfyUI/models/checkpoints/"
},
"requirements": {
"custom_nodes": [
"rgthree-comfy",
"ComfyUI-Lora-Manager",
"ComfyUI-SeedVR2_VideoUpscaler (optional)"
]
},
"supported_vram": "8GB+",
"links": {
"civitai": "https://civitai.red/models/2483351",
"base_model": "https://huggingface.co/Tongyi-MAI/Z-Image",
"engineer_v4": "https://huggingface.co/BennyDaBall/Qwen3-4b-Z-Image-Engineer-V4",
"author": "https://huggingface.co/SeeSee21"
},
"notes": [
"BF16 and FP8 are the main release formats.",
"GGUF variants are intended for lower-memory or alternative inference setups.",
"AIO (all-in-one) variants bundle the diffusion model, Text Encoder, and VAE in a single file (Base, 4-Step, 8-Step).",
"Two text encoders are included: the standard Z-Image one (default) and BennyDaBall's Engineer V4 (alternative).",
"The diffusers/ subfolder is a full diffusers-format checkpoint loadable via ZImagePipeline.from_pretrained(repo, subfolder='diffusers')."
]
}