| { |
| "model_type": "z-anime", |
| "architecture": "S3-DiT", |
| "parameters": "6B", |
| "license": "apache-2.0", |
| "base_model": "Tongyi-MAI/Z-Image", |
| "base_model_relation": "finetune", |
| "author": "SeeSee21", |
| "pipeline_tag": "text-to-image", |
| "prompting": { |
| "style": "natural-language", |
| "negative_prompt_support": { |
| "base": "full", |
| "distill_8step": "limited", |
| "distill_4step": "limited" |
| } |
| }, |
| "variants": { |
| "base": { |
| "bf16": "diffusion_models/z-anime-base-bf16.safetensors", |
| "fp8": "diffusion_models/z-anime-base-fp8.safetensors", |
| "aio_bf16": "aio/z-anime-base-aio-bf16.safetensors", |
| "aio_fp8": "aio/z-anime-base-aio-fp8.safetensors", |
| "recommended_settings": { |
| "steps": "28-50", |
| "cfg": "3.0-5.0", |
| "sampler": "euler_ancestral", |
| "scheduler": "beta" |
| } |
| }, |
| "distill_8step": { |
| "bf16": "diffusion_models/z-anime-distill-8step-bf16.safetensors", |
| "fp8": "diffusion_models/z-anime-distill-8step-fp8.safetensors", |
| "aio_bf16": "aio/z-anime-distill-8step-aio-bf16.safetensors", |
| "aio_fp8": "aio/z-anime-distill-8step-aio-fp8.safetensors", |
| "recommended_settings": { |
| "steps": 8, |
| "cfg": 1.0, |
| "sampler": "euler_ancestral", |
| "scheduler": "beta" |
| } |
| }, |
| "distill_4step": { |
| "bf16": "diffusion_models/z-anime-distill-4step-bf16.safetensors", |
| "fp8": "diffusion_models/z-anime-distill-4step-fp8.safetensors", |
| "aio_bf16": "aio/z-anime-distill-4step-aio-bf16.safetensors", |
| "aio_fp8": "aio/z-anime-distill-4step-aio-fp8.safetensors", |
| "recommended_settings": { |
| "steps": 4, |
| "cfg": 1.0, |
| "sampler": "euler_ancestral", |
| "scheduler": "beta" |
| } |
| }, |
| "gguf": { |
| "q8_0": { |
| "file": "gguf/z-anime-base-q8_0.gguf", |
| "description": "Q8_0 quantization", |
| "size": "~6.73 GB" |
| }, |
| "q4_k_s": { |
| "file": "gguf/z-anime-base-q4_k_s.gguf", |
| "description": "Q4_K_S quantization", |
| "size": "~4.2 GB" |
| } |
| } |
| }, |
| "diffusers_folder": { |
| "path": "diffusers/", |
| "pipeline_class": "ZImagePipeline", |
| "usage": "ZImagePipeline.from_pretrained('SeeSee21/Z-Anime', subfolder='diffusers', torch_dtype=torch.bfloat16)", |
| "components": [ |
| "model_index.json", |
| "scheduler/", |
| "tokenizer/", |
| "text_encoder/", |
| "transformer/", |
| "vae/" |
| ] |
| }, |
| "components": { |
| "text_encoders": { |
| "default": { |
| "bf16": "text_encoder/qwen_3_4b-bf16.safetensors", |
| "fp8": "text_encoder/qwen_3_4b-fp8.safetensors", |
| "description": "Standard Z-Image text encoder, repackaged as a single safetensors file", |
| "comfyui_path": "ComfyUI/models/clip/" |
| }, |
| "engineer_v4": { |
| "bf16": "text_encoder/qwen_3_4b-engineer-v4-bf16.safetensors", |
| "fp8": "text_encoder/qwen_3_4b-engineer-v4-fp8.safetensors", |
| "description": "Alternative full fine-tune by BennyDaBall (SMART training, more varied outputs)", |
| "source": "https://huggingface.co/BennyDaBall/Qwen3-4b-Z-Image-Engineer-V4", |
| "comfyui_path": "ComfyUI/models/clip/" |
| } |
| }, |
| "vae": { |
| "file": "vae/ae.safetensors", |
| "description": "Z-Image VAE (slightly trained alongside Z-Anime)", |
| "comfyui_path": "ComfyUI/models/vae/" |
| } |
| }, |
| "comfyui_paths": { |
| "diffusion_models": "ComfyUI/models/diffusion_models/", |
| "unet": "ComfyUI/models/unet/", |
| "clip": "ComfyUI/models/clip/", |
| "vae": "ComfyUI/models/vae/", |
| "checkpoints": "ComfyUI/models/checkpoints/" |
| }, |
| "requirements": { |
| "custom_nodes": [ |
| "rgthree-comfy", |
| "ComfyUI-Lora-Manager", |
| "ComfyUI-SeedVR2_VideoUpscaler (optional)" |
| ] |
| }, |
| "supported_vram": "8GB+", |
| "links": { |
| "civitai": "https://civitai.red/models/2483351", |
| "base_model": "https://huggingface.co/Tongyi-MAI/Z-Image", |
| "engineer_v4": "https://huggingface.co/BennyDaBall/Qwen3-4b-Z-Image-Engineer-V4", |
| "author": "https://huggingface.co/SeeSee21" |
| }, |
| "notes": [ |
| "BF16 and FP8 are the main release formats.", |
| "GGUF variants are intended for lower-memory or alternative inference setups.", |
| "AIO variants bundle the diffusion model, Text Encoder, and VAE in a single file (available for Base, 8-Step, and 4-Step).", |
| "Two text encoders are included: the standard Z-Image one (default) and BennyDaBall's Engineer V4 (alternative).", |
| "The diffusers/ subfolder is a full diffusers-format checkpoint loadable via ZImagePipeline.from_pretrained(repo, subfolder='diffusers')." |
| ] |
| } |
|
|