diff --git a/docs.json b/docs.json index 10389024..60fa09d6 100644 --- a/docs.json +++ b/docs.json @@ -164,7 +164,10 @@ }, { "group": "Z-Image", - "pages": ["tutorials/image/z-image/z-image-turbo"] + "pages": [ + "tutorials/image/z-image/z-image", + "tutorials/image/z-image/z-image-turbo" + ] }, { "group": "HiDream", @@ -868,7 +871,10 @@ }, { "group": "Z-Image", - "pages": ["zh-CN/tutorials/image/z-image/z-image-turbo"] + "pages": [ + "zh-CN/tutorials/image/z-image/z-image", + "zh-CN/tutorials/image/z-image/z-image-turbo" + ] }, { "group": "Ovis", diff --git a/tutorials/image/z-image/z-image-turbo.mdx b/tutorials/image/z-image/z-image-turbo.mdx index 139c5bcf..d7953696 100644 --- a/tutorials/image/z-image/z-image-turbo.mdx +++ b/tutorials/image/z-image/z-image-turbo.mdx @@ -1,7 +1,7 @@ --- -title: "Z-Image ComfyUI Workflow Example" -description: "Z-Image is a 6B parameter efficient image generation foundation model with single-stream diffusion transformer, offering sub-second inference latency." -sidebarTitle: "Z-Image" +title: "Z-Image-Turbo ComfyUI Workflow Example" +description: "Z-Image-Turbo is a distilled 6B parameter efficient image generation model with sub-second inference latency." +sidebarTitle: "Z-Image-Turbo" --- import UpdateReminder from '/snippets/tutorials/update-reminder.mdx' @@ -27,31 +27,32 @@ import UpdateReminder from '/snippets/tutorials/update-reminder.mdx' ## Z-Image-Turbo text-to-image workflow - -

Download JSON Workflow File

-
- - -

Run on ComfyUI Cloud

-
+ + + Download the Z-Image-Turbo text-to-image workflow JSON file. + + + Run this workflow directly on ComfyUI Cloud. + + -## Model links - -**text_encoders** - -- [qwen_3_4b.safetensors](https://huggingface.co/Comfy-Org/z_image_turbo/resolve/main/split_files/text_encoders/qwen_3_4b.safetensors) - -**diffusion_models** +### Z-Image-Turbo model downloads -- [z_image_turbo_bf16.safetensors](https://huggingface.co/Comfy-Org/z_image_turbo/resolve/main/split_files/diffusion_models/z_image_turbo_bf16.safetensors) + + + Text encoder for Z-Image-Turbo. + + + Diffusion model for Z-Image-Turbo. + + + VAE for Z-Image-Turbo. + + -**vae** - -- [ae.safetensors](https://huggingface.co/Comfy-Org/z_image_turbo/resolve/main/split_files/vae/ae.safetensors) - -**Model Storage Location** +**Z-Image-Turbo Model Storage Location** ``` 📂 ComfyUI/ @@ -68,15 +69,19 @@ import UpdateReminder from '/snippets/tutorials/update-reminder.mdx' This workflow uses the Z-Image-Turbo Fun Union ControlNet model to generate images with ControlNet guidance. It applies Canny edge detection to a reference image and uses the ControlNet to guide the generation process. - -

Download JSON Workflow File

-
+ + + Download the Z-Image-Turbo Fun Union ControlNet workflow JSON file. + + ### Additional model for ControlNet -**model_patches** - -- [Z-Image-Turbo-Fun-Controlnet-Union.safetensors](https://huggingface.co/alibaba-pai/Z-Image-Turbo-Fun-Controlnet-Union/resolve/main/Z-Image-Turbo-Fun-Controlnet-Union.safetensors) + + + ControlNet model patch for Z-Image-Turbo. + + **Model Storage Location** diff --git a/tutorials/image/z-image/z-image.mdx b/tutorials/image/z-image/z-image.mdx new file mode 100644 index 00000000..5fa2b66d --- /dev/null +++ b/tutorials/image/z-image/z-image.mdx @@ -0,0 +1,62 @@ +--- +title: "Z-Image ComfyUI Workflow Example" +description: "Z-Image is an efficient 6B-parameter image generation foundation model built on a single-stream diffusion transformer, designed for community-driven fine-tuning and custom development." +sidebarTitle: "Z-Image" +--- + +import UpdateReminder from '/snippets/tutorials/update-reminder.mdx' + +**Z-Image (造相)** is a powerful and highly efficient image generation model with **6B** parameters, developed by Alibaba's Tongyi Lab. It uses a **Scalable Single-Stream DiT** (S3-DiT) architecture where text, visual semantic tokens, and image VAE tokens are concatenated at the sequence level to serve as a unified input stream, maximizing parameter efficiency. + +Z-Image (Base) is the non-distilled foundation model designed for community-driven fine-tuning and custom development.
+ +**Model Highlights**: +- **Photorealistic Quality**: Delivers strong photorealistic image generation while maintaining excellent aesthetic quality +- **Accurate Bilingual Text Rendering**: Excels at accurately rendering complex Chinese and English text +- **Prompt Enhancing & Reasoning**: Prompt Enhancer empowers the model with reasoning capabilities +- **Fine-tuning Ready**: Ideal base model for custom training and adaptation + +**Related Links**: +- [GitHub](https://github.com/Tongyi-MAI/Z-Image) +- [Hugging Face](https://huggingface.co/Tongyi-MAI/Z-Image) +- [ModelScope](https://modelscope.cn/models/Tongyi-MAI/Z-Image) + +## Z-Image text-to-image workflow + + + + Download the Z-Image text-to-image workflow JSON file. + + + Run this workflow directly on ComfyUI Cloud. + + + + + +## Z-Image model downloads + + + + Text encoder for Z-Image. + + + Diffusion model for Z-Image. + + + VAE for Z-Image. + + + +**Model Storage Location** + +``` +📂 ComfyUI/ +├── 📂 models/ +│ ├── 📂 text_encoders/ +│ │ └── qwen_3_4b.safetensors +│ ├── 📂 diffusion_models/ +│ │ └── z_image_bf16.safetensors +│ └── 📂 vae/ +│ └── ae.safetensors +``` diff --git a/zh-CN/tutorials/image/z-image/z-image-turbo.mdx b/zh-CN/tutorials/image/z-image/z-image-turbo.mdx index c22d6f68..020c184f 100644 --- a/zh-CN/tutorials/image/z-image/z-image-turbo.mdx +++ b/zh-CN/tutorials/image/z-image/z-image-turbo.mdx @@ -1,7 +1,7 @@ --- -title: "Z-Image ComfyUI 工作流示例" -description: "Z-Image 是一个拥有 6B 参数的高效图像生成基础模型,采用单流扩散变换器架构,可实现亚秒级推理延迟。" -sidebarTitle: "Z-Image" +title: "Z-Image-Turbo ComfyUI 工作流示例" +description: "Z-Image-Turbo 是一个蒸馏版 6B 参数高效图像生成模型,可实现亚秒级推理延迟。" +sidebarTitle: "Z-Image-Turbo" --- import UpdateReminder from '/snippets/zh/tutorials/update-reminder.mdx' @@ -27,31 +27,32 @@ import UpdateReminder from '/snippets/zh/tutorials/update-reminder.mdx' ## Z-Image-Turbo 文生图工作流 - -

下载 JSON 工作流文件

-
- - -

在 ComfyUI Cloud 上运行

-
+ + + 下载 Z-Image-Turbo 文生图工作流 JSON 文件。 + + + 在 ComfyUI Cloud 上直接运行此工作流。 + + -## 模型链接 - -**text_encoders(文本编码器)** - -- [qwen_3_4b.safetensors](https://huggingface.co/Comfy-Org/z_image_turbo/resolve/main/split_files/text_encoders/qwen_3_4b.safetensors) - -**diffusion_models(扩散模型)** +### Z-Image-Turbo 模型下载 -- [z_image_turbo_bf16.safetensors](https://huggingface.co/Comfy-Org/z_image_turbo/resolve/main/split_files/diffusion_models/z_image_turbo_bf16.safetensors) + + + Z-Image-Turbo 文本编码器。 + + + Z-Image-Turbo 扩散模型。 + + + Z-Image-Turbo VAE。 + + -**vae** - -- [ae.safetensors](https://huggingface.co/Comfy-Org/z_image_turbo/resolve/main/split_files/vae/ae.safetensors) - -**模型存储位置** +**Z-Image-Turbo 模型存储位置** ``` 📂 ComfyUI/ @@ -68,15 +69,19 @@ import UpdateReminder from '/snippets/zh/tutorials/update-reminder.mdx' 此工作流使用 Z-Image-Turbo Fun Union ControlNet 模型生成带有 ControlNet 引导的图像。它对参考图像应用 Canny 边缘检测,并使用 ControlNet 来引导生成过程。 - -

下载 JSON 工作流文件

-
+ + + 下载 Z-Image-Turbo Fun Union ControlNet 工作流 JSON 文件。 + + ### ControlNet 所需的额外模型 -**model_patches(模型补丁)** - -- [Z-Image-Turbo-Fun-Controlnet-Union.safetensors](https://huggingface.co/alibaba-pai/Z-Image-Turbo-Fun-Controlnet-Union/resolve/main/Z-Image-Turbo-Fun-Controlnet-Union.safetensors) + + + Z-Image-Turbo ControlNet 模型补丁。 + + **模型存储位置** diff --git a/zh-CN/tutorials/image/z-image/z-image.mdx b/zh-CN/tutorials/image/z-image/z-image.mdx new file mode 100644 index 00000000..7d9d3f1a --- /dev/null +++ b/zh-CN/tutorials/image/z-image/z-image.mdx @@ -0,0 +1,62 @@ +--- +title: "Z-Image ComfyUI 工作流示例" +description: "Z-Image 是一个拥有 6B 参数的高效图像生成基础模型,采用单流扩散变换器架构,适用于社区驱动的微调和自定义开发。" +sidebarTitle: "Z-Image" +--- + +import UpdateReminder from '/snippets/zh/tutorials/update-reminder.mdx' + +**Z-Image(造相)** 是阿里巴巴通义实验室开发的一个强大且高效的图像生成模型,拥有 **6B** 参数。它采用 **可扩展单流 DiT**(S3-DiT)架构,将文本、视觉语义 token 和图像 VAE token 在序列级别进行拼接,作为统一的输入流,最大化参数效率。 + +Z-Image(Base)是非蒸馏基础模型,专为社区驱动的微调和自定义开发而设计。 + +**模型亮点**: +- **照片级真实质量**:在保持出色美学质量的同时,提供强大的照片级真实图像生成 +- **精准的双语文本渲染**:擅长准确渲染复杂的中英文文本 +- **提示词增强与推理**:提示词增强器赋予模型推理能力 +- **微调就绪**:适合自定义训练和适配的理想基础模型 + +**相关链接**: +- [GitHub](https://github.com/Tongyi-MAI/Z-Image) +- [Hugging Face](https://huggingface.co/Tongyi-MAI/Z-Image) +- [ModelScope](https://modelscope.cn/models/Tongyi-MAI/Z-Image) + +## Z-Image 文生图工作流 + + + + 下载 Z-Image 文生图工作流 JSON 文件。 + + + 在 ComfyUI Cloud 上直接运行此工作流。 + + + + + +## Z-Image 模型下载 + + + + Z-Image 文本编码器。 + + + Z-Image 扩散模型。 + + + Z-Image VAE。 + + + +**模型存储位置** + +``` +📂 ComfyUI/ +├── 📂 models/ +│ ├── 📂 text_encoders/ +│ │ └── qwen_3_4b.safetensors +│ ├── 📂 diffusion_models/ +│ │ └── z_image_bf16.safetensors +│ └── 📂 vae/ +│ └── ae.safetensors +```