diff --git a/docs/Flows/HunyuanDiT.rst b/docs/Flows/HunyuanDiT.rst new file mode 100644 index 0000000..b4d34cc --- /dev/null +++ b/docs/Flows/HunyuanDiT.rst @@ -0,0 +1,32 @@ +.. _HunyuanDiT: + +HunyuanDiT +========== + +Powerful Multi-Resolution Diffusion Transformer with Fine-Grained Chinese Understanding. + +A solid model that natively supports very high **Vibrancy** values. + +Hardware +"""""""" + +- **Required memory: 12 GB** + +Time to generate 1 image (30 steps): + +- AMD 7900 XTX: **40 sec** + +Examples +"""""""" + +.. image:: /FlowsResults/HunyuanDiT_1.png + +Prompt: "*portrait of a majestic insect*" (Vibrancy: 7, Steps: 60) + +.. image:: /FlowsResults/HunyuanDiT_2.png + +Prompt: "*close portrait of happy girl on the great wall*" (Vibrancy: 7, Steps: 60) + +.. image:: /FlowsResults/HunyuanDiT_3.png + +Prompt: "*portrait of a black pug on the yellow grass*" (Vibrancy: 6, Steps: 30) diff --git a/docs/Flows/index.rst b/docs/Flows/index.rst index 0bafd25..23aea94 100644 --- a/docs/Flows/index.rst +++ b/docs/Flows/index.rst @@ -13,6 +13,7 @@ Available Flows Colorful_XL Mobius_XL Stable_Cascade + HunyuanDiT SD3_Medium VintagePortrait Photomaker_1 diff --git a/docs/FlowsResults/HunyuanDiT_1.png b/docs/FlowsResults/HunyuanDiT_1.png new file mode 100644 index 0000000..508c3f2 Binary files /dev/null and b/docs/FlowsResults/HunyuanDiT_1.png differ diff --git a/docs/FlowsResults/HunyuanDiT_2.png b/docs/FlowsResults/HunyuanDiT_2.png new file mode 100644 index 0000000..eef9fe0 Binary files /dev/null and b/docs/FlowsResults/HunyuanDiT_2.png differ diff --git a/docs/FlowsResults/HunyuanDiT_3.png b/docs/FlowsResults/HunyuanDiT_3.png new file mode 100644 index 0000000..99b2c7b Binary files /dev/null and b/docs/FlowsResults/HunyuanDiT_3.png differ diff --git a/flows/hunyuan_dit.json b/flows/hunyuan_dit.json new file mode 100644 index 0000000..c352b06 --- /dev/null +++ b/flows/hunyuan_dit.json @@ -0,0 +1,201 @@ +{ + "2": { + "inputs": { + "ckpt_name": "hunyuan_dit_1.2.safetensors" + 
}, + "class_type": "CheckpointLoaderSimple", + "_meta": { + "title": "Load Checkpoint" + } + }, + "116": { + "inputs": { + "samples": [ + "298", + 0 + ], + "vae": [ + "2", + 2 + ] + }, + "class_type": "VAEDecode", + "_meta": { + "title": "VAE Decode" + } + }, + "244": { + "inputs": { + "width": 1024, + "height": 1024, + "batch_size": 1 + }, + "class_type": "EmptyLatentImage", + "_meta": { + "title": "Empty Latent Image" + } + }, + "267": { + "inputs": { + "filename_prefix": "base", + "images": [ + "116", + 0 + ] + }, + "class_type": "SaveImage", + "_meta": { + "title": "Save Image" + } + }, + "291": { + "inputs": { + "name": "hunyuan_dit", + "display_name": "HunyuanDiT", + "description": "Model with Chinese Understanding ", + "author": "bigcat88", + "homepage": "https://huggingface.co/Tencent-Hunyuan/HunyuanDiT", + "documentation": "https://visionatrix.github.io/VixFlowsDocs/Flows/HunyuanDiT.html", + "license": "", + "tags": "[\"general\", \"simple\"]", + "version": "1.0.0", + "requires": "[]", + "is_seed_supported": true, + "is_count_supported": true + }, + "class_type": "VixUiWorkflowMetadata", + "_meta": { + "title": "VixUI-WorkflowMetadata" + } + }, + "292": { + "inputs": { + "text": "", + "display_name": "Prompt", + "optional": false, + "advanced": false, + "order": 1, + "custom_id": "prompt" + }, + "class_type": "VixUiPrompt", + "_meta": { + "title": "VixUI-Prompt" + } + }, + "293": { + "inputs": { + "text": "", + "display_name": "Negative Prompt", + "optional": true, + "advanced": true, + "order": 15, + "custom_id": "negative_prompt" + }, + "class_type": "VixUiPrompt", + "_meta": { + "title": "VixUI-Prompt" + } + }, + "294": { + "inputs": { + "text": [ + "293", + 0 + ], + "clip": [ + "2", + 1 + ] + }, + "class_type": "CLIPTextEncode", + "_meta": { + "title": "CLIP Text Encode (Negative Prompt)" + } + }, + "295": { + "inputs": { + "text": [ + "292", + 0 + ], + "clip": [ + "2", + 1 + ] + }, + "class_type": "CLIPTextEncode", + "_meta": { + "title": "CLIP Text 
Encode (Positive Prompt)" + } + }, + "298": { + "inputs": { + "seed": 1, + "steps": [ + "300", + 0 + ], + "cfg": [ + "308", + 0 + ], + "sampler_name": "euler", + "scheduler": "sgm_uniform", + "denoise": 1, + "model": [ + "2", + 0 + ], + "positive": [ + "295", + 0 + ], + "negative": [ + "294", + 0 + ], + "latent_image": [ + "244", + 0 + ] + }, + "class_type": "KSampler", + "_meta": { + "title": "KSampler" + } + }, + "300": { + "inputs": { + "value": 30, + "display_name": "Steps number to generate", + "optional": true, + "advanced": true, + "min": 20, + "max": 60, + "step": 1, + "order": 91, + "custom_id": "steps_count" + }, + "class_type": "VixUiRangeInt", + "_meta": { + "title": "VixUI-RangeInt" + } + }, + "308": { + "inputs": { + "value": 6, + "display_name": "Vibrancy", + "optional": true, + "advanced": true, + "min": 2, + "max": 15, + "step": 0.1, + "order": 90, + "custom_id": "vibrancy" + }, + "class_type": "VixUiRangeFloat", + "_meta": { + "title": "VixUI-RangeFloat" + } + } +} diff --git a/models_catalog.json b/models_catalog.json index 32eff49..dd5aeb6 100644 --- a/models_catalog.json +++ b/models_catalog.json @@ -694,5 +694,17 @@ "url": "https://huggingface.co/comfyanonymous/flux_RealismLora_converted_comfyui/resolve/main/flux_realism_lora.safetensors", "homepage": "https://huggingface.co/XLabs-AI/flux-RealismLora", "hash": "379e73dccfb57822ee3b12f374e141ce1c79a13b7ff19da4219ef2a2a610038e" + }, + "HunyuanDiT": { + "regexes": [ + { + "input_value": "^(?=.*(?i:hunyuan_dit_1\\.2))(?=.*(?i:safetensors)).*", + "input_name": "^(?!.*(?i:lora)).*" + } + ], + "save_path": "checkpoints/hunyuan_dit_1.2.safetensors", + "url": "https://huggingface.co/comfyanonymous/hunyuan_dit_comfyui/resolve/main/hunyuan_dit_1.2.safetensors", + "homepage": "https://huggingface.co/Tencent-Hunyuan/HunyuanDiT", + "hash": "4fb84f84079cda457d171b3c6b15d1be95b5a3e5d9825703951a99ddf92d1787" } }