Update README
README.md CHANGED
@@ -168,7 +168,7 @@ pip install flashinfer-python==0.5.0
 ```bash
 # Download from HuggingFace and rename the directory.
 # Notice that the directory name should not contain dots, which may cause issues when loading using Transformers.
-hf download tencent/HunyuanImage-3.0-Instruct --local-dir ./HunyuanImage-3-Instruct
+hf download tencent/HunyuanImage-3.0-Instruct-Distil --local-dir ./HunyuanImage-3-Instruct-Distil
 ```
 
 ##### 2️⃣ Run with Transformers
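The rename in this hunk exists because Transformers can mishandle checkpoint directory names containing dots. As a rough sketch of that mapping (the helper name is hypothetical, not part of the repo):

```python
def local_dir_for(repo_id: str) -> str:
    """Hypothetical helper: derive a dot-free local directory name
    from a HuggingFace repo id, as the README's rename step does."""
    name = repo_id.split("/")[-1]            # e.g. "HunyuanImage-3.0-Instruct-Distil"
    # Drop the dotted version segment so Transformers can load the path:
    return "./" + name.replace("3.0", "3")

print(local_dir_for("tencent/HunyuanImage-3.0-Instruct-Distil"))
# → ./HunyuanImage-3-Instruct-Distil
```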
@@ -177,8 +177,8 @@ hf download tencent/HunyuanImage-3.0-Instruct --local-dir ./HunyuanImage-3-Instr
 from transformers import AutoModelForCausalLM
 
 # Load the model
-model_id = "./HunyuanImage-3-Instruct"
-# Currently we can not load the model using HF model_id `tencent/HunyuanImage-3.0-Instruct` directly
+model_id = "./HunyuanImage-3-Instruct-Distil"
+# Currently we can not load the model using HF model_id `tencent/HunyuanImage-3.0-Instruct-Distil` directly
 # due to the dot in the name.
 
 kwargs = dict(
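This hunk only swaps the checkpoint path; a minimal sketch of the surrounding loading pattern follows. The `from_pretrained` call is shown commented because it needs the downloaded weights, and the contents of `kwargs` are elided in this hunk:

```python
from pathlib import Path

model_id = "./HunyuanImage-3-Instruct-Distil"

# The directory name must stay dot-free for Transformers to load it:
assert "." not in Path(model_id).name

# from transformers import AutoModelForCausalLM
# model = AutoModelForCausalLM.from_pretrained(model_id, **kwargs)
```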
@@ -208,7 +208,7 @@ cot_text, samples = model.generate_image(
     use_system_prompt="en_unified",
     bot_task="think_recaption",  # Use "think_recaption" for reasoning and enhancement
     infer_align_image_size=True,  # Align output image size to input image size
-    diff_infer_steps=
+    diff_infer_steps=8,
     verbose=2
 )
 
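The changed call above, sketched as a plain dict so the distilled model's step count is explicit. The `generate_image` call itself needs the loaded model and the arguments elided from this hunk, so it is shown commented:

```python
# Sampling settings from the hunk above; diff_infer_steps=8 is the
# recommended step count for the -Distil checkpoint.
gen_kwargs = dict(
    use_system_prompt="en_unified",
    bot_task="think_recaption",   # reasoning + prompt enhancement
    infer_align_image_size=True,  # align output size to the input image
    diff_infer_steps=8,           # 8 diffusion steps for the distilled model
    verbose=2,
)
# cot_text, samples = model.generate_image(..., **gen_kwargs)
```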
@@ -216,31 +216,6 @@ cot_text, samples = model.generate_image(
 samples[0].save("image_edit.png")
 ```
 
-#### 🏠 Local Installation & Usage
-
-##### 1️⃣ Clone the Repository
-
-```bash
-git clone https://github.com/Tencent-Hunyuan/HunyuanImage-3.0.git
-cd HunyuanImage-3.0/
-```
-
-##### 2️⃣ Download Model Weights
-
-```bash
-# Download from HuggingFace
-hf download tencent/HunyuanImage-3.0-Instruct --local-dir ./HunyuanImage-3-Instruct
-```
-
-##### 3️⃣ Run the Demo
-
-More demos in `run_demo_instruct.sh`.
-
-```bash
-export MODEL_PATH="./HunyuanImage-3-Instruct"
-bash run_demo_instruct.sh
-```
-
 ##### 4️⃣ Command Line Arguments
 
 | Arguments | Description | Recommended |
@@ -263,18 +238,6 @@ bash run_demo_instruct.sh
 | `--max_new_tokens` | Maximum number of new tokens to generate | `2048` |
 | `--use-taylor-cache` | Use Taylor Cache when sampling | `False` |
 
-##### 5️⃣ For fewer Sampling Steps
-
-We recommend using the model [HunyuanImage-3.0-Instruct-Distil](https://huggingface.co/tencent/HunyuanImage-3.0-Instruct-Distil) with `--diff-infer-steps 8`, while keeping all other recommended parameter values **unchanged**.
-
-```bash
-# Download HunyuanImage-3.0-Instruct-Distil from HuggingFace
-hf download tencent/HunyuanImage-3.0-Instruct-Distil --local-dir ./HunyuanImage-3-Instruct-Distil
-
-# Run the demo with 8 steps to samples
-export MODEL_PATH="./HunyuanImage-3-Instruct-Distil"
-bash run_demo_instruct_Distil.sh
-```
-
 <details>
 <summary> Previous Version (Pure Text-to-Image) </summary>
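The arguments table maps onto the demo script's CLI. A purely illustrative argparse mirror of the two rows visible in this hunk's context (flag spellings and recommended values are taken from the table; the real script may define its parser differently):

```python
import argparse

# Illustrative parser for the two documented flags; recommended
# values from the table are used as defaults.
parser = argparse.ArgumentParser()
parser.add_argument("--max_new_tokens", type=int, default=2048)
parser.add_argument("--use-taylor-cache", action="store_true")  # defaults to False

args = parser.parse_args([])
print(args.max_new_tokens, args.use_taylor_cache)
# → 2048 False
```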