passenger12138 commited on
Commit
8816b1e
·
0 Parent(s):
.gitattributes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ transform2venom.safetensors filter=lfs diff=lfs merge=lfs -text
2
+ *.mp4 filter=lfs diff=lfs merge=lfs -text
3
+ *.png filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,170 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ language:
4
+ - en
5
+ base_model:
6
+ - Wan-AI/Wan2.1-I2V-14B-480P
7
+ - Wan-AI/Wan2.1-I2V-14B-480P-Diffusers
8
+ pipeline_tag: image-to-video
9
+ tags:
10
+ - image-to-video
11
+ - lora
12
+ - diffusers
13
+ - template:diffusion-lora
14
+
15
+ widget:
16
+ - text: >-
17
+ "The video begins with a anime young character with long hair. 5en3m venom transformation. Transform into a venom character transformation. Venom is depicted with his iconic black symbiote body, large white eyes with black pupils, sharp teeth, and a menacing expression. The transformation is smooth and seamless, blending the human figure with the monstrous ."
18
+ output:
19
+ url: example_videos/9_epoch40.mp4
20
+ - text: >-
21
+ The video begins with a woman wearing black clothes. 5en3m venom transformation. Transform into a venom character transformation. Venom is depicted with his iconic black symbiote body, large white eyes with black pupils, sharp teeth, and a menacing expression. The transformation is smooth and seamless, blending the human figure with the monstrous .
22
+ output:
23
+ url: example_videos/8_epoch40.mp4
24
+ - text: >-
25
+ The video begins with a man wearing a suit. 5en3m venom transformation. Transform into a venom character transformation. Venom is depicted with his iconic black symbiote body, large white eyes with black pupils, sharp teeth, and a menacing expression.The transformation is smooth and seamless, blending the human figure with the monstrous .
26
+ output:
27
+ url: example_videos/10_epoch40.mp4
28
+ ---
29
+
30
+ <div style="background-color: #f8f9fa; padding: 20px; border-radius: 10px; margin-bottom: 20px;">
31
+ <h1 style="color: #24292e; margin-top: 0;">Transform to Venom Effect LoRA for Wan2.1 14B I2V 480p</h1>
32
+
33
+ <div style="background-color: white; padding: 15px; border-radius: 8px; margin: 15px 0; box-shadow: 0 2px 4px rgba(0,0,0,0.1);">
34
+ <h2 style="color: #24292e; margin-top: 0;">Overview</h2>
35
+ <p>This LoRA is trained on the Wan2.1 14B I2V 480p model and lets you transform the subject of any image into Venom. The effect works on a wide variety of subjects, from animals to vehicles to people!</p>
36
+ </div>
37
+
38
+ <div style="background-color: white; padding: 15px; border-radius: 8px; margin: 15px 0; box-shadow: 0 2px 4px rgba(0,0,0,0.1);">
39
+ <h2 style="color: #24292e; margin-top: 0;">Features</h2>
40
+ <ul style="margin-bottom: 0;">
41
+ <li>Transform any image into a video of its subject turning into Venom</li>
42
+ <li>Trained on the Wan2.1 14B 480p I2V base model</li>
43
+ <li>Consistent results across different object types</li>
44
+ <li>Simple prompt structure that's easy to adapt</li>
45
+ </ul>
46
+ </div>
47
+
48
+ </div>
49
+
50
+ <Gallery />
51
+
52
+ # Model File and Inference Workflow
53
+
54
+ ## 📥 Download Links:
55
+
56
+ - [transform2venom.safetensors](./transform2venom.safetensors) - LoRA Model File
57
+ - [wan_img2video_lora_workflow.json](./workflow/wan_img2video_lora_workflow.json) - Wan I2V with LoRA Workflow for ComfyUI
58
+
59
+ ## Using with Diffusers
60
+ ```bash
61
+ pip install git+https://github.com/huggingface/diffusers.git
62
+ ```
63
+
64
+ ```py
65
# Image-to-video inference with the Wan2.1 I2V 14B 480P Diffusers pipeline and
# the Transform2Venom LoRA. Requires a CUDA GPU and the diffusers build
# installed above.
import numpy as np
import torch
from diffusers import AutoencoderKLWan, UniPCMultistepScheduler, WanImageToVideoPipeline
from diffusers.utils import export_to_video, load_image
from transformers import CLIPVisionModel

model_id = "Wan-AI/Wan2.1-I2V-14B-480P-Diffusers"

# The image encoder and VAE are loaded in float32; the rest of the pipeline
# is loaded in bfloat16 below.
image_encoder = CLIPVisionModel.from_pretrained(
    model_id, subfolder="image_encoder", torch_dtype=torch.float32
)
vae = AutoencoderKLWan.from_pretrained(model_id, subfolder="vae", torch_dtype=torch.float32)

# Note: choose the UniPC scheduler to generate higher quality videos for Wan.
flow_shift = 3.0  # 5.0 for 720P, 3.0 for 480P
scheduler = UniPCMultistepScheduler(
    prediction_type="flow_prediction",
    use_flow_sigmas=True,
    num_train_timesteps=1000,
    flow_shift=flow_shift,
)

pipe = WanImageToVideoPipeline.from_pretrained(
    model_id, vae=vae, image_encoder=image_encoder, torch_dtype=torch.bfloat16
)
# Attach the scheduler configured above; otherwise the pipeline keeps its
# default scheduler and flow_shift has no effect.
pipe.scheduler = scheduler

pipe.load_lora_weights("passenger12138/Transform2Venom")

# For low-VRAM environments: model CPU offload manages device placement itself,
# so the pipeline is not moved to "cuda" first. If you have enough VRAM,
# replace this line with `pipe.to("cuda")`.
pipe.enable_model_cpu_offload()

prompt = "The video begins with a man wearing a suit. 5en3m venom transformation. Transform into a venom character transformation. Venom is depicted with his iconic black symbiote body, large white eyes with black pupils, sharp teeth, and a menacing expression. The transformation is smooth and seamless, blending the human figure with the monstrous ."

# One of the sample images shipped in this repository; any input image works.
image = load_image("./test_i2vlora_imgs/10.png")

# Resize to roughly 480x832 pixels of area while keeping the aspect ratio,
# rounding each side down to a multiple of the VAE spatial scale factor
# times the transformer patch size.
max_area = 480 * 832
aspect_ratio = image.height / image.width
mod_value = pipe.vae_scale_factor_spatial * pipe.transformer.config.patch_size[1]
height = round(np.sqrt(max_area * aspect_ratio)) // mod_value * mod_value
width = round(np.sqrt(max_area / aspect_ratio)) // mod_value * mod_value
image = image.resize((width, height))

output = pipe(
    image=image,
    prompt=prompt,
    height=height,
    width=width,
    num_frames=81,
    guidance_scale=5.0,
    num_inference_steps=28,
).frames[0]
export_to_video(output, "output.mp4", fps=16)
112
+ ```
113
+
114
+ ---
115
+ <div style="background-color: #f8f9fa; padding: 20px; border-radius: 10px; margin-bottom: 20px;">
116
+ <div style="background-color: white; padding: 15px; border-radius: 8px; margin: 15px 0; box-shadow: 0 2px 4px rgba(0,0,0,0.1);">
117
+ <h2 style="color: #24292e; margin-top: 0;">Recommended Settings</h2>
118
+ <ul style="margin-bottom: 0;">
119
+ <li><b>LoRA Strength:</b> 1.0</li>
120
+ <li><b>Embedded Guidance Scale:</b> 6.0</li>
121
+ <li><b>Flow Shift:</b> 3.0</li>
122
+ </ul>
123
+ </div>
124
+
125
+ <div style="background-color: white; padding: 15px; border-radius: 8px; margin: 15px 0; box-shadow: 0 2px 4px rgba(0,0,0,0.1);">
126
+ <h2 style="color: #24292e; margin-top: 0;">Trigger Words</h2>
127
+ <p>The key trigger phrase is: <code style="background-color: #f0f0f0; padding: 3px 6px; border-radius: 4px;">5en3m venom transformation.</code></p>
128
+ </div>
129
+
130
+ <div style="background-color: white; padding: 15px; border-radius: 8px; margin: 15px 0; box-shadow: 0 2px 4px rgba(0,0,0,0.1);">
131
+ <h2 style="color: #24292e; margin-top: 0;">Prompt Template</h2>
132
+ <p>For best results, use this prompt structure:</p>
133
+ <div style="background-color: #f0f0f0; padding: 12px; border-radius: 6px; margin: 10px 0;">
134
+ <i>The video begins with a [object]. 5en3m venom transformation. Transform into a venom character transformation. Venom is depicted with his iconic black symbiote body, large white eyes with black pupils, sharp teeth, and a menacing expression. The transformation is smooth and seamless, blending the human figure with the monstrous .</i>
135
+ </div>
136
+ <p>Simply replace <code style="background-color: #f0f0f0; padding: 3px 6px; border-radius: 4px;">[object]</code> with whatever you want to see transform into Venom!</p>
137
+ </div>
138
+
139
+ <div style="background-color: white; padding: 15px; border-radius: 8px; margin: 15px 0; box-shadow: 0 2px 4px rgba(0,0,0,0.1);">
140
+ <h2 style="color: #24292e; margin-top: 0;">ComfyUI Workflow</h2>
141
+ <p>This LoRA works with a modified version of <a href="https://github.com/kijai/ComfyUI-WanVideoWrapper/blob/main/example_workflows/wanvideo_480p_I2V_example_02.json" style="color: #0366d6; text-decoration: none;">Kijai's Wan Video Wrapper workflow</a>. The main modification is adding a Wan LoRA node connected to the base model.</p>
142
+
143
+ </div>
144
+ </div>
145
+
146
+ <div style="background-color: #f8f9fa; padding: 20px; border-radius: 10px; margin-bottom: 20px;">
147
+ <div style="background-color: white; padding: 15px; border-radius: 8px; margin: 15px 0; box-shadow: 0 2px 4px rgba(0,0,0,0.1);">
148
+ <h2 style="color: #24292e; margin-top: 0;">Model Information</h2>
149
+ <p>The model weights are available in Safetensors format. See the Download Links section above.</p>
150
+ </div>
151
+
152
+ <div style="background-color: white; padding: 15px; border-radius: 8px; margin: 15px 0; box-shadow: 0 2px 4px rgba(0,0,0,0.1);">
153
+ <h2 style="color: #24292e; margin-top: 0;">Training Details</h2>
154
+ <ul style="margin-bottom: 0;">
155
+ <li><b>Base Model:</b> Wan2.1 14B I2V 480p</li>
156
+ <li><b>Training Data:</b> 1.5 minutes of video (40 short clips of subjects transforming into Venom)</li>
157
+ <li><b>Epochs:</b> 40</li>
158
+ </ul>
159
+ </div>
160
+
161
+ <div style="background-color: white; padding: 15px; border-radius: 8px; margin: 15px 0; box-shadow: 0 2px 4px rgba(0,0,0,0.1);">
162
+ <h2 style="color: #24292e; margin-top: 0;">Additional Information</h2>
163
+ <p>Training was done using <a href="https://github.com/tdrussell/diffusion-pipe" style="color: #0366d6; text-decoration: none;">Diffusion Pipe for Training</a></p>
164
+ </div>
165
+
166
+ <div style="background-color: white; padding: 15px; border-radius: 8px; margin: 15px 0; box-shadow: 0 2px 4px rgba(0,0,0,0.1);">
167
+ <h2 style="color: #24292e; margin-top: 0;">Acknowledgments</h2>
168
+ <p style="margin-bottom: 0;">Special thanks to Kijai for the ComfyUI Wan Video Wrapper, to tdrussell for the training scripts, and to RemadeAI for some of the example cases!</p>
169
+ </div>
170
+ </div>
example_videos/10_epoch40.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b0251f9c00ea7134b62c0a548e285ccb8ec33a722c1db872033dc80f28739a0
3
+ size 635170
example_videos/8_epoch40.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:715c1dfac41efa23a0f659856f8a8dfc302e654f4e67a6bbe4edb70a10678ed5
3
+ size 615331
example_videos/9_epoch40.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:740bdcce497d572900cee0c4885ea479380c245507ca2092847a03c3795c2516
3
+ size 749864
test_i2vlora_imgs/10.png ADDED

Git LFS Details

  • SHA256: 57dd823435b9d9539e9e81b71803c431b8c1886818f856ada5e75d6184c3570e
  • Pointer size: 132 Bytes
  • Size of remote file: 1.58 MB
test_i2vlora_imgs/8.png ADDED

Git LFS Details

  • SHA256: f18e4f4e10d2b4b536aded0d5ffb64615cf144ef667aeca6507c05822c93ca06
  • Pointer size: 132 Bytes
  • Size of remote file: 1.09 MB
test_i2vlora_imgs/9.png ADDED

Git LFS Details

  • SHA256: 57dd8c2ff4395e6cba03c27e5042c0bb85ad5df0342550ec35ea0a676bfe589f
  • Pointer size: 132 Bytes
  • Size of remote file: 2.13 MB
transform2venom.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0ad3ded26790df8a4c6dd9405403df6034135c81cf036f9e0ded4cf2cf2f378
3
+ size 359257680
workflow/wan_img2video_lora_workflow.json ADDED
@@ -0,0 +1,801 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "last_node_id": 43,
3
+ "last_link_id": 42,
4
+ "nodes": [
5
+ {
6
+ "id": 11,
7
+ "type": "LoadWanVideoT5TextEncoder",
8
+ "pos": [
9
+ 389.7322998046875,
10
+ -13.508200645446777
11
+ ],
12
+ "size": [
13
+ 377.1661376953125,
14
+ 130
15
+ ],
16
+ "flags": {},
17
+ "order": 0,
18
+ "mode": 0,
19
+ "inputs": [],
20
+ "outputs": [
21
+ {
22
+ "name": "wan_t5_model",
23
+ "type": "WANTEXTENCODER",
24
+ "links": [
25
+ 15
26
+ ],
27
+ "slot_index": 0
28
+ }
29
+ ],
30
+ "properties": {
31
+ "Node name for S&R": "LoadWanVideoT5TextEncoder"
32
+ },
33
+ "widgets_values": [
34
+ "umt5-xxl-enc-bf16.safetensors",
35
+ "bf16",
36
+ "offload_device",
37
+ "disabled"
38
+ ]
39
+ },
40
+ {
41
+ "id": 13,
42
+ "type": "LoadWanVideoClipTextEncoder",
43
+ "pos": [
44
+ 270.7287902832031,
45
+ 165.3174591064453
46
+ ],
47
+ "size": [
48
+ 510.6601257324219,
49
+ 106
50
+ ],
51
+ "flags": {},
52
+ "order": 1,
53
+ "mode": 0,
54
+ "inputs": [],
55
+ "outputs": [
56
+ {
57
+ "name": "wan_clip_model",
58
+ "type": "WANCLIP",
59
+ "links": [
60
+ 17
61
+ ],
62
+ "slot_index": 0
63
+ }
64
+ ],
65
+ "properties": {
66
+ "Node name for S&R": "LoadWanVideoClipTextEncoder"
67
+ },
68
+ "widgets_values": [
69
+ "open-clip-xlm-roberta-large-vit-huge-14_fp16.safetensors",
70
+ "fp16",
71
+ "offload_device"
72
+ ]
73
+ },
74
+ {
75
+ "id": 21,
76
+ "type": "WanVideoVAELoader",
77
+ "pos": [
78
+ 310.204833984375,
79
+ 320.3585510253906
80
+ ],
81
+ "size": [
82
+ 441.94390869140625,
83
+ 90.83087158203125
84
+ ],
85
+ "flags": {},
86
+ "order": 2,
87
+ "mode": 0,
88
+ "inputs": [],
89
+ "outputs": [
90
+ {
91
+ "name": "vae",
92
+ "type": "WANVAE",
93
+ "links": [
94
+ 21,
95
+ 34
96
+ ],
97
+ "slot_index": 0
98
+ }
99
+ ],
100
+ "properties": {
101
+ "Node name for S&R": "WanVideoVAELoader"
102
+ },
103
+ "widgets_values": [
104
+ "Wan2_1_VAE_bf16.safetensors",
105
+ "fp16"
106
+ ]
107
+ },
108
+ {
109
+ "id": 28,
110
+ "type": "WanVideoDecode",
111
+ "pos": [
112
+ 1220.4002685546875,
113
+ 371.8823547363281
114
+ ],
115
+ "size": [
116
+ 315,
117
+ 174
118
+ ],
119
+ "flags": {},
120
+ "order": 14,
121
+ "mode": 0,
122
+ "inputs": [
123
+ {
124
+ "name": "vae",
125
+ "type": "WANVAE",
126
+ "link": 34
127
+ },
128
+ {
129
+ "name": "samples",
130
+ "type": "LATENT",
131
+ "link": 33
132
+ }
133
+ ],
134
+ "outputs": [
135
+ {
136
+ "name": "images",
137
+ "type": "IMAGE",
138
+ "links": [
139
+ 36
140
+ ],
141
+ "slot_index": 0
142
+ }
143
+ ],
144
+ "properties": {
145
+ "Node name for S&R": "WanVideoDecode"
146
+ },
147
+ "widgets_values": [
148
+ true,
149
+ 272,
150
+ 272,
151
+ 144,
152
+ 128
153
+ ]
154
+ },
155
+ {
156
+ "id": 34,
157
+ "type": "Note",
158
+ "pos": [
159
+ 904.7526245117188,
160
+ 562.6104736328125
161
+ ],
162
+ "size": [
163
+ 262.5184020996094,
164
+ 58
165
+ ],
166
+ "flags": {},
167
+ "order": 4,
168
+ "mode": 0,
169
+ "inputs": [],
170
+ "outputs": [],
171
+ "properties": {},
172
+ "widgets_values": [
173
+ "Under 81 frames doesn't seem to work?"
174
+ ],
175
+ "color": "#432",
176
+ "bgcolor": "#653"
177
+ },
178
+ {
179
+ "id": 30,
180
+ "type": "VHS_VideoCombine",
181
+ "pos": [
182
+ 1633.1920166015625,
183
+ -278.24945068359375
184
+ ],
185
+ "size": [
186
+ 648.850341796875,
187
+ 976.850341796875
188
+ ],
189
+ "flags": {},
190
+ "order": 15,
191
+ "mode": 0,
192
+ "inputs": [
193
+ {
194
+ "name": "images",
195
+ "type": "IMAGE",
196
+ "link": 36
197
+ },
198
+ {
199
+ "name": "audio",
200
+ "type": "AUDIO",
201
+ "shape": 7,
202
+ "link": null
203
+ },
204
+ {
205
+ "name": "meta_batch",
206
+ "type": "VHS_BatchManager",
207
+ "shape": 7,
208
+ "link": null
209
+ },
210
+ {
211
+ "name": "vae",
212
+ "type": "VAE",
213
+ "shape": 7,
214
+ "link": null
215
+ }
216
+ ],
217
+ "outputs": [
218
+ {
219
+ "name": "Filenames",
220
+ "type": "VHS_FILENAMES",
221
+ "links": null
222
+ }
223
+ ],
224
+ "properties": {
225
+ "Node name for S&R": "VHS_VideoCombine"
226
+ },
227
+ "widgets_values": {
228
+ "frame_rate": 16,
229
+ "loop_count": 0,
230
+ "filename_prefix": "WanVideo2_1",
231
+ "format": "video/h264-mp4",
232
+ "pix_fmt": "yuv420p",
233
+ "crf": 19,
234
+ "save_metadata": true,
235
+ "trim_to_audio": false,
236
+ "pingpong": false,
237
+ "save_output": true,
238
+ "videopreview": {
239
+ "hidden": false,
240
+ "paused": false,
241
+ "params": {
242
+ "filename": "WanVideo2_1_00033.mp4",
243
+ "subfolder": "",
244
+ "type": "output",
245
+ "format": "video/h264-mp4",
246
+ "frame_rate": 16,
247
+ "workflow": "WanVideo2_1_00033.png",
248
+ "fullpath": "C:\\Users\\drini\\OneDrive\\Documents\\ComfyUI_windows_portable\\ComfyUI\\output\\WanVideo2_1_00033.mp4"
249
+ }
250
+ }
251
+ }
252
+ },
253
+ {
254
+ "id": 17,
255
+ "type": "WanVideoImageClipEncode",
256
+ "pos": [
257
+ 875.01025390625,
258
+ 278.4588623046875
259
+ ],
260
+ "size": [
261
+ 315,
262
+ 242
263
+ ],
264
+ "flags": {},
265
+ "order": 11,
266
+ "mode": 0,
267
+ "inputs": [
268
+ {
269
+ "name": "clip",
270
+ "type": "WANCLIP",
271
+ "link": 17
272
+ },
273
+ {
274
+ "name": "image",
275
+ "type": "IMAGE",
276
+ "link": 18
277
+ },
278
+ {
279
+ "name": "vae",
280
+ "type": "WANVAE",
281
+ "link": 21
282
+ }
283
+ ],
284
+ "outputs": [
285
+ {
286
+ "name": "image_embeds",
287
+ "type": "WANVIDIMAGE_EMBEDS",
288
+ "links": [
289
+ 32
290
+ ],
291
+ "slot_index": 0
292
+ }
293
+ ],
294
+ "properties": {
295
+ "Node name for S&R": "WanVideoImageClipEncode"
296
+ },
297
+ "widgets_values": [
298
+ 440,
299
+ 440,
300
+ 81,
301
+ true,
302
+ 0,
303
+ 1,
304
+ 1
305
+ ]
306
+ },
307
+ {
308
+ "id": 18,
309
+ "type": "LoadImage",
310
+ "pos": [
311
+ 473.90985107421875,
312
+ 451.8916931152344
313
+ ],
314
+ "size": [
315
+ 255.50192260742188,
316
+ 314
317
+ ],
318
+ "flags": {},
319
+ "order": 6,
320
+ "mode": 0,
321
+ "inputs": [],
322
+ "outputs": [
323
+ {
324
+ "name": "IMAGE",
325
+ "type": "IMAGE",
326
+ "links": [
327
+ 18
328
+ ]
329
+ },
330
+ {
331
+ "name": "MASK",
332
+ "type": "MASK",
333
+ "links": null
334
+ }
335
+ ],
336
+ "properties": {
337
+ "Node name for S&R": "LoadImage"
338
+ },
339
+ "widgets_values": [
340
+ "SN56-06-110121-P07-PikaChew-MD-1.jpg",
341
+ "image"
342
+ ]
343
+ },
344
+ {
345
+ "id": 27,
346
+ "type": "WanVideoSampler",
347
+ "pos": [
348
+ 1216.8856201171875,
349
+ -52.87528991699219
350
+ ],
351
+ "size": [
352
+ 315,
353
+ 330
354
+ ],
355
+ "flags": {},
356
+ "order": 13,
357
+ "mode": 0,
358
+ "inputs": [
359
+ {
360
+ "name": "model",
361
+ "type": "WANVIDEOMODEL",
362
+ "link": 29
363
+ },
364
+ {
365
+ "name": "text_embeds",
366
+ "type": "WANVIDEOTEXTEMBEDS",
367
+ "link": 30
368
+ },
369
+ {
370
+ "name": "image_embeds",
371
+ "type": "WANVIDIMAGE_EMBEDS",
372
+ "link": 32
373
+ },
374
+ {
375
+ "name": "samples",
376
+ "type": "LATENT",
377
+ "shape": 7,
378
+ "link": null
379
+ },
380
+ {
381
+ "name": "feta_args",
382
+ "type": "FETAARGS",
383
+ "shape": 7,
384
+ "link": null
385
+ }
386
+ ],
387
+ "outputs": [
388
+ {
389
+ "name": "samples",
390
+ "type": "LATENT",
391
+ "links": [
392
+ 33
393
+ ],
394
+ "slot_index": 0
395
+ }
396
+ ],
397
+ "properties": {
398
+ "Node name for S&R": "WanVideoSampler"
399
+ },
400
+ "widgets_values": [
401
+ 20,
402
+ 6,
403
+ 5,
404
+ 189992167790583,
405
+ "randomize",
406
+ true,
407
+ "dpm++",
408
+ 0,
409
+ 1
410
+ ]
411
+ },
412
+ {
413
+ "id": 35,
414
+ "type": "WanVideoTorchCompileSettings",
415
+ "pos": [
416
+ 1229.75146484375,
417
+ -314.2430725097656
418
+ ],
419
+ "size": [
420
+ 390.5999755859375,
421
+ 178
422
+ ],
423
+ "flags": {},
424
+ "order": 5,
425
+ "mode": 0,
426
+ "inputs": [],
427
+ "outputs": [
428
+ {
429
+ "name": "torch_compile_args",
430
+ "type": "WANCOMPILEARGS",
431
+ "links": [],
432
+ "slot_index": 0
433
+ }
434
+ ],
435
+ "properties": {
436
+ "Node name for S&R": "WanVideoTorchCompileSettings"
437
+ },
438
+ "widgets_values": [
439
+ "inductor",
440
+ false,
441
+ "default",
442
+ false,
443
+ 64,
444
+ true
445
+ ]
446
+ },
447
+ {
448
+ "id": 22,
449
+ "type": "WanVideoModelLoader",
450
+ "pos": [
451
+ 736.3001098632812,
452
+ -306.7892761230469
453
+ ],
454
+ "size": [
455
+ 477.4410095214844,
456
+ 226.43276977539062
457
+ ],
458
+ "flags": {},
459
+ "order": 12,
460
+ "mode": 0,
461
+ "inputs": [
462
+ {
463
+ "name": "compile_args",
464
+ "type": "WANCOMPILEARGS",
465
+ "shape": 7,
466
+ "link": null
467
+ },
468
+ {
469
+ "name": "block_swap_args",
470
+ "type": "BLOCKSWAPARGS",
471
+ "shape": 7,
472
+ "link": 39
473
+ },
474
+ {
475
+ "name": "lora",
476
+ "type": "WANVIDLORA",
477
+ "shape": 7,
478
+ "link": 41
479
+ }
480
+ ],
481
+ "outputs": [
482
+ {
483
+ "name": "model",
484
+ "type": "WANVIDEOMODEL",
485
+ "links": [
486
+ 29
487
+ ],
488
+ "slot_index": 0
489
+ }
490
+ ],
491
+ "properties": {
492
+ "Node name for S&R": "WanVideoModelLoader"
493
+ },
494
+ "widgets_values": [
495
+ "Wan2_1-I2V-14B-480P_fp8_e4m3fn.safetensors",
496
+ "bf16",
497
+ "fp8_e4m3fn",
498
+ "offload_device",
499
+ "sageattn"
500
+ ]
501
+ },
502
+ {
503
+ "id": 41,
504
+ "type": "WanVideoLoraSelect",
505
+ "pos": [
506
+ 402.9853515625,
507
+ -296.4585266113281
508
+ ],
509
+ "size": [
510
+ 315,
511
+ 102
512
+ ],
513
+ "flags": {},
514
+ "order": 9,
515
+ "mode": 0,
516
+ "inputs": [
517
+ {
518
+ "name": "prev_lora",
519
+ "type": "WANVIDLORA",
520
+ "shape": 7,
521
+ "link": null
522
+ },
523
+ {
524
+ "name": "blocks",
525
+ "type": "SELECTEDBLOCKS",
526
+ "shape": 7,
527
+ "link": null
528
+ }
529
+ ],
530
+ "outputs": [
531
+ {
532
+ "name": "lora",
533
+ "type": "WANVIDLORA",
534
+ "links": [
535
+ 41
536
+ ],
537
+ "slot_index": 0
538
+ }
539
+ ],
540
+ "properties": {
541
+ "Node name for S&R": "WanVideoLoraSelect"
542
+ },
543
+ "widgets_values": [
544
+ "transform2venom.safetensors",
545
+ 1
546
+ ]
547
+ },
548
+ {
549
+ "id": 36,
550
+ "type": "Note",
551
+ "pos": [
552
+ 106.82392120361328,
553
+ -5.778542518615723
554
+ ],
555
+ "size": [
556
+ 265.13958740234375,
557
+ 90.68971252441406
558
+ ],
559
+ "flags": {},
560
+ "order": 3,
561
+ "mode": 0,
562
+ "inputs": [],
563
+ "outputs": [],
564
+ "properties": {},
565
+ "widgets_values": [
566
+ "sdpa should work too, haven't tested flaash\n\nfp8_fast seems to cause huge quality degradation"
567
+ ],
568
+ "color": "#432",
569
+ "bgcolor": "#653"
570
+ },
571
+ {
572
+ "id": 32,
573
+ "type": "WanVideoBlockSwap",
574
+ "pos": [
575
+ 410.6151428222656,
576
+ -130.26060485839844
577
+ ],
578
+ "size": [
579
+ 315,
580
+ 58
581
+ ],
582
+ "flags": {},
583
+ "order": 8,
584
+ "mode": 0,
585
+ "inputs": [],
586
+ "outputs": [
587
+ {
588
+ "name": "block_swap_args",
589
+ "type": "BLOCKSWAPARGS",
590
+ "links": [
591
+ 39
592
+ ],
593
+ "slot_index": 0
594
+ }
595
+ ],
596
+ "properties": {
597
+ "Node name for S&R": "WanVideoBlockSwap"
598
+ },
599
+ "widgets_values": [
600
+ 10
601
+ ]
602
+ },
603
+ {
604
+ "id": 33,
605
+ "type": "Note",
606
+ "pos": [
607
+ 86.63419342041016,
608
+ -128.0150146484375
609
+ ],
610
+ "size": [
611
+ 318.5887756347656,
612
+ 58
613
+ ],
614
+ "flags": {},
615
+ "order": 7,
616
+ "mode": 0,
617
+ "inputs": [],
618
+ "outputs": [],
619
+ "properties": {},
620
+ "widgets_values": [
621
+ "Models:\nhttps://huggingface.co/Kijai/WanVideo_comfy/tree/main"
622
+ ],
623
+ "color": "#432",
624
+ "bgcolor": "#653"
625
+ },
626
+ {
627
+ "id": 16,
628
+ "type": "WanVideoTextEncode",
629
+ "pos": [
630
+ 795.1016235351562,
631
+ -16.162620544433594
632
+ ],
633
+ "size": [
634
+ 400,
635
+ 200
636
+ ],
637
+ "flags": {},
638
+ "order": 10,
639
+ "mode": 0,
640
+ "inputs": [
641
+ {
642
+ "name": "t5",
643
+ "type": "WANTEXTENCODER",
644
+ "link": 15
645
+ }
646
+ ],
647
+ "outputs": [
648
+ {
649
+ "name": "text_embeds",
650
+ "type": "WANVIDEOTEXTEMBEDS",
651
+ "links": [
652
+ 30
653
+ ],
654
+ "slot_index": 0
655
+ }
656
+ ],
657
+ "properties": {
658
+ "Node name for S&R": "WanVideoTextEncode"
659
+ },
660
+ "widgets_values": [
661
+ "In the video, a miniature tank is presented. The tank is held in a person’s hands. The person then presses on the tank, causing a sq41sh squish effect. The person keeps pressing down on the tank, further showing the sq41sh squish effect.",
662
+ "bad quality video",
663
+ true,
664
+ [
665
+ false,
666
+ true
667
+ ],
668
+ [
669
+ false,
670
+ true
671
+ ]
672
+ ]
673
+ }
674
+ ],
675
+ "links": [
676
+ [
677
+ 15,
678
+ 11,
679
+ 0,
680
+ 16,
681
+ 0,
682
+ "WANTEXTENCODER"
683
+ ],
684
+ [
685
+ 17,
686
+ 13,
687
+ 0,
688
+ 17,
689
+ 0,
690
+ "WANCLIP"
691
+ ],
692
+ [
693
+ 18,
694
+ 18,
695
+ 0,
696
+ 17,
697
+ 1,
698
+ "IMAGE"
699
+ ],
700
+ [
701
+ 21,
702
+ 21,
703
+ 0,
704
+ 17,
705
+ 2,
706
+ "VAE"
707
+ ],
708
+ [
709
+ 29,
710
+ 22,
711
+ 0,
712
+ 27,
713
+ 0,
714
+ "WANVIDEOMODEL"
715
+ ],
716
+ [
717
+ 30,
718
+ 16,
719
+ 0,
720
+ 27,
721
+ 1,
722
+ "WANVIDEOTEXTEMBEDS"
723
+ ],
724
+ [
725
+ 32,
726
+ 17,
727
+ 0,
728
+ 27,
729
+ 2,
730
+ "WANVIDIMAGE_EMBEDS"
731
+ ],
732
+ [
733
+ 33,
734
+ 27,
735
+ 0,
736
+ 28,
737
+ 1,
738
+ "LATENT"
739
+ ],
740
+ [
741
+ 34,
742
+ 21,
743
+ 0,
744
+ 28,
745
+ 0,
746
+ "VAE"
747
+ ],
748
+ [
749
+ 36,
750
+ 28,
751
+ 0,
752
+ 30,
753
+ 0,
754
+ "IMAGE"
755
+ ],
756
+ [
757
+ 39,
758
+ 32,
759
+ 0,
760
+ 22,
761
+ 1,
762
+ "BLOCKSWAPARGS"
763
+ ],
764
+ [
765
+ 41,
766
+ 41,
767
+ 0,
768
+ 22,
769
+ 2,
770
+ "WANVIDLORA"
771
+ ]
772
+ ],
773
+ "groups": [],
774
+ "config": {},
775
+ "extra": {
776
+ "ds": {
777
+ "scale": 0.7972024500000019,
778
+ "offset": {
779
+ "0": -135.86273193359375,
780
+ "1": 357.7580871582031
781
+ }
782
+ },
783
+ "node_versions": {
784
+ "ComfyUI-WanVideoWrapper": "4ce7e41492822e25f513f219ae11b1e0ff204b2a",
785
+ "ComfyUI-VideoHelperSuite": "565208bfe0a8050193ae3c8e61c96b6200dd9506",
786
+ "comfy-core": "0.3.18"
787
+ },
788
+ "VHS_latentpreview": false,
789
+ "VHS_latentpreviewrate": 0,
790
+ "VHS_MetadataImage": true,
791
+ "VHS_KeepIntermediate": true,
792
+ "ue_links": [],
793
+ "workspace_info": {
794
+ "id": "mZ-DLut47Mni3MFPHoL4Y",
795
+ "saveLock": false,
796
+ "cloudID": null,
797
+ "coverMediaPath": null
798
+ }
799
+ },
800
+ "version": 0.4
801
+ }