comfyuiman commited on
Commit
16c4c48
·
verified ·
1 Parent(s): a532078

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ loss_log.db filter=lfs diff=lfs merge=lfs -text
.huggingfaceignore ADDED
@@ -0,0 +1 @@
 
 
1
+ *.db-wal
.job_config.json ADDED
@@ -0,0 +1,227 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "job": "extension",
3
+ "config": {
4
+ "name": "PLORAV7_LTX",
5
+ "process": [
6
+ {
7
+ "type": "diffusion_trainer",
8
+ "training_folder": "/app/ai-toolkit/output",
9
+ "sqlite_db_path": "/app/ai-toolkit/aitk_db.db",
10
+ "device": "cuda",
11
+ "trigger_word": null,
12
+ "performance_log_every": 10,
13
+ "network": {
14
+ "type": "lora",
15
+ "linear": 32,
16
+ "linear_alpha": 32,
17
+ "conv": 16,
18
+ "conv_alpha": 16,
19
+ "lokr_full_rank": true,
20
+ "lokr_factor": -1,
21
+ "network_kwargs": {
22
+ "ignore_if_contains": []
23
+ }
24
+ },
25
+ "save": {
26
+ "dtype": "bf16",
27
+ "save_every": 500,
28
+ "max_step_saves_to_keep": 400,
29
+ "save_format": "diffusers",
30
+ "push_to_hub": false
31
+ },
32
+ "datasets": [
33
+ {
34
+ "folder_path": "/app/ai-toolkit/datasets/49",
35
+ "mask_path": null,
36
+ "mask_min_value": 0.1,
37
+ "default_caption": "",
38
+ "caption_ext": "txt",
39
+ "caption_dropout_rate": 0,
40
+ "cache_latents_to_disk": true,
41
+ "is_reg": false,
42
+ "network_weight": 1,
43
+ "resolution": [
44
+ 512
45
+ ],
46
+ "controls": [],
47
+ "shrink_video_to_frames": true,
48
+ "num_frames": 49,
49
+ "flip_x": false,
50
+ "flip_y": false,
51
+ "num_repeats": 2,
52
+ "do_i2v": false,
53
+ "fps": 24
54
+ },
55
+ {
56
+ "folder_path": "/app/ai-toolkit/datasets/73",
57
+ "mask_path": null,
58
+ "mask_min_value": 0.1,
59
+ "default_caption": "",
60
+ "caption_ext": "txt",
61
+ "caption_dropout_rate": 0,
62
+ "cache_latents_to_disk": true,
63
+ "is_reg": false,
64
+ "network_weight": 1,
65
+ "resolution": [
66
+ 512
67
+ ],
68
+ "controls": [],
69
+ "shrink_video_to_frames": true,
70
+ "num_frames": 73,
71
+ "flip_x": false,
72
+ "flip_y": false,
73
+ "num_repeats": 2
74
+ },
75
+ {
76
+ "folder_path": "/app/ai-toolkit/datasets/81",
77
+ "mask_path": null,
78
+ "mask_min_value": 0.1,
79
+ "default_caption": "",
80
+ "caption_ext": "txt",
81
+ "caption_dropout_rate": 0,
82
+ "cache_latents_to_disk": true,
83
+ "is_reg": false,
84
+ "network_weight": 1,
85
+ "resolution": [
86
+ 512
87
+ ],
88
+ "controls": [],
89
+ "shrink_video_to_frames": true,
90
+ "num_frames": 81,
91
+ "flip_x": false,
92
+ "flip_y": false,
93
+ "num_repeats": 2
94
+ },
95
+ {
96
+ "folder_path": "/app/ai-toolkit/datasets/89",
97
+ "mask_path": null,
98
+ "mask_min_value": 0.1,
99
+ "default_caption": "",
100
+ "caption_ext": "txt",
101
+ "caption_dropout_rate": 0,
102
+ "cache_latents_to_disk": true,
103
+ "is_reg": false,
104
+ "network_weight": 1,
105
+ "resolution": [
106
+ 512
107
+ ],
108
+ "controls": [],
109
+ "shrink_video_to_frames": true,
110
+ "num_frames": 89,
111
+ "flip_x": false,
112
+ "flip_y": false,
113
+ "num_repeats": 2
114
+ },
115
+ {
116
+ "folder_path": "/app/ai-toolkit/datasets/97",
117
+ "mask_path": null,
118
+ "mask_min_value": 0.1,
119
+ "default_caption": "",
120
+ "caption_ext": "txt",
121
+ "caption_dropout_rate": 0,
122
+ "cache_latents_to_disk": true,
123
+ "is_reg": false,
124
+ "network_weight": 1,
125
+ "resolution": [
126
+ 512
127
+ ],
128
+ "controls": [],
129
+ "shrink_video_to_frames": true,
130
+ "num_frames": 97,
131
+ "flip_x": false,
132
+ "flip_y": false,
133
+ "num_repeats": 2
134
+ },
135
+ {
136
+ "folder_path": "/app/ai-toolkit/datasets/images",
137
+ "mask_path": null,
138
+ "mask_min_value": 0.1,
139
+ "default_caption": "",
140
+ "caption_ext": "txt",
141
+ "caption_dropout_rate": 0,
142
+ "cache_latents_to_disk": true,
143
+ "is_reg": false,
144
+ "network_weight": 1,
145
+ "resolution": [
146
+ 512,
147
+ 768
148
+ ],
149
+ "controls": [],
150
+ "shrink_video_to_frames": true,
151
+ "num_frames": 1,
152
+ "flip_x": false,
153
+ "flip_y": false,
154
+ "num_repeats": 1
155
+ }
156
+ ],
157
+ "train": {
158
+ "batch_size": 1,
159
+ "bypass_guidance_embedding": false,
160
+ "steps": 25000,
161
+ "gradient_accumulation": 1,
162
+ "train_unet": true,
163
+ "train_text_encoder": false,
164
+ "gradient_checkpointing": true,
165
+ "noise_scheduler": "flowmatch",
166
+ "optimizer": "adamw8bit",
167
+ "timestep_type": "weighted",
168
+ "content_or_style": "balanced",
169
+ "optimizer_params": {
170
+ "weight_decay": 0.0001
171
+ },
172
+ "unload_text_encoder": false,
173
+ "cache_text_embeddings": true,
174
+ "lr": 0.0001,
175
+ "ema_config": {
176
+ "use_ema": false,
177
+ "ema_decay": 0.99
178
+ },
179
+ "skip_first_sample": false,
180
+ "force_first_sample": false,
181
+ "disable_sampling": true,
182
+ "dtype": "bf16",
183
+ "diff_output_preservation": false,
184
+ "diff_output_preservation_multiplier": 1,
185
+ "diff_output_preservation_class": "person",
186
+ "switch_boundary_every": 1,
187
+ "loss_type": "mse"
188
+ },
189
+ "logging": {
190
+ "log_every": 1,
191
+ "use_ui_logger": true
192
+ },
193
+ "model": {
194
+ "name_or_path": "Lightricks/LTX-2",
195
+ "quantize": true,
196
+ "qtype": "qfloat8",
197
+ "quantize_te": true,
198
+ "qtype_te": "uint6",
199
+ "arch": "ltx2",
200
+ "low_vram": true,
201
+ "model_kwargs": {},
202
+ "layer_offloading": false,
203
+ "layer_offloading_text_encoder_percent": 1,
204
+ "layer_offloading_transformer_percent": 1
205
+ },
206
+ "sample": {
207
+ "sampler": "flowmatch",
208
+ "sample_every": 250,
209
+ "width": 768,
210
+ "height": 768,
211
+ "samples": [],
212
+ "neg": "",
213
+ "seed": 42,
214
+ "walk_seed": true,
215
+ "guidance_scale": 4,
216
+ "sample_steps": 25,
217
+ "num_frames": 121,
218
+ "fps": 24
219
+ }
220
+ }
221
+ ]
222
+ },
223
+ "meta": {
224
+ "name": "[name]",
225
+ "version": "1.0"
226
+ }
227
+ }
PLORAV7_LTX_000000500.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d41895c8f8aa28a89a78feb28a29eedeb40f5eb0bdcf4fd507cc5046d0c8150
3
+ size 616948936
PLORAV7_LTX_000001000.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc4d78e9469b751ff5697e6e31ee1066cfefdc74523a129625da3bed3785cce2
3
+ size 616948936
PLORAV7_LTX_000001500.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:432752e36f370c551221a66abffb299a409b0abb60a086d9c8e42da3beb0c656
3
+ size 616948936
PLORAV7_LTX_000002000.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fa83117ceb7113ffd7aac0b131a9f8bfa4ad8ed51da50ca157d1828b443a39c
3
+ size 616948936
PLORAV7_LTX_000002500.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d792597c559358303edce19ff969ae86c5d959f69ebc529aaeb8fdd03106efd1
3
+ size 616948936
PLORAV7_LTX_000003000.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ae92528e5b06f7784180e66fa654d35099c2fb08a4edafbe58d4278f2a91aac
3
+ size 616948936
PLORAV7_LTX_000003500.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdae5b883f2c05bcb71ce95307f1252fb0c9817edef1a2c30bbc737d1b6ebc18
3
+ size 616948936
PLORAV7_LTX_000004000.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b354f2d509aae2f6d7d9e9a1cda12a38096728146bbbc323e0573ae22d37f1f
3
+ size 616948936
PLORAV7_LTX_000004500.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92ade0c748a15205a0cf94151b113fcd9a7fae530a615c743f234383ca2300aa
3
+ size 616948936
PLORAV7_LTX_000005000.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c96872f33ea4a33600d37272f7c5f5aef4436b1cdc0ace4a80bb0df963b60e27
3
+ size 616948936
PLORAV7_LTX_000005500.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfd606624bdc940ac90940b0d2c2cd7002c3761d0fa82358fece9c594a19600b
3
+ size 616948936
PLORAV7_LTX_000006000.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccb68a111c636d2f4ab6dfa1184201cd59c000b6c1a6a30cecbf984436fc8af2
3
+ size 616948936
PLORAV7_LTX_000006500.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:618e0a009a7213dff88f35943bc5937c15cfe29729ad64250e94bf802e5ab49b
3
+ size 616948936
PLORAV7_LTX_000007000.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9620a14bba8fae1e578eda64a2e100fc3a6ac5d6f2e2851e9d43119ac0072430
3
+ size 616948936
PLORAV7_LTX_000007500.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a73ce7788a7e444fe35060503ffd8351652ed6d1052f51f7d94335b514c5a95
3
+ size 616948936
PLORAV7_LTX_000008000.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97beedbc78317824fdaaeae7a4cc8b5b1957c48de2c01bdf65dad94ff256babc
3
+ size 616948936
PLORAV7_LTX_000008500.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c50a99d13a913843f4e2b9ee17d134154cff6cc32f9c4b69755dceb63f4f6428
3
+ size 616948936
PLORAV7_LTX_000009000.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a30f52f67aa087ea88c3337b650656ae22d7441d32ede56ba6f3a7eb4265a5d
3
+ size 616948936
PLORAV7_LTX_000009500.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:798570c465a7263cd06ea169044ee9eda9402b7bbf725b89b61607dfbafe81a7
3
+ size 616948936
PLORAV7_LTX_000010000.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:087ba767e92c10bd7dc9454aa7ad3b8dc839b8ef6029238bd7e800c1bbea05a0
3
+ size 616948936
PLORAV7_LTX_000010500.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:295d5947b8f997100425ce8373eb0e709ed5994af42b844fae5e3ec9ebed2d2a
3
+ size 616948936
PLORAV7_LTX_000011000.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7cbc6a8e154f6ff4e59569b7717df48abefac075861f21b2787927bc8e36fdc1
3
+ size 616948936
PLORAV7_LTX_000011500.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a384b90a9188c4806977c266c09b51addd147c3a9cd37584f55bcfbfa897a2a4
3
+ size 616948936
PLORAV7_LTX_000012000.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a91e6efa7842823d949b8230383a54b1f8ae269c49a11661d01543127c6c63e3
3
+ size 616948936
PLORAV7_LTX_000012500.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc2851c5894a7b6bb2bcfeb0ee30b1f9eaecd41ff406a3bc14218b4902a8b709
3
+ size 616948936
PLORAV7_LTX_000013000.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a6f79067ce45f0fc0d57b00c288727005c866b9f0b549dc75f511708d668523
3
+ size 616948936
PLORAV7_LTX_000013500.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f4eb36f76a73149055a88daaa47ec035bb0b1fc8e146ff44a229e546d8936fe
3
+ size 616948936
config.yaml ADDED
@@ -0,0 +1,192 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ job: extension
2
+ config:
3
+ name: PLORAV7_LTX
4
+ process:
5
+ - type: diffusion_trainer
6
+ training_folder: /app/ai-toolkit/output
7
+ sqlite_db_path: /app/ai-toolkit/aitk_db.db
8
+ device: cuda
9
+ trigger_word: null
10
+ performance_log_every: 10
11
+ network:
12
+ type: lora
13
+ linear: 32
14
+ linear_alpha: 32
15
+ conv: 16
16
+ conv_alpha: 16
17
+ lokr_full_rank: true
18
+ lokr_factor: -1
19
+ network_kwargs:
20
+ ignore_if_contains: []
21
+ save:
22
+ dtype: bf16
23
+ save_every: 500
24
+ max_step_saves_to_keep: 400
25
+ save_format: diffusers
26
+ push_to_hub: false
27
+ datasets:
28
+ - folder_path: /app/ai-toolkit/datasets/49
29
+ mask_path: null
30
+ mask_min_value: 0.1
31
+ default_caption: ''
32
+ caption_ext: txt
33
+ caption_dropout_rate: 0
34
+ cache_latents_to_disk: true
35
+ is_reg: false
36
+ network_weight: 1
37
+ resolution:
38
+ - 512
39
+ controls: []
40
+ shrink_video_to_frames: true
41
+ num_frames: 49
42
+ flip_x: false
43
+ flip_y: false
44
+ num_repeats: 2
45
+ do_i2v: false
46
+ fps: 24
47
+ - folder_path: /app/ai-toolkit/datasets/73
48
+ mask_path: null
49
+ mask_min_value: 0.1
50
+ default_caption: ''
51
+ caption_ext: txt
52
+ caption_dropout_rate: 0
53
+ cache_latents_to_disk: true
54
+ is_reg: false
55
+ network_weight: 1
56
+ resolution:
57
+ - 512
58
+ controls: []
59
+ shrink_video_to_frames: true
60
+ num_frames: 73
61
+ flip_x: false
62
+ flip_y: false
63
+ num_repeats: 2
64
+ - folder_path: /app/ai-toolkit/datasets/81
65
+ mask_path: null
66
+ mask_min_value: 0.1
67
+ default_caption: ''
68
+ caption_ext: txt
69
+ caption_dropout_rate: 0
70
+ cache_latents_to_disk: true
71
+ is_reg: false
72
+ network_weight: 1
73
+ resolution:
74
+ - 512
75
+ controls: []
76
+ shrink_video_to_frames: true
77
+ num_frames: 81
78
+ flip_x: false
79
+ flip_y: false
80
+ num_repeats: 2
81
+ - folder_path: /app/ai-toolkit/datasets/89
82
+ mask_path: null
83
+ mask_min_value: 0.1
84
+ default_caption: ''
85
+ caption_ext: txt
86
+ caption_dropout_rate: 0
87
+ cache_latents_to_disk: true
88
+ is_reg: false
89
+ network_weight: 1
90
+ resolution:
91
+ - 512
92
+ controls: []
93
+ shrink_video_to_frames: true
94
+ num_frames: 89
95
+ flip_x: false
96
+ flip_y: false
97
+ num_repeats: 2
98
+ - folder_path: /app/ai-toolkit/datasets/97
99
+ mask_path: null
100
+ mask_min_value: 0.1
101
+ default_caption: ''
102
+ caption_ext: txt
103
+ caption_dropout_rate: 0
104
+ cache_latents_to_disk: true
105
+ is_reg: false
106
+ network_weight: 1
107
+ resolution:
108
+ - 512
109
+ controls: []
110
+ shrink_video_to_frames: true
111
+ num_frames: 97
112
+ flip_x: false
113
+ flip_y: false
114
+ num_repeats: 2
115
+ - folder_path: /app/ai-toolkit/datasets/images
116
+ mask_path: null
117
+ mask_min_value: 0.1
118
+ default_caption: ''
119
+ caption_ext: txt
120
+ caption_dropout_rate: 0
121
+ cache_latents_to_disk: true
122
+ is_reg: false
123
+ network_weight: 1
124
+ resolution:
125
+ - 512
126
+ - 768
127
+ controls: []
128
+ shrink_video_to_frames: true
129
+ num_frames: 1
130
+ flip_x: false
131
+ flip_y: false
132
+ num_repeats: 1
133
+ train:
134
+ batch_size: 1
135
+ bypass_guidance_embedding: false
136
+ steps: 25000
137
+ gradient_accumulation: 1
138
+ train_unet: true
139
+ train_text_encoder: false
140
+ gradient_checkpointing: true
141
+ noise_scheduler: flowmatch
142
+ optimizer: adamw8bit
143
+ timestep_type: weighted
144
+ content_or_style: balanced
145
+ optimizer_params:
146
+ weight_decay: 0.0001
147
+ unload_text_encoder: false
148
+ cache_text_embeddings: true
149
+ lr: 0.0001
150
+ ema_config:
151
+ use_ema: false
152
+ ema_decay: 0.99
153
+ skip_first_sample: false
154
+ force_first_sample: false
155
+ disable_sampling: true
156
+ dtype: bf16
157
+ diff_output_preservation: false
158
+ diff_output_preservation_multiplier: 1
159
+ diff_output_preservation_class: person
160
+ switch_boundary_every: 1
161
+ loss_type: mse
162
+ logging:
163
+ log_every: 1
164
+ use_ui_logger: true
165
+ model:
166
+ name_or_path: Lightricks/LTX-2
167
+ quantize: true
168
+ qtype: qfloat8
169
+ quantize_te: true
170
+ qtype_te: uint6
171
+ arch: ltx2
172
+ low_vram: true
173
+ model_kwargs: {}
174
+ layer_offloading: false
175
+ layer_offloading_text_encoder_percent: 1
176
+ layer_offloading_transformer_percent: 1
177
+ sample:
178
+ sampler: flowmatch
179
+ sample_every: 250
180
+ width: 768
181
+ height: 768
182
+ samples: []
183
+ neg: ''
184
+ seed: 42
185
+ walk_seed: true
186
+ guidance_scale: 4
187
+ sample_steps: 25
188
+ num_frames: 121
189
+ fps: 24
190
+ meta:
191
+ name: PLORAV7_LTX
192
+ version: '1.0'
log.txt ADDED
The diff for this file is too large to render. See raw diff
 
logs/0_log.txt ADDED
@@ -0,0 +1,344 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
0
  0%| | 0/48 [00:00<?, ?it/s]
1
  0%| | 0/48 [00:00<?, ?it/s]
2
  2%|2 | 1/48 [00:00<00:27, 1.70it/s]
3
  2%|2 | 1/48 [00:00<00:27, 1.70it/s]
4
  4%|4 | 2/48 [00:00<00:19, 2.35it/s]
5
  4%|4 | 2/48 [00:00<00:19, 2.35it/s]
6
  6%|6 | 3/48 [00:01<00:18, 2.43it/s]
7
  6%|6 | 3/48 [00:01<00:18, 2.43it/s]
8
  8%|8 | 4/48 [00:01<00:16, 2.66it/s]
9
  8%|8 | 4/48 [00:01<00:16, 2.66it/s]
10
  10%|# | 5/48 [00:01<00:15, 2.82it/s]
11
  10%|# | 5/48 [00:01<00:15, 2.82it/s]
12
  12%|#2 | 6/48 [00:02<00:16, 2.62it/s]
13
  12%|#2 | 6/48 [00:02<00:16, 2.62it/s]
14
  15%|#4 | 7/48 [00:02<00:16, 2.47it/s]
15
  15%|#4 | 7/48 [00:02<00:16, 2.47it/s]
16
  17%|#6 | 8/48 [00:03<00:16, 2.45it/s]
17
  17%|#6 | 8/48 [00:03<00:16, 2.45it/s]
18
  19%|#8 | 9/48 [00:03<00:16, 2.41it/s]
19
  19%|#8 | 9/48 [00:03<00:16, 2.41it/s]
20
  21%|## | 10/48 [00:04<00:14, 2.54it/s]
21
  21%|## | 10/48 [00:04<00:14, 2.54it/s]
22
  23%|##2 | 11/48 [00:04<00:15, 2.38it/s]
23
  23%|##2 | 11/48 [00:04<00:15, 2.38it/s]
24
  25%|##5 | 12/48 [00:04<00:15, 2.29it/s]
25
  25%|##5 | 12/48 [00:04<00:15, 2.29it/s]
26
  27%|##7 | 13/48 [00:05<00:16, 2.19it/s]
27
  27%|##7 | 13/48 [00:05<00:16, 2.19it/s]
28
  29%|##9 | 14/48 [00:05<00:14, 2.40it/s]
29
  29%|##9 | 14/48 [00:05<00:14, 2.40it/s]
30
  31%|###1 | 15/48 [00:06<00:12, 2.55it/s]
31
  31%|###1 | 15/48 [00:06<00:12, 2.55it/s]
32
  33%|###3 | 16/48 [00:06<00:11, 2.68it/s]
33
  33%|###3 | 16/48 [00:06<00:11, 2.68it/s]
34
  35%|###5 | 17/48 [00:06<00:11, 2.80it/s]
35
  35%|###5 | 17/48 [00:06<00:11, 2.80it/s]
36
  38%|###7 | 18/48 [00:07<00:10, 2.87it/s]
37
  38%|###7 | 18/48 [00:07<00:10, 2.87it/s]
38
  40%|###9 | 19/48 [00:07<00:11, 2.56it/s]
39
  40%|###9 | 19/48 [00:07<00:11, 2.56it/s]
40
  42%|####1 | 20/48 [00:07<00:10, 2.70it/s]
41
  42%|####1 | 20/48 [00:07<00:10, 2.70it/s]
42
  44%|####3 | 21/48 [00:08<00:09, 2.79it/s]
43
  44%|####3 | 21/48 [00:08<00:09, 2.79it/s]
44
  46%|####5 | 22/48 [00:08<00:09, 2.86it/s]
45
  46%|####5 | 22/48 [00:08<00:09, 2.86it/s]
46
  48%|####7 | 23/48 [00:08<00:08, 2.92it/s]
47
  48%|####7 | 23/48 [00:08<00:08, 2.92it/s]
48
  50%|##### | 24/48 [00:09<00:08, 2.96it/s]
49
  50%|##### | 24/48 [00:09<00:08, 2.96it/s]
50
  52%|#####2 | 25/48 [00:09<00:08, 2.62it/s]
51
  52%|#####2 | 25/48 [00:09<00:08, 2.62it/s]
52
  54%|#####4 | 26/48 [00:10<00:08, 2.74it/s]
53
  54%|#####4 | 26/48 [00:10<00:08, 2.74it/s]
54
  56%|#####6 | 27/48 [00:10<00:07, 2.84it/s]
55
  56%|#####6 | 27/48 [00:10<00:07, 2.84it/s]
56
  58%|#####8 | 28/48 [00:10<00:06, 2.89it/s]
57
  58%|#####8 | 28/48 [00:10<00:06, 2.89it/s]
58
  60%|###### | 29/48 [00:11<00:06, 2.96it/s]
59
  60%|###### | 29/48 [00:11<00:06, 2.96it/s]
60
  62%|######2 | 30/48 [00:11<00:05, 3.01it/s]
61
  62%|######2 | 30/48 [00:11<00:05, 3.01it/s]
62
  65%|######4 | 31/48 [00:11<00:05, 3.01it/s]
63
  65%|######4 | 31/48 [00:11<00:05, 3.01it/s]
64
  67%|######6 | 32/48 [00:12<00:06, 2.65it/s]
65
  67%|######6 | 32/48 [00:12<00:06, 2.65it/s]
66
  69%|######8 | 33/48 [00:12<00:05, 2.77it/s]
67
  69%|######8 | 33/48 [00:12<00:05, 2.77it/s]
68
  71%|####### | 34/48 [00:12<00:04, 2.85it/s]
69
  71%|####### | 34/48 [00:12<00:04, 2.85it/s]
70
  73%|#######2 | 35/48 [00:13<00:04, 2.90it/s]
71
  73%|#######2 | 35/48 [00:13<00:04, 2.90it/s]
72
  75%|#######5 | 36/48 [00:13<00:04, 2.95it/s]
73
  75%|#######5 | 36/48 [00:13<00:04, 2.95it/s]
74
  77%|#######7 | 37/48 [00:13<00:03, 2.97it/s]
75
  77%|#######7 | 37/48 [00:13<00:03, 2.97it/s]
76
  79%|#######9 | 38/48 [00:14<00:03, 2.61it/s]
77
  79%|#######9 | 38/48 [00:14<00:03, 2.61it/s]
78
  81%|########1 | 39/48 [00:14<00:03, 2.73it/s]
79
  81%|########1 | 39/48 [00:14<00:03, 2.73it/s]
80
  83%|########3 | 40/48 [00:14<00:02, 2.82it/s]
81
  83%|########3 | 40/48 [00:14<00:02, 2.82it/s]
82
  85%|########5 | 41/48 [00:15<00:02, 2.90it/s]
83
  85%|########5 | 41/48 [00:15<00:02, 2.90it/s]
84
  88%|########7 | 42/48 [00:15<00:02, 2.95it/s]
85
  88%|########7 | 42/48 [00:15<00:02, 2.95it/s]
86
  90%|########9 | 43/48 [00:15<00:01, 2.99it/s]
87
  90%|########9 | 43/48 [00:15<00:01, 2.99it/s]
88
  92%|#########1| 44/48 [00:16<00:01, 3.01it/s]
89
  92%|#########1| 44/48 [00:16<00:01, 3.01it/s]
90
  94%|#########3| 45/48 [00:16<00:01, 2.63it/s]
91
  94%|#########3| 45/48 [00:16<00:01, 2.63it/s]
92
  96%|#########5| 46/48 [00:17<00:00, 2.75it/s]
93
  96%|#########5| 46/48 [00:17<00:00, 2.75it/s]
94
  98%|#########7| 47/48 [00:17<00:00, 2.85it/s]
95
  98%|#########7| 47/48 [00:17<00:00, 2.85it/s]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
96
  0%| | 0/140 [00:00<?, ?it/s]
97
  0%| | 0/140 [00:00<?, ?it/s]
98
  8%|7 | 11/140 [00:00<00:01, 102.69it/s]
99
  8%|7 | 11/140 [00:00<00:01, 102.69it/s]
100
  19%|#8 | 26/140 [00:00<00:00, 126.82it/s]
101
  19%|#8 | 26/140 [00:00<00:00, 126.82it/s]
102
  31%|### | 43/140 [00:00<00:00, 143.80it/s]
103
  31%|### | 43/140 [00:00<00:00, 143.80it/s]
104
  41%|####1 | 58/140 [00:00<00:00, 143.46it/s]
105
  41%|####1 | 58/140 [00:00<00:00, 143.46it/s]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Running 1 job
2
+ {
3
+ "type": "diffusion_trainer",
4
+ "training_folder": "/app/ai-toolkit/output",
5
+ "sqlite_db_path": "/app/ai-toolkit/aitk_db.db",
6
+ "device": "cuda",
7
+ "trigger_word": null,
8
+ "performance_log_every": 10,
9
+ "network": {
10
+ "type": "lora",
11
+ "linear": 32,
12
+ "linear_alpha": 32,
13
+ "conv": 16,
14
+ "conv_alpha": 16,
15
+ "lokr_full_rank": true,
16
+ "lokr_factor": -1,
17
+ "network_kwargs": {
18
+ "ignore_if_contains": []
19
+ }
20
+ },
21
+ "save": {
22
+ "dtype": "bf16",
23
+ "save_every": 500,
24
+ "max_step_saves_to_keep": 400,
25
+ "save_format": "diffusers",
26
+ "push_to_hub": false
27
+ },
28
+ "datasets": [
29
+ {
30
+ "folder_path": "/app/ai-toolkit/datasets/49",
31
+ "mask_path": null,
32
+ "mask_min_value": 0.1,
33
+ "default_caption": "",
34
+ "caption_ext": "txt",
35
+ "caption_dropout_rate": 0,
36
+ "cache_latents_to_disk": true,
37
+ "is_reg": false,
38
+ "network_weight": 1,
39
+ "resolution": [
40
+ 512
41
+ ],
42
+ "controls": [],
43
+ "shrink_video_to_frames": true,
44
+ "num_frames": 49,
45
+ "flip_x": false,
46
+ "flip_y": false,
47
+ "num_repeats": 2,
48
+ "do_i2v": false,
49
+ "fps": 24
50
+ },
51
+ {
52
+ "folder_path": "/app/ai-toolkit/datasets/73",
53
+ "mask_path": null,
54
+ "mask_min_value": 0.1,
55
+ "default_caption": "",
56
+ "caption_ext": "txt",
57
+ "caption_dropout_rate": 0,
58
+ "cache_latents_to_disk": true,
59
+ "is_reg": false,
60
+ "network_weight": 1,
61
+ "resolution": [
62
+ 512
63
+ ],
64
+ "controls": [],
65
+ "shrink_video_to_frames": true,
66
+ "num_frames": 73,
67
+ "flip_x": false,
68
+ "flip_y": false,
69
+ "num_repeats": 2
70
+ },
71
+ {
72
+ "folder_path": "/app/ai-toolkit/datasets/81",
73
+ "mask_path": null,
74
+ "mask_min_value": 0.1,
75
+ "default_caption": "",
76
+ "caption_ext": "txt",
77
+ "caption_dropout_rate": 0,
78
+ "cache_latents_to_disk": true,
79
+ "is_reg": false,
80
+ "network_weight": 1,
81
+ "resolution": [
82
+ 512
83
+ ],
84
+ "controls": [],
85
+ "shrink_video_to_frames": true,
86
+ "num_frames": 81,
87
+ "flip_x": false,
88
+ "flip_y": false,
89
+ "num_repeats": 2
90
+ },
91
+ {
92
+ "folder_path": "/app/ai-toolkit/datasets/89",
93
+ "mask_path": null,
94
+ "mask_min_value": 0.1,
95
+ "default_caption": "",
96
+ "caption_ext": "txt",
97
+ "caption_dropout_rate": 0,
98
+ "cache_latents_to_disk": true,
99
+ "is_reg": false,
100
+ "network_weight": 1,
101
+ "resolution": [
102
+ 512
103
+ ],
104
+ "controls": [],
105
+ "shrink_video_to_frames": true,
106
+ "num_frames": 89,
107
+ "flip_x": false,
108
+ "flip_y": false,
109
+ "num_repeats": 2
110
+ },
111
+ {
112
+ "folder_path": "/app/ai-toolkit/datasets/97",
113
+ "mask_path": null,
114
+ "mask_min_value": 0.1,
115
+ "default_caption": "",
116
+ "caption_ext": "txt",
117
+ "caption_dropout_rate": 0,
118
+ "cache_latents_to_disk": true,
119
+ "is_reg": false,
120
+ "network_weight": 1,
121
+ "resolution": [
122
+ 512
123
+ ],
124
+ "controls": [],
125
+ "shrink_video_to_frames": true,
126
+ "num_frames": 97,
127
+ "flip_x": false,
128
+ "flip_y": false,
129
+ "num_repeats": 2
130
+ },
131
+ {
132
+ "folder_path": "/app/ai-toolkit/datasets/images",
133
+ "mask_path": null,
134
+ "mask_min_value": 0.1,
135
+ "default_caption": "",
136
+ "caption_ext": "txt",
137
+ "caption_dropout_rate": 0,
138
+ "cache_latents_to_disk": true,
139
+ "is_reg": false,
140
+ "network_weight": 1,
141
+ "resolution": [
142
+ 512,
143
+ 768
144
+ ],
145
+ "controls": [],
146
+ "shrink_video_to_frames": true,
147
+ "num_frames": 1,
148
+ "flip_x": false,
149
+ "flip_y": false,
150
+ "num_repeats": 1
151
+ }
152
+ ],
153
+ "train": {
154
+ "batch_size": 1,
155
+ "bypass_guidance_embedding": false,
156
+ "steps": 25000,
157
+ "gradient_accumulation": 1,
158
+ "train_unet": true,
159
+ "train_text_encoder": false,
160
+ "gradient_checkpointing": true,
161
+ "noise_scheduler": "flowmatch",
162
+ "optimizer": "adamw8bit",
163
+ "timestep_type": "weighted",
164
+ "content_or_style": "balanced",
165
+ "optimizer_params": {
166
+ "weight_decay": 0.0001
167
+ },
168
+ "unload_text_encoder": false,
169
+ "cache_text_embeddings": true,
170
+ "lr": 0.0001,
171
+ "ema_config": {
172
+ "use_ema": false,
173
+ "ema_decay": 0.99
174
+ },
175
+ "skip_first_sample": false,
176
+ "force_first_sample": false,
177
+ "disable_sampling": true,
178
+ "dtype": "bf16",
179
+ "diff_output_preservation": false,
180
+ "diff_output_preservation_multiplier": 1,
181
+ "diff_output_preservation_class": "person",
182
+ "switch_boundary_every": 1,
183
+ "loss_type": "mse"
184
+ },
185
+ "logging": {
186
+ "log_every": 1,
187
+ "use_ui_logger": true
188
+ },
189
+ "model": {
190
+ "name_or_path": "Lightricks/LTX-2",
191
+ "quantize": true,
192
+ "qtype": "qfloat8",
193
+ "quantize_te": true,
194
+ "qtype_te": "uint6",
195
+ "arch": "ltx2",
196
+ "low_vram": true,
197
+ "model_kwargs": {},
198
+ "layer_offloading": false,
199
+ "layer_offloading_text_encoder_percent": 1,
200
+ "layer_offloading_transformer_percent": 1
201
+ },
202
+ "sample": {
203
+ "sampler": "flowmatch",
204
+ "sample_every": 250,
205
+ "width": 768,
206
+ "height": 768,
207
+ "samples": [],
208
+ "neg": "",
209
+ "seed": 42,
210
+ "walk_seed": true,
211
+ "guidance_scale": 4,
212
+ "sample_steps": 25,
213
+ "num_frames": 121,
214
+ "fps": 24
215
+ }
216
+ }
217
+ Changing sample extention to animated webp
218
+ Using SQLite database at /app/ai-toolkit/aitk_db.db
219
+ Job ID: "bf530ed1-e796-42a1-9ffa-55399fe92986"
220
+
221
+ #############################################
222
+ # Running job: PLORAV7_LTX
223
+ #############################################
224
+
225
+
226
+ Running 1 process
227
+ Loading LTX2 model
228
+ Loading transformer
229
+
230
+
231
+
232
+
233
+
234
+
235
+
236
+
237
+
238
+
239
+
240
+
241
+
242
+
243
+
244
+
245
+
246
+
247
+
248
+
249
+
250
+
251
+ Quantizing Transformer
252
+ - quantizing 48 transformer blocks
253
+
254
  0%| | 0/48 [00:00<?, ?it/s]
255
  0%| | 0/48 [00:00<?, ?it/s]
256
  2%|2 | 1/48 [00:00<00:27, 1.70it/s]
257
  2%|2 | 1/48 [00:00<00:27, 1.70it/s]
258
  4%|4 | 2/48 [00:00<00:19, 2.35it/s]
259
  4%|4 | 2/48 [00:00<00:19, 2.35it/s]
260
  6%|6 | 3/48 [00:01<00:18, 2.43it/s]
261
  6%|6 | 3/48 [00:01<00:18, 2.43it/s]
262
  8%|8 | 4/48 [00:01<00:16, 2.66it/s]
263
  8%|8 | 4/48 [00:01<00:16, 2.66it/s]
264
  10%|# | 5/48 [00:01<00:15, 2.82it/s]
265
  10%|# | 5/48 [00:01<00:15, 2.82it/s]
266
  12%|#2 | 6/48 [00:02<00:16, 2.62it/s]
267
  12%|#2 | 6/48 [00:02<00:16, 2.62it/s]
268
  15%|#4 | 7/48 [00:02<00:16, 2.47it/s]
269
  15%|#4 | 7/48 [00:02<00:16, 2.47it/s]
270
  17%|#6 | 8/48 [00:03<00:16, 2.45it/s]
271
  17%|#6 | 8/48 [00:03<00:16, 2.45it/s]
272
  19%|#8 | 9/48 [00:03<00:16, 2.41it/s]
273
  19%|#8 | 9/48 [00:03<00:16, 2.41it/s]
274
  21%|## | 10/48 [00:04<00:14, 2.54it/s]
275
  21%|## | 10/48 [00:04<00:14, 2.54it/s]
276
  23%|##2 | 11/48 [00:04<00:15, 2.38it/s]
277
  23%|##2 | 11/48 [00:04<00:15, 2.38it/s]
278
  25%|##5 | 12/48 [00:04<00:15, 2.29it/s]
279
  25%|##5 | 12/48 [00:04<00:15, 2.29it/s]
280
  27%|##7 | 13/48 [00:05<00:16, 2.19it/s]
281
  27%|##7 | 13/48 [00:05<00:16, 2.19it/s]
282
  29%|##9 | 14/48 [00:05<00:14, 2.40it/s]
283
  29%|##9 | 14/48 [00:05<00:14, 2.40it/s]
284
  31%|###1 | 15/48 [00:06<00:12, 2.55it/s]
285
  31%|###1 | 15/48 [00:06<00:12, 2.55it/s]
286
  33%|###3 | 16/48 [00:06<00:11, 2.68it/s]
287
  33%|###3 | 16/48 [00:06<00:11, 2.68it/s]
288
  35%|###5 | 17/48 [00:06<00:11, 2.80it/s]
289
  35%|###5 | 17/48 [00:06<00:11, 2.80it/s]
290
  38%|###7 | 18/48 [00:07<00:10, 2.87it/s]
291
  38%|###7 | 18/48 [00:07<00:10, 2.87it/s]
292
  40%|###9 | 19/48 [00:07<00:11, 2.56it/s]
293
  40%|###9 | 19/48 [00:07<00:11, 2.56it/s]
294
  42%|####1 | 20/48 [00:07<00:10, 2.70it/s]
295
  42%|####1 | 20/48 [00:07<00:10, 2.70it/s]
296
  44%|####3 | 21/48 [00:08<00:09, 2.79it/s]
297
  44%|####3 | 21/48 [00:08<00:09, 2.79it/s]
298
  46%|####5 | 22/48 [00:08<00:09, 2.86it/s]
299
  46%|####5 | 22/48 [00:08<00:09, 2.86it/s]
300
  48%|####7 | 23/48 [00:08<00:08, 2.92it/s]
301
  48%|####7 | 23/48 [00:08<00:08, 2.92it/s]
302
  50%|##### | 24/48 [00:09<00:08, 2.96it/s]
303
  50%|##### | 24/48 [00:09<00:08, 2.96it/s]
304
  52%|#####2 | 25/48 [00:09<00:08, 2.62it/s]
305
  52%|#####2 | 25/48 [00:09<00:08, 2.62it/s]
306
  54%|#####4 | 26/48 [00:10<00:08, 2.74it/s]
307
  54%|#####4 | 26/48 [00:10<00:08, 2.74it/s]
308
  56%|#####6 | 27/48 [00:10<00:07, 2.84it/s]
309
  56%|#####6 | 27/48 [00:10<00:07, 2.84it/s]
310
  58%|#####8 | 28/48 [00:10<00:06, 2.89it/s]
311
  58%|#####8 | 28/48 [00:10<00:06, 2.89it/s]
312
  60%|###### | 29/48 [00:11<00:06, 2.96it/s]
313
  60%|###### | 29/48 [00:11<00:06, 2.96it/s]
314
  62%|######2 | 30/48 [00:11<00:05, 3.01it/s]
315
  62%|######2 | 30/48 [00:11<00:05, 3.01it/s]
316
  65%|######4 | 31/48 [00:11<00:05, 3.01it/s]
317
  65%|######4 | 31/48 [00:11<00:05, 3.01it/s]
318
  67%|######6 | 32/48 [00:12<00:06, 2.65it/s]
319
  67%|######6 | 32/48 [00:12<00:06, 2.65it/s]
320
  69%|######8 | 33/48 [00:12<00:05, 2.77it/s]
321
  69%|######8 | 33/48 [00:12<00:05, 2.77it/s]
322
  71%|####### | 34/48 [00:12<00:04, 2.85it/s]
323
  71%|####### | 34/48 [00:12<00:04, 2.85it/s]
324
  73%|#######2 | 35/48 [00:13<00:04, 2.90it/s]
325
  73%|#######2 | 35/48 [00:13<00:04, 2.90it/s]
326
  75%|#######5 | 36/48 [00:13<00:04, 2.95it/s]
327
  75%|#######5 | 36/48 [00:13<00:04, 2.95it/s]
328
  77%|#######7 | 37/48 [00:13<00:03, 2.97it/s]
329
  77%|#######7 | 37/48 [00:13<00:03, 2.97it/s]
330
  79%|#######9 | 38/48 [00:14<00:03, 2.61it/s]
331
  79%|#######9 | 38/48 [00:14<00:03, 2.61it/s]
332
  81%|########1 | 39/48 [00:14<00:03, 2.73it/s]
333
  81%|########1 | 39/48 [00:14<00:03, 2.73it/s]
334
  83%|########3 | 40/48 [00:14<00:02, 2.82it/s]
335
  83%|########3 | 40/48 [00:14<00:02, 2.82it/s]
336
  85%|########5 | 41/48 [00:15<00:02, 2.90it/s]
337
  85%|########5 | 41/48 [00:15<00:02, 2.90it/s]
338
  88%|########7 | 42/48 [00:15<00:02, 2.95it/s]
339
  88%|########7 | 42/48 [00:15<00:02, 2.95it/s]
340
  90%|########9 | 43/48 [00:15<00:01, 2.99it/s]
341
  90%|########9 | 43/48 [00:15<00:01, 2.99it/s]
342
  92%|#########1| 44/48 [00:16<00:01, 3.01it/s]
343
  92%|#########1| 44/48 [00:16<00:01, 3.01it/s]
344
  94%|#########3| 45/48 [00:16<00:01, 2.63it/s]
345
  94%|#########3| 45/48 [00:16<00:01, 2.63it/s]
346
  96%|#########5| 46/48 [00:17<00:00, 2.75it/s]
347
  96%|#########5| 46/48 [00:17<00:00, 2.75it/s]
348
  98%|#########7| 47/48 [00:17<00:00, 2.85it/s]
349
  98%|#########7| 47/48 [00:17<00:00, 2.85it/s]
350
+
351
+ - quantizing extras
352
+ Moving transformer to CPU
353
+ Loading text encoder
354
+
355
+
356
+
357
+
358
+
359
+
360
+
361
+
362
+
363
+
364
+
365
+
366
+
367
+
368
+
369
+
370
+
371
+
372
+
373
+
374
+
375
+
376
+
377
+
378
+
379
+
380
+
381
+
382
+
383
+
384
+
385
+
386
+
387
+
388
+
389
+
390
+
391
+
392
+
393
+
394
+
395
+
396
+ Quantizing Text Encoder
397
+ Loading VAEs and other components
398
+
399
+
400
+
401
+
402
+
403
+
404
+
405
+
406
+
407
+
408
+
409
+
410
+
411
+
412
+
413
+
414
+ Making pipe
415
+ Preparing Model
416
+ Model Loaded
417
+ create LoRA network. base dim (rank): 32, alpha: 32
418
+ neuron dropout: p=None, rank dropout: p=None, module dropout: p=None
419
+ apply LoRA to Conv2d with kernel size (3,3). dim (rank): 16, alpha: 16
420
+ create LoRA for Text Encoder: 0 modules.
421
+ create LoRA for U-Net: 1344 modules.
422
+ enable LoRA for U-Net
423
+ Dataset: /app/ai-toolkit/datasets/49
424
+ - Preprocessing video dimensions
425
+
426
  0%| | 0/140 [00:00<?, ?it/s]
427
  0%| | 0/140 [00:00<?, ?it/s]
428
  8%|7 | 11/140 [00:00<00:01, 102.69it/s]
429
  8%|7 | 11/140 [00:00<00:01, 102.69it/s]
430
  19%|#8 | 26/140 [00:00<00:00, 126.82it/s]
431
  19%|#8 | 26/140 [00:00<00:00, 126.82it/s]
432
  31%|### | 43/140 [00:00<00:00, 143.80it/s]
433
  31%|### | 43/140 [00:00<00:00, 143.80it/s]
434
  41%|####1 | 58/140 [00:00<00:00, 143.46it/s]
435
  41%|####1 | 58/140 [00:00<00:00, 143.46it/s]
436
+
437
+ - Found 140 videos
438
+ Bucket sizes for /app/ai-toolkit/datasets/49:
439
+ 576x416: 78 files
440
+ 576x448: 44 files
441
+ 544x416: 16 files
442
+ 512x384: 2 files
443
+ 4 buckets made
444
+ Caching latents for /app/ai-toolkit/datasets/49
445
+ - Saving latents to disk
446
+
447
+
448
+ Caching text_embeddings for /app/ai-toolkit/datasets/49
449
+ - Saving text embeddings to disk
450
+
logs/1_log.txt ADDED
@@ -0,0 +1,378 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
0
  0%| | 0/48 [00:00<?, ?it/s]
1
  0%| | 0/48 [00:00<?, ?it/s]
2
  2%|2 | 1/48 [00:00<00:32, 1.44it/s]
3
  2%|2 | 1/48 [00:00<00:32, 1.44it/s]
4
  4%|4 | 2/48 [00:01<00:25, 1.79it/s]
5
  4%|4 | 2/48 [00:01<00:25, 1.79it/s]
6
  6%|6 | 3/48 [00:01<00:23, 1.94it/s]
7
  6%|6 | 3/48 [00:01<00:23, 1.94it/s]
8
  8%|8 | 4/48 [00:02<00:21, 2.02it/s]
9
  8%|8 | 4/48 [00:02<00:21, 2.02it/s]
10
  10%|# | 5/48 [00:02<00:20, 2.07it/s]
11
  10%|# | 5/48 [00:02<00:20, 2.07it/s]
12
  12%|#2 | 6/48 [00:03<00:19, 2.10it/s]
13
  12%|#2 | 6/48 [00:03<00:19, 2.10it/s]
14
  15%|#4 | 7/48 [00:03<00:19, 2.13it/s]
15
  15%|#4 | 7/48 [00:03<00:19, 2.13it/s]
16
  17%|#6 | 8/48 [00:03<00:18, 2.14it/s]
17
  17%|#6 | 8/48 [00:03<00:18, 2.14it/s]
18
  19%|#8 | 9/48 [00:04<00:18, 2.16it/s]
19
  19%|#8 | 9/48 [00:04<00:18, 2.16it/s]
20
  21%|## | 10/48 [00:04<00:17, 2.18it/s]
21
  21%|## | 10/48 [00:04<00:17, 2.18it/s]
22
  23%|##2 | 11/48 [00:05<00:16, 2.18it/s]
23
  23%|##2 | 11/48 [00:05<00:16, 2.18it/s]
24
  25%|##5 | 12/48 [00:05<00:16, 2.19it/s]
25
  25%|##5 | 12/48 [00:05<00:16, 2.19it/s]
26
  27%|##7 | 13/48 [00:06<00:17, 1.98it/s]
27
  27%|##7 | 13/48 [00:06<00:17, 1.98it/s]
28
  29%|##9 | 14/48 [00:06<00:16, 2.05it/s]
29
  29%|##9 | 14/48 [00:06<00:16, 2.05it/s]
30
  31%|###1 | 15/48 [00:07<00:15, 2.10it/s]
31
  31%|###1 | 15/48 [00:07<00:15, 2.10it/s]
32
  33%|###3 | 16/48 [00:07<00:15, 2.13it/s]
33
  33%|###3 | 16/48 [00:07<00:15, 2.13it/s]
34
  35%|###5 | 17/48 [00:08<00:14, 2.15it/s]
35
  35%|###5 | 17/48 [00:08<00:14, 2.15it/s]
36
  38%|###7 | 18/48 [00:08<00:13, 2.17it/s]
37
  38%|###7 | 18/48 [00:08<00:13, 2.17it/s]
38
  40%|###9 | 19/48 [00:09<00:14, 1.99it/s]
39
  40%|###9 | 19/48 [00:09<00:14, 1.99it/s]
40
  42%|####1 | 20/48 [00:09<00:13, 2.05it/s]
41
  42%|####1 | 20/48 [00:09<00:13, 2.05it/s]
42
  44%|####3 | 21/48 [00:10<00:12, 2.08it/s]
43
  44%|####3 | 21/48 [00:10<00:12, 2.08it/s]
44
  46%|####5 | 22/48 [00:10<00:12, 2.11it/s]
45
  46%|####5 | 22/48 [00:10<00:12, 2.11it/s]
46
  48%|####7 | 23/48 [00:11<00:11, 2.14it/s]
47
  48%|####7 | 23/48 [00:11<00:11, 2.14it/s]
48
  50%|##### | 24/48 [00:11<00:11, 2.17it/s]
49
  50%|##### | 24/48 [00:11<00:11, 2.17it/s]
50
  52%|#####2 | 25/48 [00:12<00:11, 1.96it/s]
51
  52%|#####2 | 25/48 [00:12<00:11, 1.96it/s]
52
  54%|#####4 | 26/48 [00:12<00:10, 2.07it/s]
53
  54%|#####4 | 26/48 [00:12<00:10, 2.07it/s]
54
  56%|#####6 | 27/48 [00:12<00:09, 2.13it/s]
55
  56%|#####6 | 27/48 [00:12<00:09, 2.13it/s]
56
  58%|#####8 | 28/48 [00:13<00:09, 2.18it/s]
57
  58%|#####8 | 28/48 [00:13<00:09, 2.18it/s]
58
  60%|###### | 29/48 [00:13<00:08, 2.22it/s]
59
  60%|###### | 29/48 [00:13<00:08, 2.22it/s]
60
  62%|######2 | 30/48 [00:14<00:08, 2.25it/s]
61
  62%|######2 | 30/48 [00:14<00:08, 2.25it/s]
62
  65%|######4 | 31/48 [00:14<00:07, 2.27it/s]
63
  65%|######4 | 31/48 [00:14<00:07, 2.27it/s]
64
  67%|######6 | 32/48 [00:15<00:07, 2.01it/s]
65
  67%|######6 | 32/48 [00:15<00:07, 2.01it/s]
66
  69%|######8 | 33/48 [00:15<00:07, 2.06it/s]
67
  69%|######8 | 33/48 [00:15<00:07, 2.06it/s]
68
  71%|####### | 34/48 [00:16<00:06, 2.10it/s]
69
  71%|####### | 34/48 [00:16<00:06, 2.10it/s]
70
  73%|#######2 | 35/48 [00:16<00:06, 2.13it/s]
71
  73%|#######2 | 35/48 [00:16<00:06, 2.13it/s]
72
  75%|#######5 | 36/48 [00:17<00:05, 2.16it/s]
73
  75%|#######5 | 36/48 [00:17<00:05, 2.16it/s]
74
  77%|#######7 | 37/48 [00:17<00:05, 2.18it/s]
75
  77%|#######7 | 37/48 [00:17<00:05, 2.18it/s]
76
  79%|#######9 | 38/48 [00:18<00:05, 1.98it/s]
77
  79%|#######9 | 38/48 [00:18<00:05, 1.98it/s]
78
  81%|########1 | 39/48 [00:18<00:04, 1.93it/s]
79
  81%|########1 | 39/48 [00:18<00:04, 1.93it/s]
80
  83%|########3 | 40/48 [00:19<00:04, 1.86it/s]
81
  83%|########3 | 40/48 [00:19<00:04, 1.86it/s]
82
  85%|########5 | 41/48 [00:19<00:03, 1.82it/s]
83
  85%|########5 | 41/48 [00:19<00:03, 1.82it/s]
84
  88%|########7 | 42/48 [00:20<00:03, 1.78it/s]
85
  88%|########7 | 42/48 [00:20<00:03, 1.78it/s]
86
  90%|########9 | 43/48 [00:21<00:02, 1.73it/s]
87
  90%|########9 | 43/48 [00:21<00:02, 1.73it/s]
88
  92%|#########1| 44/48 [00:21<00:02, 1.71it/s]
89
  92%|#########1| 44/48 [00:21<00:02, 1.71it/s]
90
  94%|#########3| 45/48 [00:22<00:01, 1.52it/s]
91
  94%|#########3| 45/48 [00:22<00:01, 1.52it/s]
92
  96%|#########5| 46/48 [00:23<00:01, 1.55it/s]
93
  96%|#########5| 46/48 [00:23<00:01, 1.55it/s]
94
  98%|#########7| 47/48 [00:23<00:00, 1.56it/s]
95
  98%|#########7| 47/48 [00:23<00:00, 1.56it/s]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
96
  0%| | 0/140 [00:00<?, ?it/s]
97
  0%| | 0/140 [00:00<?, ?it/s]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
98
  0%| | 0/122 [00:00<?, ?it/s]
99
  0%| | 0/122 [00:00<?, ?it/s]
100
  16%|#5 | 19/122 [00:00<00:00, 187.83it/s]
101
  16%|#5 | 19/122 [00:00<00:00, 187.83it/s]
102
  31%|###1 | 38/122 [00:00<00:00, 164.03it/s]
103
  31%|###1 | 38/122 [00:00<00:00, 164.03it/s]
104
  45%|####5 | 55/122 [00:00<00:00, 161.12it/s]
105
  45%|####5 | 55/122 [00:00<00:00, 161.12it/s]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
106
  0%| | 0/2 [00:00<?, ?it/s]
107
  0%| | 0/2 [00:00<?, ?it/s]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
108
  0%| | 0/4 [00:00<?, ?it/s]
109
  0%| | 0/4 [00:00<?, ?it/s]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
110
  0%| | 0/58 [00:00<?, ?it/s]
111
  0%| | 0/58 [00:00<?, ?it/s]
112
  26%|##5 | 15/58 [00:00<00:00, 146.08it/s]
113
  26%|##5 | 15/58 [00:00<00:00, 146.08it/s]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
114
  0%| | 0/47 [00:00<?, ?it/s]
115
  0%| | 0/47 [00:00<?, ?it/s]
116
  70%|####### | 33/47 [00:00<00:00, 329.71it/s]
117
  70%|####### | 33/47 [00:00<00:00, 329.71it/s]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
118
  0%| | 0/47 [00:00<?, ?it/s]
119
  0%| | 0/47 [00:00<?, ?it/s]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Running 1 job
2
+ {
3
+ "type": "diffusion_trainer",
4
+ "training_folder": "/app/ai-toolkit/output",
5
+ "sqlite_db_path": "/app/ai-toolkit/aitk_db.db",
6
+ "device": "cuda",
7
+ "trigger_word": null,
8
+ "performance_log_every": 10,
9
+ "network": {
10
+ "type": "lora",
11
+ "linear": 32,
12
+ "linear_alpha": 32,
13
+ "conv": 16,
14
+ "conv_alpha": 16,
15
+ "lokr_full_rank": true,
16
+ "lokr_factor": -1,
17
+ "network_kwargs": {
18
+ "ignore_if_contains": []
19
+ }
20
+ },
21
+ "save": {
22
+ "dtype": "bf16",
23
+ "save_every": 500,
24
+ "max_step_saves_to_keep": 400,
25
+ "save_format": "diffusers",
26
+ "push_to_hub": false
27
+ },
28
+ "datasets": [
29
+ {
30
+ "folder_path": "/app/ai-toolkit/datasets/49",
31
+ "mask_path": null,
32
+ "mask_min_value": 0.1,
33
+ "default_caption": "",
34
+ "caption_ext": "txt",
35
+ "caption_dropout_rate": 0,
36
+ "cache_latents_to_disk": true,
37
+ "is_reg": false,
38
+ "network_weight": 1,
39
+ "resolution": [
40
+ 512
41
+ ],
42
+ "controls": [],
43
+ "shrink_video_to_frames": true,
44
+ "num_frames": 49,
45
+ "flip_x": false,
46
+ "flip_y": false,
47
+ "num_repeats": 2,
48
+ "do_i2v": false,
49
+ "fps": 24
50
+ },
51
+ {
52
+ "folder_path": "/app/ai-toolkit/datasets/73",
53
+ "mask_path": null,
54
+ "mask_min_value": 0.1,
55
+ "default_caption": "",
56
+ "caption_ext": "txt",
57
+ "caption_dropout_rate": 0,
58
+ "cache_latents_to_disk": true,
59
+ "is_reg": false,
60
+ "network_weight": 1,
61
+ "resolution": [
62
+ 512
63
+ ],
64
+ "controls": [],
65
+ "shrink_video_to_frames": true,
66
+ "num_frames": 73,
67
+ "flip_x": false,
68
+ "flip_y": false,
69
+ "num_repeats": 2
70
+ },
71
+ {
72
+ "folder_path": "/app/ai-toolkit/datasets/81",
73
+ "mask_path": null,
74
+ "mask_min_value": 0.1,
75
+ "default_caption": "",
76
+ "caption_ext": "txt",
77
+ "caption_dropout_rate": 0,
78
+ "cache_latents_to_disk": true,
79
+ "is_reg": false,
80
+ "network_weight": 1,
81
+ "resolution": [
82
+ 512
83
+ ],
84
+ "controls": [],
85
+ "shrink_video_to_frames": true,
86
+ "num_frames": 81,
87
+ "flip_x": false,
88
+ "flip_y": false,
89
+ "num_repeats": 2
90
+ },
91
+ {
92
+ "folder_path": "/app/ai-toolkit/datasets/89",
93
+ "mask_path": null,
94
+ "mask_min_value": 0.1,
95
+ "default_caption": "",
96
+ "caption_ext": "txt",
97
+ "caption_dropout_rate": 0,
98
+ "cache_latents_to_disk": true,
99
+ "is_reg": false,
100
+ "network_weight": 1,
101
+ "resolution": [
102
+ 512
103
+ ],
104
+ "controls": [],
105
+ "shrink_video_to_frames": true,
106
+ "num_frames": 89,
107
+ "flip_x": false,
108
+ "flip_y": false,
109
+ "num_repeats": 2
110
+ },
111
+ {
112
+ "folder_path": "/app/ai-toolkit/datasets/97",
113
+ "mask_path": null,
114
+ "mask_min_value": 0.1,
115
+ "default_caption": "",
116
+ "caption_ext": "txt",
117
+ "caption_dropout_rate": 0,
118
+ "cache_latents_to_disk": true,
119
+ "is_reg": false,
120
+ "network_weight": 1,
121
+ "resolution": [
122
+ 512
123
+ ],
124
+ "controls": [],
125
+ "shrink_video_to_frames": true,
126
+ "num_frames": 97,
127
+ "flip_x": false,
128
+ "flip_y": false,
129
+ "num_repeats": 2
130
+ },
131
+ {
132
+ "folder_path": "/app/ai-toolkit/datasets/images",
133
+ "mask_path": null,
134
+ "mask_min_value": 0.1,
135
+ "default_caption": "",
136
+ "caption_ext": "txt",
137
+ "caption_dropout_rate": 0,
138
+ "cache_latents_to_disk": true,
139
+ "is_reg": false,
140
+ "network_weight": 1,
141
+ "resolution": [
142
+ 512,
143
+ 768
144
+ ],
145
+ "controls": [],
146
+ "shrink_video_to_frames": true,
147
+ "num_frames": 1,
148
+ "flip_x": false,
149
+ "flip_y": false,
150
+ "num_repeats": 1
151
+ }
152
+ ],
153
+ "train": {
154
+ "batch_size": 1,
155
+ "bypass_guidance_embedding": false,
156
+ "steps": 25000,
157
+ "gradient_accumulation": 1,
158
+ "train_unet": true,
159
+ "train_text_encoder": false,
160
+ "gradient_checkpointing": true,
161
+ "noise_scheduler": "flowmatch",
162
+ "optimizer": "adamw8bit",
163
+ "timestep_type": "weighted",
164
+ "content_or_style": "balanced",
165
+ "optimizer_params": {
166
+ "weight_decay": 0.0001
167
+ },
168
+ "unload_text_encoder": false,
169
+ "cache_text_embeddings": true,
170
+ "lr": 0.0001,
171
+ "ema_config": {
172
+ "use_ema": false,
173
+ "ema_decay": 0.99
174
+ },
175
+ "skip_first_sample": false,
176
+ "force_first_sample": false,
177
+ "disable_sampling": true,
178
+ "dtype": "bf16",
179
+ "diff_output_preservation": false,
180
+ "diff_output_preservation_multiplier": 1,
181
+ "diff_output_preservation_class": "person",
182
+ "switch_boundary_every": 1,
183
+ "loss_type": "mse"
184
+ },
185
+ "logging": {
186
+ "log_every": 1,
187
+ "use_ui_logger": true
188
+ },
189
+ "model": {
190
+ "name_or_path": "Lightricks/LTX-2",
191
+ "quantize": true,
192
+ "qtype": "qfloat8",
193
+ "quantize_te": true,
194
+ "qtype_te": "uint6",
195
+ "arch": "ltx2",
196
+ "low_vram": true,
197
+ "model_kwargs": {},
198
+ "layer_offloading": false,
199
+ "layer_offloading_text_encoder_percent": 1,
200
+ "layer_offloading_transformer_percent": 1
201
+ },
202
+ "sample": {
203
+ "sampler": "flowmatch",
204
+ "sample_every": 250,
205
+ "width": 768,
206
+ "height": 768,
207
+ "samples": [],
208
+ "neg": "",
209
+ "seed": 42,
210
+ "walk_seed": true,
211
+ "guidance_scale": 4,
212
+ "sample_steps": 25,
213
+ "num_frames": 121,
214
+ "fps": 24
215
+ }
216
+ }
217
+ Changing sample extention to animated webp
218
+ Using SQLite database at /app/ai-toolkit/aitk_db.db
219
+ Job ID: "bf530ed1-e796-42a1-9ffa-55399fe92986"
220
+
221
+ #############################################
222
+ # Running job: PLORAV7_LTX
223
+ #############################################
224
+
225
+
226
+ Running 1 process
227
+ Loading LTX2 model
228
+ Loading transformer
229
+
230
+
231
+ Quantizing Transformer
232
+ - quantizing 48 transformer blocks
233
+
234
  0%| | 0/48 [00:00<?, ?it/s]
235
  0%| | 0/48 [00:00<?, ?it/s]
236
  2%|2 | 1/48 [00:00<00:32, 1.44it/s]
237
  2%|2 | 1/48 [00:00<00:32, 1.44it/s]
238
  4%|4 | 2/48 [00:01<00:25, 1.79it/s]
239
  4%|4 | 2/48 [00:01<00:25, 1.79it/s]
240
  6%|6 | 3/48 [00:01<00:23, 1.94it/s]
241
  6%|6 | 3/48 [00:01<00:23, 1.94it/s]
242
  8%|8 | 4/48 [00:02<00:21, 2.02it/s]
243
  8%|8 | 4/48 [00:02<00:21, 2.02it/s]
244
  10%|# | 5/48 [00:02<00:20, 2.07it/s]
245
  10%|# | 5/48 [00:02<00:20, 2.07it/s]
246
  12%|#2 | 6/48 [00:03<00:19, 2.10it/s]
247
  12%|#2 | 6/48 [00:03<00:19, 2.10it/s]
248
  15%|#4 | 7/48 [00:03<00:19, 2.13it/s]
249
  15%|#4 | 7/48 [00:03<00:19, 2.13it/s]
250
  17%|#6 | 8/48 [00:03<00:18, 2.14it/s]
251
  17%|#6 | 8/48 [00:03<00:18, 2.14it/s]
252
  19%|#8 | 9/48 [00:04<00:18, 2.16it/s]
253
  19%|#8 | 9/48 [00:04<00:18, 2.16it/s]
254
  21%|## | 10/48 [00:04<00:17, 2.18it/s]
255
  21%|## | 10/48 [00:04<00:17, 2.18it/s]
256
  23%|##2 | 11/48 [00:05<00:16, 2.18it/s]
257
  23%|##2 | 11/48 [00:05<00:16, 2.18it/s]
258
  25%|##5 | 12/48 [00:05<00:16, 2.19it/s]
259
  25%|##5 | 12/48 [00:05<00:16, 2.19it/s]
260
  27%|##7 | 13/48 [00:06<00:17, 1.98it/s]
261
  27%|##7 | 13/48 [00:06<00:17, 1.98it/s]
262
  29%|##9 | 14/48 [00:06<00:16, 2.05it/s]
263
  29%|##9 | 14/48 [00:06<00:16, 2.05it/s]
264
  31%|###1 | 15/48 [00:07<00:15, 2.10it/s]
265
  31%|###1 | 15/48 [00:07<00:15, 2.10it/s]
266
  33%|###3 | 16/48 [00:07<00:15, 2.13it/s]
267
  33%|###3 | 16/48 [00:07<00:15, 2.13it/s]
268
  35%|###5 | 17/48 [00:08<00:14, 2.15it/s]
269
  35%|###5 | 17/48 [00:08<00:14, 2.15it/s]
270
  38%|###7 | 18/48 [00:08<00:13, 2.17it/s]
271
  38%|###7 | 18/48 [00:08<00:13, 2.17it/s]
272
  40%|###9 | 19/48 [00:09<00:14, 1.99it/s]
273
  40%|###9 | 19/48 [00:09<00:14, 1.99it/s]
274
  42%|####1 | 20/48 [00:09<00:13, 2.05it/s]
275
  42%|####1 | 20/48 [00:09<00:13, 2.05it/s]
276
  44%|####3 | 21/48 [00:10<00:12, 2.08it/s]
277
  44%|####3 | 21/48 [00:10<00:12, 2.08it/s]
278
  46%|####5 | 22/48 [00:10<00:12, 2.11it/s]
279
  46%|####5 | 22/48 [00:10<00:12, 2.11it/s]
280
  48%|####7 | 23/48 [00:11<00:11, 2.14it/s]
281
  48%|####7 | 23/48 [00:11<00:11, 2.14it/s]
282
  50%|##### | 24/48 [00:11<00:11, 2.17it/s]
283
  50%|##### | 24/48 [00:11<00:11, 2.17it/s]
284
  52%|#####2 | 25/48 [00:12<00:11, 1.96it/s]
285
  52%|#####2 | 25/48 [00:12<00:11, 1.96it/s]
286
  54%|#####4 | 26/48 [00:12<00:10, 2.07it/s]
287
  54%|#####4 | 26/48 [00:12<00:10, 2.07it/s]
288
  56%|#####6 | 27/48 [00:12<00:09, 2.13it/s]
289
  56%|#####6 | 27/48 [00:12<00:09, 2.13it/s]
290
  58%|#####8 | 28/48 [00:13<00:09, 2.18it/s]
291
  58%|#####8 | 28/48 [00:13<00:09, 2.18it/s]
292
  60%|###### | 29/48 [00:13<00:08, 2.22it/s]
293
  60%|###### | 29/48 [00:13<00:08, 2.22it/s]
294
  62%|######2 | 30/48 [00:14<00:08, 2.25it/s]
295
  62%|######2 | 30/48 [00:14<00:08, 2.25it/s]
296
  65%|######4 | 31/48 [00:14<00:07, 2.27it/s]
297
  65%|######4 | 31/48 [00:14<00:07, 2.27it/s]
298
  67%|######6 | 32/48 [00:15<00:07, 2.01it/s]
299
  67%|######6 | 32/48 [00:15<00:07, 2.01it/s]
300
  69%|######8 | 33/48 [00:15<00:07, 2.06it/s]
301
  69%|######8 | 33/48 [00:15<00:07, 2.06it/s]
302
  71%|####### | 34/48 [00:16<00:06, 2.10it/s]
303
  71%|####### | 34/48 [00:16<00:06, 2.10it/s]
304
  73%|#######2 | 35/48 [00:16<00:06, 2.13it/s]
305
  73%|#######2 | 35/48 [00:16<00:06, 2.13it/s]
306
  75%|#######5 | 36/48 [00:17<00:05, 2.16it/s]
307
  75%|#######5 | 36/48 [00:17<00:05, 2.16it/s]
308
  77%|#######7 | 37/48 [00:17<00:05, 2.18it/s]
309
  77%|#######7 | 37/48 [00:17<00:05, 2.18it/s]
310
  79%|#######9 | 38/48 [00:18<00:05, 1.98it/s]
311
  79%|#######9 | 38/48 [00:18<00:05, 1.98it/s]
312
  81%|########1 | 39/48 [00:18<00:04, 1.93it/s]
313
  81%|########1 | 39/48 [00:18<00:04, 1.93it/s]
314
  83%|########3 | 40/48 [00:19<00:04, 1.86it/s]
315
  83%|########3 | 40/48 [00:19<00:04, 1.86it/s]
316
  85%|########5 | 41/48 [00:19<00:03, 1.82it/s]
317
  85%|########5 | 41/48 [00:19<00:03, 1.82it/s]
318
  88%|########7 | 42/48 [00:20<00:03, 1.78it/s]
319
  88%|########7 | 42/48 [00:20<00:03, 1.78it/s]
320
  90%|########9 | 43/48 [00:21<00:02, 1.73it/s]
321
  90%|########9 | 43/48 [00:21<00:02, 1.73it/s]
322
  92%|#########1| 44/48 [00:21<00:02, 1.71it/s]
323
  92%|#########1| 44/48 [00:21<00:02, 1.71it/s]
324
  94%|#########3| 45/48 [00:22<00:01, 1.52it/s]
325
  94%|#########3| 45/48 [00:22<00:01, 1.52it/s]
326
  96%|#########5| 46/48 [00:23<00:01, 1.55it/s]
327
  96%|#########5| 46/48 [00:23<00:01, 1.55it/s]
328
  98%|#########7| 47/48 [00:23<00:00, 1.56it/s]
329
  98%|#########7| 47/48 [00:23<00:00, 1.56it/s]
330
+
331
+ - quantizing extras
332
+ Moving transformer to CPU
333
+ Loading text encoder
334
+
335
+
336
+ Quantizing Text Encoder
337
+ Loading VAEs and other components
338
+ Making pipe
339
+ Preparing Model
340
+ Model Loaded
341
+ create LoRA network. base dim (rank): 32, alpha: 32
342
+ neuron dropout: p=None, rank dropout: p=None, module dropout: p=None
343
+ apply LoRA to Conv2d with kernel size (3,3). dim (rank): 16, alpha: 16
344
+ create LoRA for Text Encoder: 0 modules.
345
+ create LoRA for U-Net: 1344 modules.
346
+ enable LoRA for U-Net
347
+ Dataset: /app/ai-toolkit/datasets/49
348
+ - Preprocessing video dimensions
349
+
350
  0%| | 0/140 [00:00<?, ?it/s]
351
  0%| | 0/140 [00:00<?, ?it/s]
352
+
353
+ - Found 140 videos
354
+ Bucket sizes for /app/ai-toolkit/datasets/49:
355
+ 576x416: 78 files
356
+ 576x448: 44 files
357
+ 544x416: 16 files
358
+ 512x384: 2 files
359
+ 4 buckets made
360
+ Caching latents for /app/ai-toolkit/datasets/49
361
+ - Saving latents to disk
362
+
363
+
364
+ Caching text_embeddings for /app/ai-toolkit/datasets/49
365
+ - Saving text embeddings to disk
366
+
367
+
368
+ Dataset: /app/ai-toolkit/datasets/73
369
+ - Preprocessing video dimensions
370
+
371
  0%| | 0/122 [00:00<?, ?it/s]
372
  0%| | 0/122 [00:00<?, ?it/s]
373
  16%|#5 | 19/122 [00:00<00:00, 187.83it/s]
374
  16%|#5 | 19/122 [00:00<00:00, 187.83it/s]
375
  31%|###1 | 38/122 [00:00<00:00, 164.03it/s]
376
  31%|###1 | 38/122 [00:00<00:00, 164.03it/s]
377
  45%|####5 | 55/122 [00:00<00:00, 161.12it/s]
378
  45%|####5 | 55/122 [00:00<00:00, 161.12it/s]
379
+
380
+ - Found 122 videos
381
+ Bucket sizes for /app/ai-toolkit/datasets/73:
382
+ 576x416: 104 files
383
+ 576x448: 6 files
384
+ 672x384: 12 files
385
+ 3 buckets made
386
+ Caching latents for /app/ai-toolkit/datasets/73
387
+ - Saving latents to disk
388
+
389
+
390
+ Caching text_embeddings for /app/ai-toolkit/datasets/73
391
+ - Saving text embeddings to disk
392
+
393
+
394
+ Dataset: /app/ai-toolkit/datasets/81
395
+ - Preprocessing video dimensions
396
+
397
  0%| | 0/2 [00:00<?, ?it/s]
398
  0%| | 0/2 [00:00<?, ?it/s]
399
+
400
+ - Found 2 videos
401
+ Bucket sizes for /app/ai-toolkit/datasets/81:
402
+ 576x416: 2 files
403
+ 1 buckets made
404
+ Caching latents for /app/ai-toolkit/datasets/81
405
+ - Saving latents to disk
406
+
407
+
408
+ Caching text_embeddings for /app/ai-toolkit/datasets/81
409
+ - Saving text embeddings to disk
410
+
411
+
412
+ Dataset: /app/ai-toolkit/datasets/89
413
+ - Preprocessing video dimensions
414
+
415
  0%| | 0/4 [00:00<?, ?it/s]
416
  0%| | 0/4 [00:00<?, ?it/s]
417
+
418
+ - Found 4 videos
419
+ Bucket sizes for /app/ai-toolkit/datasets/89:
420
+ 576x416: 4 files
421
+ 1 buckets made
422
+ Caching latents for /app/ai-toolkit/datasets/89
423
+ - Saving latents to disk
424
+
425
+
426
+ Caching text_embeddings for /app/ai-toolkit/datasets/89
427
+ - Saving text embeddings to disk
428
+
429
+
430
+ Dataset: /app/ai-toolkit/datasets/97
431
+ - Preprocessing video dimensions
432
+
433
  0%| | 0/58 [00:00<?, ?it/s]
434
  0%| | 0/58 [00:00<?, ?it/s]
435
  26%|##5 | 15/58 [00:00<00:00, 146.08it/s]
436
  26%|##5 | 15/58 [00:00<00:00, 146.08it/s]
437
+
438
+ - Found 58 videos
439
+ Bucket sizes for /app/ai-toolkit/datasets/97:
440
+ 576x416: 46 files
441
+ 672x384: 4 files
442
+ 576x448: 8 files
443
+ 3 buckets made
444
+ Caching latents for /app/ai-toolkit/datasets/97
445
+ - Saving latents to disk
446
+
447
+
448
+ Caching text_embeddings for /app/ai-toolkit/datasets/97
449
+ - Saving text embeddings to disk
450
+
451
+
452
+ Dataset: /app/ai-toolkit/datasets/images
453
+ - Preprocessing image dimensions
454
+
455
  0%| | 0/47 [00:00<?, ?it/s]
456
  0%| | 0/47 [00:00<?, ?it/s]
457
  70%|####### | 33/47 [00:00<00:00, 329.71it/s]
458
  70%|####### | 33/47 [00:00<00:00, 329.71it/s]
459
+
460
+ - Found 47 images
461
+ Bucket sizes for /app/ai-toolkit/datasets/images:
462
+ 512x512: 46 files
463
+ 576x416: 1 files
464
+ 2 buckets made
465
+ Caching latents for /app/ai-toolkit/datasets/images
466
+ - Saving latents to disk
467
+
468
+
469
+ Caching text_embeddings for /app/ai-toolkit/datasets/images
470
+ - Saving text embeddings to disk
471
+
472
+
473
+ Dataset: /app/ai-toolkit/datasets/images
474
+ - Preprocessing image dimensions
475
+
476
  0%| | 0/47 [00:00<?, ?it/s]
477
  0%| | 0/47 [00:00<?, ?it/s]
478
+
479
+ - Found 47 images
480
+ Bucket sizes for /app/ai-toolkit/datasets/images:
481
+ 512x512: 39 files
482
+ 768x768: 7 files
483
+ 864x608: 1 files
484
+ 3 buckets made
485
+ Caching latents for /app/ai-toolkit/datasets/images
486
+ - Saving latents to disk
487
+
488
+
489
+ Caching text_embeddings for /app/ai-toolkit/datasets/images
490
+ - Saving text embeddings to disk
491
+
492
+
493
+ Caching embeddings and unloading text encoder
494
+
495
+ ***** UNLOADING TEXT ENCODER *****
496
+ Embeddings cached to disk. We dont need the text encoder anymore
497
+ ***********************************
498
+
loss_log.db ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c458df4ee077dc800fab502699c92766a5727ee41dbaff2e7fa45883484b006
3
+ size 2482176
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3f825b0eee730ea333c1974d79d7c8bfe0ae347a73cf8d2d7c8e3009e865090
3
+ size 626683383
pid.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ 504