ms13d committed on
Commit
b69f3f8
·
verified ·
1 Parent(s): 50ae7f1

Add files using upload-large-folder tool

Browse files
.gitattributes CHANGED
@@ -33,3 +33,10 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ samples/1771653011691__000000250_0.webp filter=lfs diff=lfs merge=lfs -text
37
+ samples/1771653850701__000000500_0.jpg filter=lfs diff=lfs merge=lfs -text
38
+ samples/1771654478072__000000750_0.jpg filter=lfs diff=lfs merge=lfs -text
39
+ samples/1771655093289__000001000_0.jpg filter=lfs diff=lfs merge=lfs -text
40
+ samples/1771655711953__000001250_0.jpg filter=lfs diff=lfs merge=lfs -text
41
+ loss_log.db filter=lfs diff=lfs merge=lfs -text
42
+ loss_log.db-wal filter=lfs diff=lfs merge=lfs -text
.job_config.json ADDED
@@ -0,0 +1,133 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "job": "extension",
3
+ "config": {
4
+ "name": "lana-lora-wan2.2",
5
+ "process": [
6
+ {
7
+ "type": "diffusion_trainer",
8
+ "training_folder": "/root/lab/ai-toolkit/output",
9
+ "sqlite_db_path": "/root/lab/ai-toolkit/aitk_db.db",
10
+ "device": "cuda",
11
+ "trigger_word": "l4n4lux",
12
+ "performance_log_every": 10,
13
+ "network": {
14
+ "type": "lora",
15
+ "linear": 64,
16
+ "linear_alpha": 64,
17
+ "conv": 16,
18
+ "conv_alpha": 16,
19
+ "lokr_full_rank": true,
20
+ "lokr_factor": -1,
21
+ "network_kwargs": {
22
+ "ignore_if_contains": []
23
+ }
24
+ },
25
+ "save": {
26
+ "dtype": "bf16",
27
+ "save_every": 250,
28
+ "max_step_saves_to_keep": 4,
29
+ "save_format": "diffusers",
30
+ "push_to_hub": false
31
+ },
32
+ "datasets": [
33
+ {
34
+ "folder_path": "/root/lab/ai-toolkit/datasets/lana",
35
+ "mask_path": null,
36
+ "mask_min_value": 0.1,
37
+ "default_caption": "l4n4lux",
38
+ "caption_ext": "txt",
39
+ "caption_dropout_rate": 0.05,
40
+ "cache_latents_to_disk": false,
41
+ "is_reg": false,
42
+ "network_weight": 1,
43
+ "resolution": [
44
+ 512,
45
+ 768,
46
+ 1024
47
+ ],
48
+ "controls": [],
49
+ "shrink_video_to_frames": true,
50
+ "num_frames": 1,
51
+ "flip_x": false,
52
+ "flip_y": false,
53
+ "num_repeats": 1
54
+ }
55
+ ],
56
+ "train": {
57
+ "batch_size": 1,
58
+ "bypass_guidance_embedding": false,
59
+ "steps": 5000,
60
+ "gradient_accumulation": 1,
61
+ "train_unet": true,
62
+ "train_text_encoder": false,
63
+ "gradient_checkpointing": true,
64
+ "noise_scheduler": "flowmatch",
65
+ "optimizer": "adamw8bit",
66
+ "timestep_type": "sigmoid",
67
+ "content_or_style": "balanced",
68
+ "optimizer_params": {
69
+ "weight_decay": 0.0001
70
+ },
71
+ "unload_text_encoder": false,
72
+ "cache_text_embeddings": false,
73
+ "lr": 0.0001,
74
+ "ema_config": {
75
+ "use_ema": false,
76
+ "ema_decay": 0.99
77
+ },
78
+ "skip_first_sample": true,
79
+ "force_first_sample": false,
80
+ "disable_sampling": false,
81
+ "dtype": "bf16",
82
+ "diff_output_preservation": true,
83
+ "diff_output_preservation_multiplier": 1,
84
+ "diff_output_preservation_class": "woman",
85
+ "switch_boundary_every": 1,
86
+ "loss_type": "mse"
87
+ },
88
+ "logging": {
89
+ "log_every": 1,
90
+ "use_ui_logger": true
91
+ },
92
+ "model": {
93
+ "name_or_path": "ai-toolkit/Wan2.2-T2V-A14B-Diffusers-bf16",
94
+ "quantize": false,
95
+ "qtype": "qfloat8",
96
+ "quantize_te": false,
97
+ "qtype_te": "qfloat8",
98
+ "arch": "wan22_14b:t2v",
99
+ "low_vram": false,
100
+ "model_kwargs": {
101
+ "train_high_noise": false,
102
+ "train_low_noise": true
103
+ },
104
+ "layer_offloading": false,
105
+ "layer_offloading_text_encoder_percent": 1,
106
+ "layer_offloading_transformer_percent": 1
107
+ },
108
+ "sample": {
109
+ "sampler": "flowmatch",
110
+ "sample_every": 250,
111
+ "width": 1024,
112
+ "height": 1024,
113
+ "samples": [
114
+ {
115
+ "prompt": "l4n4lux, woman with red hair, playing chess at the park, bomb going off in the background"
116
+ }
117
+ ],
118
+ "neg": "",
119
+ "seed": 42,
120
+ "walk_seed": true,
121
+ "guidance_scale": 4,
122
+ "sample_steps": 12,
123
+ "num_frames": 1,
124
+ "fps": 1
125
+ }
126
+ }
127
+ ]
128
+ },
129
+ "meta": {
130
+ "name": "[name]",
131
+ "version": "1.0"
132
+ }
133
+ }
config.yaml ADDED
@@ -0,0 +1,110 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ job: extension
2
+ config:
3
+ name: lana-lora-wan2.2
4
+ process:
5
+ - type: diffusion_trainer
6
+ training_folder: /root/lab/ai-toolkit/output
7
+ sqlite_db_path: /root/lab/ai-toolkit/aitk_db.db
8
+ device: cuda
9
+ trigger_word: l4n4lux
10
+ performance_log_every: 10
11
+ network:
12
+ type: lora
13
+ linear: 64
14
+ linear_alpha: 64
15
+ conv: 16
16
+ conv_alpha: 16
17
+ lokr_full_rank: true
18
+ lokr_factor: -1
19
+ network_kwargs:
20
+ ignore_if_contains: []
21
+ save:
22
+ dtype: bf16
23
+ save_every: 250
24
+ max_step_saves_to_keep: 4
25
+ save_format: diffusers
26
+ push_to_hub: false
27
+ datasets:
28
+ - folder_path: /root/lab/ai-toolkit/datasets/lana
29
+ mask_path: null
30
+ mask_min_value: 0.1
31
+ default_caption: l4n4lux
32
+ caption_ext: txt
33
+ caption_dropout_rate: 0.05
34
+ cache_latents_to_disk: false
35
+ is_reg: false
36
+ network_weight: 1
37
+ resolution:
38
+ - 512
39
+ - 768
40
+ - 1024
41
+ controls: []
42
+ shrink_video_to_frames: true
43
+ num_frames: 1
44
+ flip_x: false
45
+ flip_y: false
46
+ num_repeats: 1
47
+ train:
48
+ batch_size: 1
49
+ bypass_guidance_embedding: false
50
+ steps: 5000
51
+ gradient_accumulation: 1
52
+ train_unet: true
53
+ train_text_encoder: false
54
+ gradient_checkpointing: true
55
+ noise_scheduler: flowmatch
56
+ optimizer: adamw8bit
57
+ timestep_type: sigmoid
58
+ content_or_style: balanced
59
+ optimizer_params:
60
+ weight_decay: 0.0001
61
+ unload_text_encoder: false
62
+ cache_text_embeddings: false
63
+ lr: 0.0001
64
+ ema_config:
65
+ use_ema: false
66
+ ema_decay: 0.99
67
+ skip_first_sample: true
68
+ force_first_sample: false
69
+ disable_sampling: false
70
+ dtype: bf16
71
+ diff_output_preservation: true
72
+ diff_output_preservation_multiplier: 1
73
+ diff_output_preservation_class: woman
74
+ switch_boundary_every: 1
75
+ loss_type: mse
76
+ logging:
77
+ log_every: 1
78
+ use_ui_logger: true
79
+ model:
80
+ name_or_path: ai-toolkit/Wan2.2-T2V-A14B-Diffusers-bf16
81
+ quantize: false
82
+ qtype: qfloat8
83
+ quantize_te: false
84
+ qtype_te: qfloat8
85
+ arch: wan22_14b:t2v
86
+ low_vram: false
87
+ model_kwargs:
88
+ train_high_noise: false
89
+ train_low_noise: true
90
+ layer_offloading: false
91
+ layer_offloading_text_encoder_percent: 1
92
+ layer_offloading_transformer_percent: 1
93
+ sample:
94
+ sampler: flowmatch
95
+ sample_every: 250
96
+ width: 1024
97
+ height: 1024
98
+ samples:
99
+ - prompt: l4n4lux, woman with red hair, playing chess at the park, bomb going
100
+ off in the background
101
+ neg: ''
102
+ seed: 42
103
+ walk_seed: true
104
+ guidance_scale: 4
105
+ sample_steps: 12
106
+ num_frames: 1
107
+ fps: 1
108
+ meta:
109
+ name: lana-lora-wan2.2
110
+ version: '1.0'
lana-lora-wan2.2_000000250_low_noise.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:295dfc78dfd4ccceefb9a1d5d440a501d18834155f42f653b3e21f9b0ee103d7
3
+ size 613517200
lana-lora-wan2.2_000000500_low_noise.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fad325df2bff7abc7769a6e2844c36f267936562eb30ab65c295f9e37a33bcf
3
+ size 613517200
lana-lora-wan2.2_000000750_low_noise.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:154e76abf3332afe0fb0660fcd68ff9330ec84f482d4073faf12f8255138b586
3
+ size 613517200
lana-lora-wan2.2_000001000_low_noise.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6891f479309f36b3adac4a7e713a31460a9727a2e5a278b8b670a9ac748d81a8
3
+ size 613517200
lana-lora-wan2.2_000001250_low_noise.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13172a6d07954845b90c559d2b7428b1bbd0836587d237328c12ae7bd114744a
3
+ size 613517200
log.txt ADDED
@@ -0,0 +1,188 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
0
  0%| | 0/72 [00:00<?, ?it/s]
1
  0%| | 0/72 [00:00<?, ?it/s]
 
 
 
 
 
 
 
 
2
  0%| | 0/72 [00:00<?, ?it/s]
3
  0%| | 0/72 [00:00<?, ?it/s]
 
 
 
 
 
 
 
 
4
  0%| | 0/72 [00:00<?, ?it/s]
5
  0%| | 0/72 [00:00<?, ?it/s]
 
 
 
 
 
 
 
 
1
+ Running 1 job
2
+ {
3
+ "type": "diffusion_trainer",
4
+ "training_folder": "/root/lab/ai-toolkit/output",
5
+ "sqlite_db_path": "/root/lab/ai-toolkit/aitk_db.db",
6
+ "device": "cuda",
7
+ "trigger_word": "l4n4lux",
8
+ "performance_log_every": 10,
9
+ "network": {
10
+ "type": "lora",
11
+ "linear": 64,
12
+ "linear_alpha": 64,
13
+ "conv": 16,
14
+ "conv_alpha": 16,
15
+ "lokr_full_rank": true,
16
+ "lokr_factor": -1,
17
+ "network_kwargs": {
18
+ "ignore_if_contains": []
19
+ }
20
+ },
21
+ "save": {
22
+ "dtype": "bf16",
23
+ "save_every": 250,
24
+ "max_step_saves_to_keep": 4,
25
+ "save_format": "diffusers",
26
+ "push_to_hub": false
27
+ },
28
+ "datasets": [
29
+ {
30
+ "folder_path": "/root/lab/ai-toolkit/datasets/lana",
31
+ "mask_path": null,
32
+ "mask_min_value": 0.1,
33
+ "default_caption": "l4n4lux",
34
+ "caption_ext": "txt",
35
+ "caption_dropout_rate": 0.05,
36
+ "cache_latents_to_disk": false,
37
+ "is_reg": false,
38
+ "network_weight": 1,
39
+ "resolution": [
40
+ 512,
41
+ 768,
42
+ 1024
43
+ ],
44
+ "controls": [],
45
+ "shrink_video_to_frames": true,
46
+ "num_frames": 1,
47
+ "flip_x": false,
48
+ "flip_y": false,
49
+ "num_repeats": 1
50
+ }
51
+ ],
52
+ "train": {
53
+ "batch_size": 1,
54
+ "bypass_guidance_embedding": false,
55
+ "steps": 5000,
56
+ "gradient_accumulation": 1,
57
+ "train_unet": true,
58
+ "train_text_encoder": false,
59
+ "gradient_checkpointing": true,
60
+ "noise_scheduler": "flowmatch",
61
+ "optimizer": "adamw8bit",
62
+ "timestep_type": "sigmoid",
63
+ "content_or_style": "balanced",
64
+ "optimizer_params": {
65
+ "weight_decay": 0.0001
66
+ },
67
+ "unload_text_encoder": false,
68
+ "cache_text_embeddings": false,
69
+ "lr": 0.0001,
70
+ "ema_config": {
71
+ "use_ema": false,
72
+ "ema_decay": 0.99
73
+ },
74
+ "skip_first_sample": true,
75
+ "force_first_sample": false,
76
+ "disable_sampling": false,
77
+ "dtype": "bf16",
78
+ "diff_output_preservation": true,
79
+ "diff_output_preservation_multiplier": 1,
80
+ "diff_output_preservation_class": "woman",
81
+ "switch_boundary_every": 1,
82
+ "loss_type": "mse"
83
+ },
84
+ "logging": {
85
+ "log_every": 1,
86
+ "use_ui_logger": true
87
+ },
88
+ "model": {
89
+ "name_or_path": "ai-toolkit/Wan2.2-T2V-A14B-Diffusers-bf16",
90
+ "quantize": false,
91
+ "qtype": "qfloat8",
92
+ "quantize_te": false,
93
+ "qtype_te": "qfloat8",
94
+ "arch": "wan22_14b:t2v",
95
+ "low_vram": false,
96
+ "model_kwargs": {
97
+ "train_high_noise": false,
98
+ "train_low_noise": true
99
+ },
100
+ "layer_offloading": false,
101
+ "layer_offloading_text_encoder_percent": 1,
102
+ "layer_offloading_transformer_percent": 1
103
+ },
104
+ "sample": {
105
+ "sampler": "flowmatch",
106
+ "sample_every": 250,
107
+ "width": 1024,
108
+ "height": 1024,
109
+ "samples": [
110
+ {
111
+ "prompt": "l4n4lux, woman with red hair, playing chess at the park, bomb going off in the background"
112
+ }
113
+ ],
114
+ "neg": "",
115
+ "seed": 42,
116
+ "walk_seed": true,
117
+ "guidance_scale": 4,
118
+ "sample_steps": 12,
119
+ "num_frames": 1,
120
+ "fps": 1
121
+ }
122
+ }
123
+ Using SQLite database at /root/lab/ai-toolkit/aitk_db.db
124
+ Job ID: "765fbd95-c627-460c-a232-147504194a44"
125
+
126
+ #############################################
127
+ # Running job: lana-lora-wan2.2
128
+ #############################################
129
+
130
+
131
+ Running 1 process
132
+ Loading Wan model
133
+ Loading transformer 1
134
+
135
+
136
+ Loading transformer 2
137
+
138
+
139
+ Creating DualWanTransformer3DModel
140
+ Loading UMT5EncoderModel
141
+ You set `add_prefix_space`. The tokenizer needs to be converted from the slow tokenizers
142
+ You set `add_prefix_space`. The tokenizer needs to be converted from the slow tokenizers
143
+ Using ai-toolkit/umt5_xxl_encoder for UMT5 encoder.
144
+ `torch_dtype` is deprecated! Use `dtype` instead!
145
+ `torch_dtype` is deprecated! Use `dtype` instead!
146
+
147
+
148
+ Loading VAE
149
+ Making pipe
150
+ Preparing Model
151
+ create LoRA network. base dim (rank): 64, alpha: 64
152
+ neuron dropout: p=None, rank dropout: p=None, module dropout: p=None
153
+ apply LoRA to Conv2d with kernel size (3,3). dim (rank): 16, alpha: 16
154
+ create LoRA for Text Encoder: 0 modules.
155
+ create LoRA for U-Net: 400 modules.
156
+ enable LoRA for U-Net
157
+ #### IMPORTANT RESUMING FROM /root/lab/ai-toolkit/output/lana-lora-wan2.2/lana-lora-wan2.2_000001250_low_noise.safetensors ####
158
+ Loading from /root/lab/ai-toolkit/output/lana-lora-wan2.2/lana-lora-wan2.2_000001250_low_noise.safetensors
159
+ Missing keys: []
160
+ Found step 1250 in metadata, starting from there
161
+ Loading optimizer state from /root/lab/ai-toolkit/output/lana-lora-wan2.2/optimizer.pt
162
+ Updating optimizer LR from params
163
+ Dataset: /root/lab/ai-toolkit/datasets/lana
164
+ - Preprocessing image dimensions
165
+
166
  0%| | 0/72 [00:00<?, ?it/s]
167
  0%| | 0/72 [00:00<?, ?it/s]
168
+
169
+ - Found 72 images
170
+ Bucket sizes for /root/lab/ai-toolkit/datasets/lana:
171
+ 480x512: 72 files
172
+ 1 buckets made
173
+ Dataset: /root/lab/ai-toolkit/datasets/lana
174
+ - Preprocessing image dimensions
175
+
176
  0%| | 0/72 [00:00<?, ?it/s]
177
  0%| | 0/72 [00:00<?, ?it/s]
178
+
179
+ - Found 72 images
180
+ Bucket sizes for /root/lab/ai-toolkit/datasets/lana:
181
+ 720x768: 72 files
182
+ 1 buckets made
183
+ Dataset: /root/lab/ai-toolkit/datasets/lana
184
+ - Preprocessing image dimensions
185
+
186
  0%| | 0/72 [00:00<?, ?it/s]
187
  0%| | 0/72 [00:00<?, ?it/s]
188
+
189
+ - Found 72 images
190
+ Bucket sizes for /root/lab/ai-toolkit/datasets/lana:
191
+ 960x1024: 72 files
192
+ 1 buckets made
193
+ Skipping first sample due to config setting
194
+
logs/0_log.txt ADDED
The diff for this file is too large to render. See raw diff
 
logs/1_log.txt ADDED
The diff for this file is too large to render. See raw diff
 
loss_log.db ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbbc6e970be6c9bb7bcf44492a48f71f7c4fa8b281d2d10f6f2c1b24823717cd
3
+ size 286720
loss_log.db-shm ADDED
Binary file (32.8 kB). View file
 
loss_log.db-wal ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be17acb9131836b918f041bb52e6c7cb561e01ffb5ae345459835d7755cfd0c2
3
+ size 4120032
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbfff146829b25fb2f4752f8ae1557191bd1c03e68263780b7f10e5be0322376
3
+ size 623951333
pid.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ 29281
samples/1771653011691__000000250_0.webp ADDED

Git LFS Details

  • SHA256: 0c0e73904bae0c7604935748a0300ada08531e16b7565c9f5388b640374104e0
  • Pointer size: 132 Bytes
  • Size of remote file: 3.57 MB
samples/1771653850701__000000500_0.jpg ADDED

Git LFS Details

  • SHA256: c37f7affc34f8300d38c1f90f0b9c06464a40844765fc59c5871ebcf0f6a7bf5
  • Pointer size: 131 Bytes
  • Size of remote file: 195 kB
samples/1771654478072__000000750_0.jpg ADDED

Git LFS Details

  • SHA256: 6f6777aa78d16d4d084d14310561383ce76ce93082c18137d66446da89167a0f
  • Pointer size: 131 Bytes
  • Size of remote file: 193 kB
samples/1771655093289__000001000_0.jpg ADDED

Git LFS Details

  • SHA256: 4e917d3197476423b937772ed7a228f8351540985f6943854e98dc54fa8a519b
  • Pointer size: 131 Bytes
  • Size of remote file: 193 kB
samples/1771655711953__000001250_0.jpg ADDED

Git LFS Details

  • SHA256: 09651128aa1704658b15ccadd24963de4cdce2cda1db4ecd42571b8fae7e5984
  • Pointer size: 131 Bytes
  • Size of remote file: 196 kB