ThatDustyGuy committed on
Commit
09562b2
·
verified ·
1 Parent(s): ad807c8

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. .gitattributes +10 -0
  2. config.yaml +77 -94
  3. dlay_qwen_LoHA_v1.safetensors +3 -0
  4. dlay_qwen_LoHA_v1_000000400.safetensors +3 -0
  5. dlay_qwen_LoHA_v1_000000800.safetensors +3 -0
  6. dlay_qwen_LoHA_v1_000001200.safetensors +3 -0
  7. dlay_qwen_LoHA_v1_000001600.safetensors +3 -0
  8. dlay_qwen_LoHA_v1_000002000.safetensors +3 -0
  9. dlay_qwen_LoHA_v1_000002400.safetensors +3 -0
  10. dlay_qwen_LoHA_v1_000002800.safetensors +3 -0
  11. dlay_qwen_LoHA_v1_000003200.safetensors +3 -0
  12. dlay_qwen_LoHA_v1_000003600.safetensors +3 -0
  13. dlay_qwen_LoHA_v1_000004000.safetensors +3 -0
  14. dlay_qwen_LoHA_v1_000004400.safetensors +3 -0
  15. dlay_qwen_LoHA_v1_000004800.safetensors +3 -0
  16. dlay_qwen_LoHA_v1_000005200.safetensors +3 -0
  17. dlay_qwen_LoHA_v1_000005600.safetensors +3 -0
  18. optimizer.pt +3 -0
  19. samples/.ipynb_checkpoints/1765218798630__000000400_0-checkpoint.jpg +0 -0
  20. samples/.ipynb_checkpoints/1765218865047__000000400_1-checkpoint.jpg +0 -0
  21. samples/.ipynb_checkpoints/1765218931462__000000400_2-checkpoint.jpg +0 -0
  22. samples/.ipynb_checkpoints/1765218997859__000000400_3-checkpoint.jpg +0 -0
  23. samples/.ipynb_checkpoints/1765220474197__000000800_0-checkpoint.jpg +0 -0
  24. samples/.ipynb_checkpoints/1765220540569__000000800_1-checkpoint.jpg +0 -0
  25. samples/.ipynb_checkpoints/1765220606892__000000800_2-checkpoint.jpg +0 -0
  26. samples/.ipynb_checkpoints/1765220673236__000000800_3-checkpoint.jpg +0 -0
  27. samples/.ipynb_checkpoints/1765222149472__000001200_0-checkpoint.jpg +0 -0
  28. samples/.ipynb_checkpoints/1765222215896__000001200_1-checkpoint.jpg +0 -0
  29. samples/.ipynb_checkpoints/1765222282325__000001200_2-checkpoint.jpg +0 -0
  30. samples/.ipynb_checkpoints/1765223823090__000001600_0-checkpoint.jpg +0 -0
  31. samples/.ipynb_checkpoints/1765223889412__000001600_1-checkpoint.jpg +0 -0
  32. samples/.ipynb_checkpoints/1765223955750__000001600_2-checkpoint.jpg +0 -0
  33. samples/.ipynb_checkpoints/1765224022042__000001600_3-checkpoint.jpg +0 -0
  34. samples/.ipynb_checkpoints/1765225498116__000002000_0-checkpoint.jpg +0 -0
  35. samples/.ipynb_checkpoints/1765225564408__000002000_1-checkpoint.jpg +0 -0
  36. samples/.ipynb_checkpoints/1765225630752__000002000_2-checkpoint.jpg +0 -0
  37. samples/.ipynb_checkpoints/1765225697080__000002000_3-checkpoint.jpg +0 -0
  38. samples/.ipynb_checkpoints/1765227174744__000002400_0-checkpoint.jpg +0 -0
  39. samples/.ipynb_checkpoints/1765227241104__000002400_1-checkpoint.jpg +0 -0
  40. samples/.ipynb_checkpoints/1765227307429__000002400_2-checkpoint.jpg +0 -0
  41. samples/.ipynb_checkpoints/1765227373765__000002400_3-checkpoint.jpg +0 -0
  42. samples/.ipynb_checkpoints/1765228854014__000002800_0-checkpoint.jpg +0 -0
  43. samples/.ipynb_checkpoints/1765228920380__000002800_1-checkpoint.jpg +0 -0
  44. samples/.ipynb_checkpoints/1765229053127__000002800_3-checkpoint.jpg +3 -0
  45. samples/.ipynb_checkpoints/1765230530953__000003200_0-checkpoint.jpg +0 -0
  46. samples/.ipynb_checkpoints/1765230597235__000003200_1-checkpoint.jpg +0 -0
  47. samples/.ipynb_checkpoints/1765230663536__000003200_2-checkpoint.jpg +0 -0
  48. samples/.ipynb_checkpoints/1765230729846__000003200_3-checkpoint.jpg +0 -0
  49. samples/.ipynb_checkpoints/1765232211691__000003600_0-checkpoint.jpg +0 -0
  50. samples/.ipynb_checkpoints/1765232278040__000003600_1-checkpoint.jpg +0 -0
.gitattributes CHANGED
@@ -101,3 +101,13 @@ dlay_qwen_lora_v1/samples/1765212508678__000006800_3.jpg filter=lfs diff=lfs mer
101
  dlay_qwen_lora_v1/samples/1765214029041__000007600_3.jpg filter=lfs diff=lfs merge=lfs -text
102
  dlay_qwen_lora_v1/samples/1765214785978__000008000_3.jpg filter=lfs diff=lfs merge=lfs -text
103
  dlay_qwen_lora_v1/samples/1765215538813__000008400_3.jpg filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
101
  dlay_qwen_lora_v1/samples/1765214029041__000007600_3.jpg filter=lfs diff=lfs merge=lfs -text
102
  dlay_qwen_lora_v1/samples/1765214785978__000008000_3.jpg filter=lfs diff=lfs merge=lfs -text
103
  dlay_qwen_lora_v1/samples/1765215538813__000008400_3.jpg filter=lfs diff=lfs merge=lfs -text
104
+ samples/.ipynb_checkpoints/1765229053127__000002800_3-checkpoint.jpg filter=lfs diff=lfs merge=lfs -text
105
+ samples/.ipynb_checkpoints/1765232410784__000003600_3-checkpoint.jpg filter=lfs diff=lfs merge=lfs -text
106
+ samples/.ipynb_checkpoints/1765234085028__000004000_3-checkpoint.jpg filter=lfs diff=lfs merge=lfs -text
107
+ samples/.ipynb_checkpoints/1765235764342__000004400_3-checkpoint.jpg filter=lfs diff=lfs merge=lfs -text
108
+ samples/.ipynb_checkpoints/1765239111417__000005200_3-checkpoint.jpg filter=lfs diff=lfs merge=lfs -text
109
+ samples/1765229053127__000002800_3.jpg filter=lfs diff=lfs merge=lfs -text
110
+ samples/1765232410784__000003600_3.jpg filter=lfs diff=lfs merge=lfs -text
111
+ samples/1765234085028__000004000_3.jpg filter=lfs diff=lfs merge=lfs -text
112
+ samples/1765235764342__000004400_3.jpg filter=lfs diff=lfs merge=lfs -text
113
+ samples/1765239111417__000005200_3.jpg filter=lfs diff=lfs merge=lfs -text
config.yaml CHANGED
@@ -1,119 +1,102 @@
1
  job: extension
2
  config:
3
- name: Qwen-Image-LoKr-DLAY-v2
4
  process:
5
- - type: diffusion_trainer
6
- training_folder: /workspace/ai-toolkit/output
7
- sqlite_db_path: /workspace/ai-toolkit/aitk_db.db
8
- device: cuda
9
- trigger_word: null
10
- performance_log_every: 10
11
  network:
12
- type: lokr
13
- linear: 128
14
- linear_alpha: 64
15
- conv: 32
16
- conv_alpha: 16
17
- lokr_full_rank: true
18
- lokr_factor: 4
 
 
 
19
  network_kwargs:
20
- algo: lokr
21
- factor: 4
22
- dora_wd: true
23
- ignore_if_contains: []
24
- save:
25
- dtype: bf16
26
- save_every: 500
27
- max_step_saves_to_keep: 6
28
- save_format: safetensors
29
- push_to_hub: true
30
  datasets:
31
- - folder_path: /workspace/DLAY-1024/subject
32
- mask_path: /workspace/DLAY-1024/mask
33
- mask_min_value: 0.1
34
- default_caption: ''
35
  caption_ext: txt
36
- caption_dropout_rate: 0.05
37
- cache_latents_to_disk: false
38
- is_reg: false
39
- network_weight: 1
 
40
  resolution:
 
41
  - 1024
42
- controls: []
43
- shrink_video_to_frames: true
44
- num_frames: 1
45
- do_i2v: true
46
- flip_x: false
47
- flip_y: false
48
- control_path_1: null
49
- control_path_2: null
50
- control_path_3: null
51
  train:
52
- batch_size: 1
53
- bypass_guidance_embedding: false
54
- steps: 13000
55
  gradient_accumulation: 1
56
- train_unet: true
57
- train_text_encoder: false
58
- gradient_checkpointing: false
59
- attention_backend: _flash_3
60
- noise_scheduler: flowmatch
61
- optimizer: adamw
62
- timestep_type: weighted
63
- content_or_style: balanced
64
  optimizer_params:
 
 
 
65
  weight_decay: 0.01
66
- unload_text_encoder: false
67
- cache_text_embeddings: false
68
- lr: 0.0001
 
 
 
 
 
 
69
  ema_config:
70
- use_ema: true
71
- ema_decay: 0.99
 
 
 
 
 
 
72
  skip_first_sample: true
73
- force_first_sample: false
74
- disable_sampling: false
75
- dtype: bf16
76
- diff_output_preservation: false
77
- diff_output_preservation_multiplier: 1
78
- diff_output_preservation_class: person
79
- switch_boundary_every: 10
80
- inverted_mask_prior: true
81
- inverted_mask_prior_multiplier: 0.5
82
- loss_type: mse
83
- model:
84
- name_or_path: Qwen/Qwen-Image
85
- quantize: false
86
- qtype: qfloat8
87
- quantize_te: false
88
- qtype_te: qfloat8
89
- arch: qwen_image
90
- low_vram: false
91
- model_kwargs: {}
92
- layer_offloading: false
93
- layer_offloading_text_encoder_percent: 1
94
- layer_offloading_transformer_percent: 1
95
  sample:
96
  sampler: flowmatch
97
- sample_every: 1000
98
  width: 1024
99
  height: 1024
100
- samples:
101
- - prompt: A realistic photo of dlay man on a rocky overlook, gazing out at a
102
- sprawling forest and a winding blue river under a clear sky. Bright, direct
103
- sunlight of a summer afternoon.
104
- - prompt: Cinematic interior shot of dlay man standing in the center of the
105
- Pantheon in Rome, looking up towards the oculus. The vast, coffered dome
106
- is visible above, with light streaming in. Ornate marble floors and classical
107
- architecture surround him.
108
- - prompt: A photorealistic photo of dlay man standing behind a stone wall, looking
109
- out at the Giza pyramids in the sandy desert under a hazy sky.
110
  neg: ''
111
  seed: 42
112
  walk_seed: true
113
- guidance_scale: 4
114
  sample_steps: 25
115
- num_frames: 1
116
- fps: 1
117
  meta:
118
- name: '[DLAY-Qwen-Image--LoKr]'
119
  version: '1.0'
 
1
  job: extension
2
  config:
3
+ name: dlay_qwen_LoHA_v1
4
  process:
5
+ - type: sd_trainer
6
+ training_folder: /root/output
7
+ performance_log_every: 100
8
+ device: cuda:0
 
 
9
  network:
10
+ type: loha
11
+ linear: 64
12
+ linear_alpha: 32
13
+ dropout: 0.0
14
+ use_tucker: false
15
+ use_scalar: true
16
+ weight_decompose: true
17
+ wd_on_out: true
18
+ rs_lora: false
19
+ rank_dropout_scale: false
20
  network_kwargs:
21
+ rank_dropout: 0.02
22
+ model:
23
+ name_or_path: Qwen/Qwen-Image
24
+ arch: qwen_image
25
+ quantize: false
26
+ quantize_te: false
27
+ low_vram: false
28
+ layer_offloading: true
29
+ layer_offloading_transformer_percent: 0.99
 
30
  datasets:
31
+ - folder_path: /root/DATASETS/DLAY/flux2
 
 
 
32
  caption_ext: txt
33
+ default_caption: DLAY, a man with short dark brown hair and a slim build
34
+ mask_path: /root/DATASETS/DLAY/mask
35
+ mask_min_value: 0.0
36
+ invert_mask: false
37
+ loss_multiplier: 1.2
38
  resolution:
39
+ - 640
40
  - 1024
41
+ cache_latents: true
42
+ cache_latents_to_disk: true
43
+ cache_text_embeddings: true
44
+ cache_text_embeddings_to_disk: true
45
+ unload_text_encoder: true
46
+ caption_dropout_rate: 0.05
47
+ shuffle_tokens: false
 
 
48
  train:
49
+ batch_size: 2
 
 
50
  gradient_accumulation: 1
51
+ steps: 6000
52
+ attention_backend: flash
53
+ optimizer: prodigy
54
+ lr: 1.0
 
 
 
 
55
  optimizer_params:
56
+ d_coef: 1.5
57
+ decouple: true
58
+ use_bias_correction: true
59
  weight_decay: 0.01
60
+ safeguard_warmup: true
61
+ betas:
62
+ - 0.9
63
+ - 0.999
64
+ lr_scheduler: cosine_with_warmup
65
+ lr_scheduler_params:
66
+ num_warmup_steps: 200
67
+ num_training_steps: 6000
68
+ dtype: bf16
69
  ema_config:
70
+ use_ema: false
71
+ ema_decay: 0.9995
72
+ gradient_checkpointing: false
73
+ noise_scheduler: flowmatch
74
+ timestep_type: sigmoid
75
+ max_grad_norm: 1.0
76
+ train_unet: true
77
+ train_text_encoder: false
78
  skip_first_sample: true
79
+ save:
80
+ dtype: bfloat16
81
+ save_every: 400
82
+ save_format: safetensors
83
+ max_step_saves_to_keep: 15
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
84
  sample:
85
  sampler: flowmatch
86
+ sample_every: 400
87
  width: 1024
88
  height: 1024
89
+ prompts:
90
+ - DLAY, a man in a professional studio lighting, white background
91
+ - DLAY, a man wearing a suit, confident expression, corporate headshot
92
+ - DLAY, a man in a cinematic photo, close up, detailed skin texture, dramatic
93
+ lighting
94
+ - DLAY, a man wearing casual attire, outdoor setting, natural sunlight
 
 
 
 
95
  neg: ''
96
  seed: 42
97
  walk_seed: true
98
+ guidance_scale: 3.5
99
  sample_steps: 25
 
 
100
  meta:
101
+ name: '[DLAY-man-Qwen-Image-LoHA]'
102
  version: '1.0'
dlay_qwen_LoHA_v1.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78fcc8062ad5fd0db1481a9a05fcc3354bbeca5c9300c666cbfde54a597a40f2
3
+ size 2371152168
dlay_qwen_LoHA_v1_000000400.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17102dc1754a8afd4830b01e2cf18dbb1509e29c2c66195837a1806c9dc278ac
3
+ size 2371152160
dlay_qwen_LoHA_v1_000000800.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ad0b76ed31e8f5fdef58ece7ab394ccdbc9d78a2336288fcf2063c070d48580
3
+ size 2371152160
dlay_qwen_LoHA_v1_000001200.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7cb659fbd8edbf05ee515a5df4d341d239d0eaba438a75adfda416dcc5ba61b2
3
+ size 2371152168
dlay_qwen_LoHA_v1_000001600.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0e07c0660c7e59846b2defb9ab061ad7e7d54a8cecc4f26fd6fd764f3c29d64
3
+ size 2371152168
dlay_qwen_LoHA_v1_000002000.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f40af4d10d5eead0143cb7165e4b9acecacfe07ef09113fa08f6f960a5254df
3
+ size 2371152168
dlay_qwen_LoHA_v1_000002400.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e5398aaeb550fbba7509b5ca9fbbe3b187fe4c9b915dacf0f3255326f02b9c7
3
+ size 2371152168
dlay_qwen_LoHA_v1_000002800.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b48b62cba199d238bf1e32d22494fa5205c4335480c0147407f3019b14b0cdd
3
+ size 2371152168
dlay_qwen_LoHA_v1_000003200.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1653543068554963818136ae4ca0d6dbb8a9eea19c1351a940fa73c7a62fc310
3
+ size 2371152168
dlay_qwen_LoHA_v1_000003600.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b6f7685003b5069232a2cb08ad269a84f8e79712eb179fcb7bc4ca525a5c80a
3
+ size 2371152168
dlay_qwen_LoHA_v1_000004000.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33a68017b2e24df507cd72bcc9ba1ff98c7efd3d7f42a01a05b2c83f74626b3e
3
+ size 2371152168
dlay_qwen_LoHA_v1_000004400.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f640b07ac25c4f157e405de547b3f8ee0d8079226d931812258fdbf46bf2e2b
3
+ size 2371152168
dlay_qwen_LoHA_v1_000004800.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3352e1331ae392c865e44cb65a72a1ef671e0edadfd8bf95bcc40613c30e5d07
3
+ size 2371152168
dlay_qwen_LoHA_v1_000005200.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5314a9fcc2e35aa9fe9b65e64f4edff04e4f0f27ef00556bbe73b352fd458138
3
+ size 2371152168
dlay_qwen_LoHA_v1_000005600.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5532d29aec89ff9fb2db45a57d6616210b44bf4c18253deda4ea7507eeee0d93
3
+ size 2371152168
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5e403d95d9c98ac08b1d0b29a348a12d8e362edfcd56308f8581822885edfc9
3
+ size 18893089275
samples/.ipynb_checkpoints/1765218798630__000000400_0-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765218865047__000000400_1-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765218931462__000000400_2-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765218997859__000000400_3-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765220474197__000000800_0-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765220540569__000000800_1-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765220606892__000000800_2-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765220673236__000000800_3-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765222149472__000001200_0-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765222215896__000001200_1-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765222282325__000001200_2-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765223823090__000001600_0-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765223889412__000001600_1-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765223955750__000001600_2-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765224022042__000001600_3-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765225498116__000002000_0-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765225564408__000002000_1-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765225630752__000002000_2-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765225697080__000002000_3-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765227174744__000002400_0-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765227241104__000002400_1-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765227307429__000002400_2-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765227373765__000002400_3-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765228854014__000002800_0-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765228920380__000002800_1-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765229053127__000002800_3-checkpoint.jpg ADDED

Git LFS Details

  • SHA256: a292c9819383444751392198687c5c970b05274bbb4e3432b577bf52650fadad
  • Pointer size: 131 Bytes
  • Size of remote file: 101 kB
samples/.ipynb_checkpoints/1765230530953__000003200_0-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765230597235__000003200_1-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765230663536__000003200_2-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765230729846__000003200_3-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765232211691__000003600_0-checkpoint.jpg ADDED
samples/.ipynb_checkpoints/1765232278040__000003600_1-checkpoint.jpg ADDED