TheMindExpansionNetwork committed on
Commit
0b4a4dd
·
verified ·
1 Parent(s): aa3ecf4

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. .gitattributes +4 -0
  2. .job_config.json +135 -0
  3. config.yaml +126 -0
  4. hash_cache_v1.safetensors +3 -0
  5. hash_cache_v1_000002000.safetensors +3 -0
  6. hash_cache_v1_000002250.safetensors +3 -0
  7. hash_cache_v1_000002500.safetensors +3 -0
  8. hash_cache_v1_000002750.safetensors +3 -0
  9. log.txt +0 -0
  10. optimizer.pt +3 -0
  11. pid.txt +1 -0
  12. samples/1763244777125__000000000_0.jpg +0 -0
  13. samples/1763244847638__000000000_1.jpg +0 -0
  14. samples/1763244918161__000000000_2.jpg +0 -0
  15. samples/1763244989127__000000000_3.jpg +0 -0
  16. samples/1763245869172__000000250_0.jpg +0 -0
  17. samples/1763245941492__000000250_1.jpg +0 -0
  18. samples/1763246013882__000000250_2.jpg +0 -0
  19. samples/1763246086279__000000250_3.jpg +0 -0
  20. samples/1763246958297__000000500_0.jpg +0 -0
  21. samples/1763247030518__000000500_1.jpg +0 -0
  22. samples/1763247102833__000000500_2.jpg +0 -0
  23. samples/1763247175174__000000500_3.jpg +0 -0
  24. samples/1763248036622__000000750_0.jpg +0 -0
  25. samples/1763248108868__000000750_1.jpg +0 -0
  26. samples/1763248181412__000000750_2.jpg +0 -0
  27. samples/1763248253941__000000750_3.jpg +0 -0
  28. samples/1763249132486__000001000_0.jpg +0 -0
  29. samples/1763249204958__000001000_1.jpg +0 -0
  30. samples/1763249277546__000001000_2.jpg +0 -0
  31. samples/1763249349926__000001000_3.jpg +0 -0
  32. samples/1763250220760__000001250_0.jpg +0 -0
  33. samples/1763250293230__000001250_1.jpg +0 -0
  34. samples/1763250365742__000001250_2.jpg +0 -0
  35. samples/1763250438055__000001250_3.jpg +0 -0
  36. samples/1763251300994__000001500_0.jpg +0 -0
  37. samples/1763251373348__000001500_1.jpg +0 -0
  38. samples/1763251445767__000001500_2.jpg +0 -0
  39. samples/1763251518184__000001500_3.jpg +0 -0
  40. samples/1763252388902__000001750_0.jpg +0 -0
  41. samples/1763252461313__000001750_1.jpg +0 -0
  42. samples/1763252533715__000001750_2.jpg +0 -0
  43. samples/1763252606026__000001750_3.jpg +0 -0
  44. samples/1763253487029__000002000_0.jpg +0 -0
  45. samples/1763253559402__000002000_1.jpg +0 -0
  46. samples/1763253631997__000002000_2.jpg +0 -0
  47. samples/1763253704491__000002000_3.jpg +0 -0
  48. samples/1763254572411__000002250_0.jpg +0 -0
  49. samples/1763254644904__000002250_1.jpg +0 -0
  50. samples/1763254717481__000002250_2.jpg +3 -0
.gitattributes CHANGED
@@ -33,3 +33,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ samples/1763254717481__000002250_2.jpg filter=lfs diff=lfs merge=lfs -text
37
+ samples/1763255798300__000002500_2.jpg filter=lfs diff=lfs merge=lfs -text
38
+ samples/1763256921963__000002750_2.jpg filter=lfs diff=lfs merge=lfs -text
39
+ samples/1763258006174__000003000_2.jpg filter=lfs diff=lfs merge=lfs -text
.job_config.json ADDED
@@ -0,0 +1,135 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "job": "extension",
3
+ "config": {
4
+ "name": "hash_cache_v1",
5
+ "process": [
6
+ {
7
+ "type": "diffusion_trainer",
8
+ "training_folder": "/app/ai-toolkit/output",
9
+ "sqlite_db_path": "/app/ai-toolkit/aitk_db.db",
10
+ "device": "cuda",
11
+ "trigger_word": null,
12
+ "performance_log_every": 10,
13
+ "network": {
14
+ "type": "lora",
15
+ "linear": 32,
16
+ "linear_alpha": 32,
17
+ "conv": 16,
18
+ "conv_alpha": 16,
19
+ "lokr_full_rank": true,
20
+ "lokr_factor": -1,
21
+ "network_kwargs": {
22
+ "ignore_if_contains": []
23
+ }
24
+ },
25
+ "save": {
26
+ "dtype": "bf16",
27
+ "save_every": 250,
28
+ "max_step_saves_to_keep": 4,
29
+ "save_format": "diffusers",
30
+ "push_to_hub": false
31
+ },
32
+ "datasets": [
33
+ {
34
+ "folder_path": "/app/ai-toolkit/datasets/hash_cache",
35
+ "mask_path": null,
36
+ "mask_min_value": 0.1,
37
+ "default_caption": "",
38
+ "caption_ext": "txt",
39
+ "caption_dropout_rate": 0.05,
40
+ "cache_latents_to_disk": false,
41
+ "is_reg": false,
42
+ "network_weight": 1,
43
+ "resolution": [
44
+ 512,
45
+ 768,
46
+ 1024
47
+ ],
48
+ "controls": [],
49
+ "shrink_video_to_frames": true,
50
+ "num_frames": 1,
51
+ "do_i2v": true,
52
+ "flip_x": false,
53
+ "flip_y": false
54
+ }
55
+ ],
56
+ "train": {
57
+ "batch_size": 1,
58
+ "bypass_guidance_embedding": false,
59
+ "steps": 3000,
60
+ "gradient_accumulation": 1,
61
+ "train_unet": true,
62
+ "train_text_encoder": false,
63
+ "gradient_checkpointing": true,
64
+ "noise_scheduler": "flowmatch",
65
+ "optimizer": "adamw8bit",
66
+ "timestep_type": "weighted",
67
+ "content_or_style": "balanced",
68
+ "optimizer_params": {
69
+ "weight_decay": 0.0001
70
+ },
71
+ "unload_text_encoder": false,
72
+ "cache_text_embeddings": false,
73
+ "lr": 0.0001,
74
+ "ema_config": {
75
+ "use_ema": false,
76
+ "ema_decay": 0.99
77
+ },
78
+ "skip_first_sample": false,
79
+ "force_first_sample": false,
80
+ "disable_sampling": false,
81
+ "dtype": "bf16",
82
+ "diff_output_preservation": false,
83
+ "diff_output_preservation_multiplier": 1,
84
+ "diff_output_preservation_class": "person",
85
+ "switch_boundary_every": 1,
86
+ "loss_type": "mse"
87
+ },
88
+ "model": {
89
+ "name_or_path": "Qwen/Qwen-Image",
90
+ "quantize": true,
91
+ "qtype": "qfloat8",
92
+ "quantize_te": true,
93
+ "qtype_te": "qfloat8",
94
+ "arch": "qwen_image",
95
+ "low_vram": true,
96
+ "model_kwargs": {},
97
+ "layer_offloading": false,
98
+ "layer_offloading_text_encoder_percent": 1,
99
+ "layer_offloading_transformer_percent": 1
100
+ },
101
+ "sample": {
102
+ "sampler": "flowmatch",
103
+ "sample_every": 250,
104
+ "width": 1024,
105
+ "height": 1024,
106
+ "samples": [
107
+ {
108
+ "prompt": "Two adult people sitting side-by-side on a couch in a simple room, full bodies fully visible in frame. Neutral lighting, no stylization, no dramatic poses. Both figures look forward calmly with relaxed posture, hands resting naturally. The background is minimal and uncluttered, with a plain wall, soft shadows and a low-table in front. No neon, no props — just clean, natural photographic realism."
109
+ },
110
+ {
111
+ "prompt": "Two adults slightly slouched on a couch, clearly drunk but not cartoonish: relaxed posture, unfocused expressions, leaning into each other casually. Full bodies visible. The room is dim but neutral in tone, with soft warm lighting, subtle background blur and no dramatic color effects. A few bottles or cans on a table in front for context, but environment remains minimal and clean."
112
+ },
113
+ {
114
+ "prompt": "A clean black-and-white line-art drawing of two people sitting on a couch, full bodies visible, simple outlines with minimal shading. Smooth, consistent linework, no stylization like anime or comic — neutral sketchbook quality. Background lightly suggested with simple lines for the couch and wall. No color, no text, no shadows — pure structural line drawing."
115
+ },
116
+ {
117
+ "prompt": "Two human silhouettes sitting on a couch, shown as solid matte shapes with no internal details. Full bodies visible, clean side-by-side posture. The couch is a simple silhouette shape as well. Background is blank white. No shading, no texture — pure flat graphical silhouette intended only for pose and composition reference."
118
+ }
119
+ ],
120
+ "neg": "",
121
+ "seed": 42,
122
+ "walk_seed": true,
123
+ "guidance_scale": 4,
124
+ "sample_steps": 25,
125
+ "num_frames": 1,
126
+ "fps": 1
127
+ }
128
+ }
129
+ ]
130
+ },
131
+ "meta": {
132
+ "name": "[name]",
133
+ "version": "1.0"
134
+ }
135
+ }
config.yaml ADDED
@@ -0,0 +1,126 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ job: extension
2
+ config:
3
+ name: hash_cache_v1
4
+ process:
5
+ - type: diffusion_trainer
6
+ training_folder: /app/ai-toolkit/output
7
+ sqlite_db_path: /app/ai-toolkit/aitk_db.db
8
+ device: cuda
9
+ trigger_word: null
10
+ performance_log_every: 10
11
+ network:
12
+ type: lora
13
+ linear: 32
14
+ linear_alpha: 32
15
+ conv: 16
16
+ conv_alpha: 16
17
+ lokr_full_rank: true
18
+ lokr_factor: -1
19
+ network_kwargs:
20
+ ignore_if_contains: []
21
+ save:
22
+ dtype: bf16
23
+ save_every: 250
24
+ max_step_saves_to_keep: 4
25
+ save_format: diffusers
26
+ push_to_hub: false
27
+ datasets:
28
+ - folder_path: /app/ai-toolkit/datasets/hash_cache
29
+ mask_path: null
30
+ mask_min_value: 0.1
31
+ default_caption: ''
32
+ caption_ext: txt
33
+ caption_dropout_rate: 0.05
34
+ cache_latents_to_disk: false
35
+ is_reg: false
36
+ network_weight: 1
37
+ resolution:
38
+ - 512
39
+ - 768
40
+ - 1024
41
+ controls: []
42
+ shrink_video_to_frames: true
43
+ num_frames: 1
44
+ do_i2v: true
45
+ flip_x: false
46
+ flip_y: false
47
+ train:
48
+ batch_size: 1
49
+ bypass_guidance_embedding: false
50
+ steps: 3000
51
+ gradient_accumulation: 1
52
+ train_unet: true
53
+ train_text_encoder: false
54
+ gradient_checkpointing: true
55
+ noise_scheduler: flowmatch
56
+ optimizer: adamw8bit
57
+ timestep_type: weighted
58
+ content_or_style: balanced
59
+ optimizer_params:
60
+ weight_decay: 0.0001
61
+ unload_text_encoder: false
62
+ cache_text_embeddings: false
63
+ lr: 0.0001
64
+ ema_config:
65
+ use_ema: false
66
+ ema_decay: 0.99
67
+ skip_first_sample: false
68
+ force_first_sample: false
69
+ disable_sampling: false
70
+ dtype: bf16
71
+ diff_output_preservation: false
72
+ diff_output_preservation_multiplier: 1
73
+ diff_output_preservation_class: person
74
+ switch_boundary_every: 1
75
+ loss_type: mse
76
+ model:
77
+ name_or_path: Qwen/Qwen-Image
78
+ quantize: true
79
+ qtype: qfloat8
80
+ quantize_te: true
81
+ qtype_te: qfloat8
82
+ arch: qwen_image
83
+ low_vram: true
84
+ model_kwargs: {}
85
+ layer_offloading: false
86
+ layer_offloading_text_encoder_percent: 1
87
+ layer_offloading_transformer_percent: 1
88
+ sample:
89
+ sampler: flowmatch
90
+ sample_every: 250
91
+ width: 1024
92
+ height: 1024
93
+ samples:
94
+ - prompt: "Two adult people sitting side-by-side on a couch in a simple room,\
95
+ \ full bodies fully visible in frame. Neutral lighting, no stylization,\
96
+ \ no dramatic poses. Both figures look forward calmly with relaxed posture,\
97
+ \ hands resting naturally. The background is minimal and uncluttered, with\
98
+ \ a plain wall, soft shadows and a low-table in front. No neon, no props\
99
+ \ \u2014 just clean, natural photographic realism."
100
+ - prompt: 'Two adults slightly slouched on a couch, clearly drunk but not cartoonish:
101
+ relaxed posture, unfocused expressions, leaning into each other casually.
102
+ Full bodies visible. The room is dim but neutral in tone, with soft warm
103
+ lighting, subtle background blur and no dramatic color effects. A few bottles
104
+ or cans on a table in front for context, but environment remains minimal
105
+ and clean.'
106
+ - prompt: "A clean black-and-white line-art drawing of two people sitting on\
107
+ \ a couch, full bodies visible, simple outlines with minimal shading. Smooth,\
108
+ \ consistent linework, no stylization like anime or comic \u2014 neutral\
109
+ \ sketchbook quality. Background lightly suggested with simple lines for\
110
+ \ the couch and wall. No color, no text, no shadows \u2014 pure structural\
111
+ \ line drawing."
112
+ - prompt: "Two human silhouettes sitting on a couch, shown as solid matte shapes\
113
+ \ with no internal details. Full bodies visible, clean side-by-side posture.\
114
+ \ The couch is a simple silhouette shape as well. Background is blank white.\
115
+ \ No shading, no texture \u2014 pure flat graphical silhouette intended\
116
+ \ only for pose and composition reference."
117
+ neg: ''
118
+ seed: 42
119
+ walk_seed: true
120
+ guidance_scale: 4
121
+ sample_steps: 25
122
+ num_frames: 1
123
+ fps: 1
124
+ meta:
125
+ name: hash_cache_v1
126
+ version: '1.0'
hash_cache_v1.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fcdab1bbb2b305363d034d30f885bca6d3f67b3685706475ae5b974c2b04fe1d
3
+ size 590058824
hash_cache_v1_000002000.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdff1eca1644da954b2c5c379e3f6299159bcb0596d7183d00eae51ee9454686
3
+ size 590058824
hash_cache_v1_000002250.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1858da18ebec668624a740d2379e6eca19aafcff049df96538a11a52ea71f7bb
3
+ size 590058824
hash_cache_v1_000002500.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:377cc623a5abbfb75d6372091f464440633a651d75c62f27ea0ac56851ea2aab
3
+ size 590058824
hash_cache_v1_000002750.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3516f980a2c016976faed96bf9f8c21e9f4dace8e6e1849839bac2edd8db6e2b
3
+ size 590058824
log.txt ADDED
The diff for this file is too large to render. See raw diff
 
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fee356929b2770853d09f29520173ebbd992d7526f690e6db892525045550ed0
3
+ size 598613389
pid.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ 343
samples/1763244777125__000000000_0.jpg ADDED
samples/1763244847638__000000000_1.jpg ADDED
samples/1763244918161__000000000_2.jpg ADDED
samples/1763244989127__000000000_3.jpg ADDED
samples/1763245869172__000000250_0.jpg ADDED
samples/1763245941492__000000250_1.jpg ADDED
samples/1763246013882__000000250_2.jpg ADDED
samples/1763246086279__000000250_3.jpg ADDED
samples/1763246958297__000000500_0.jpg ADDED
samples/1763247030518__000000500_1.jpg ADDED
samples/1763247102833__000000500_2.jpg ADDED
samples/1763247175174__000000500_3.jpg ADDED
samples/1763248036622__000000750_0.jpg ADDED
samples/1763248108868__000000750_1.jpg ADDED
samples/1763248181412__000000750_2.jpg ADDED
samples/1763248253941__000000750_3.jpg ADDED
samples/1763249132486__000001000_0.jpg ADDED
samples/1763249204958__000001000_1.jpg ADDED
samples/1763249277546__000001000_2.jpg ADDED
samples/1763249349926__000001000_3.jpg ADDED
samples/1763250220760__000001250_0.jpg ADDED
samples/1763250293230__000001250_1.jpg ADDED
samples/1763250365742__000001250_2.jpg ADDED
samples/1763250438055__000001250_3.jpg ADDED
samples/1763251300994__000001500_0.jpg ADDED
samples/1763251373348__000001500_1.jpg ADDED
samples/1763251445767__000001500_2.jpg ADDED
samples/1763251518184__000001500_3.jpg ADDED
samples/1763252388902__000001750_0.jpg ADDED
samples/1763252461313__000001750_1.jpg ADDED
samples/1763252533715__000001750_2.jpg ADDED
samples/1763252606026__000001750_3.jpg ADDED
samples/1763253487029__000002000_0.jpg ADDED
samples/1763253559402__000002000_1.jpg ADDED
samples/1763253631997__000002000_2.jpg ADDED
samples/1763253704491__000002000_3.jpg ADDED
samples/1763254572411__000002250_0.jpg ADDED
samples/1763254644904__000002250_1.jpg ADDED
samples/1763254717481__000002250_2.jpg ADDED

Git LFS Details

  • SHA256: 6eb246e107006452e04065303f3d32a1e0cd3ab010512fc269e7ccae0884cd29
  • Pointer size: 131 Bytes
  • Size of remote file: 104 kB