GiRLaZo committed on
Commit
8b1effe
·
verified ·
1 Parent(s): 64c6af6

Upload folder using huggingface_hub

Browse files
Files changed (30) hide show
  1. .gitattributes +21 -0
  2. README.md +33 -0
  3. dataset.toml +14 -0
  4. sample/voicemod-key-lora_000144_00_20250202171752.png +3 -0
  5. sample/voicemod-key-lora_000288_00_20250202172504.png +3 -0
  6. sample/voicemod-key-lora_000432_00_20250202173214.png +3 -0
  7. sample/voicemod-key-lora_000576_00_20250202173925.png +3 -0
  8. sample/voicemod-key-lora_000720_00_20250202174635.png +3 -0
  9. sample/voicemod-key-lora_000864_00_20250202175346.png +3 -0
  10. sample/voicemod-key-lora_001008_00_20250202180056.png +3 -0
  11. sample/voicemod-key-lora_001152_00_20250202180806.png +3 -0
  12. sample/voicemod-key-lora_001296_00_20250202181517.png +3 -0
  13. sample/voicemod-key-lora_001440_00_20250202182227.png +3 -0
  14. sample/voicemod-key-lora_001584_00_20250202182937.png +3 -0
  15. sample/voicemod-key-lora_001728_00_20250202183647.png +3 -0
  16. sample/voicemod-key-lora_001872_00_20250202184357.png +3 -0
  17. sample/voicemod-key-lora_002016_00_20250202185107.png +3 -0
  18. sample/voicemod-key-lora_002160_00_20250202185817.png +3 -0
  19. sample/voicemod-key-lora_002304_00_20250202190528.png +3 -0
  20. sample/voicemod-key-lora_002448_00_20250202191239.png +3 -0
  21. sample/voicemod-key-lora_002592_00_20250202191949.png +3 -0
  22. sample/voicemod-key-lora_002736_00_20250202192659.png +3 -0
  23. sample/voicemod-key-lora_002880_00_20250202193409.png +3 -0
  24. sample/voicemod-key-lora_003024_00_20250202194120.png +3 -0
  25. sample_prompts.txt +1 -0
  26. train.sh +34 -0
  27. voicemod-key-lora-000004.safetensors +3 -0
  28. voicemod-key-lora-000008.safetensors +3 -0
  29. voicemod-key-lora-000012.safetensors +3 -0
  30. voicemod-key-lora.safetensors +3 -0
.gitattributes CHANGED
@@ -33,3 +33,24 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ sample/voicemod-key-lora_000144_00_20250202171752.png filter=lfs diff=lfs merge=lfs -text
37
+ sample/voicemod-key-lora_000288_00_20250202172504.png filter=lfs diff=lfs merge=lfs -text
38
+ sample/voicemod-key-lora_000432_00_20250202173214.png filter=lfs diff=lfs merge=lfs -text
39
+ sample/voicemod-key-lora_000576_00_20250202173925.png filter=lfs diff=lfs merge=lfs -text
40
+ sample/voicemod-key-lora_000720_00_20250202174635.png filter=lfs diff=lfs merge=lfs -text
41
+ sample/voicemod-key-lora_000864_00_20250202175346.png filter=lfs diff=lfs merge=lfs -text
42
+ sample/voicemod-key-lora_001008_00_20250202180056.png filter=lfs diff=lfs merge=lfs -text
43
+ sample/voicemod-key-lora_001152_00_20250202180806.png filter=lfs diff=lfs merge=lfs -text
44
+ sample/voicemod-key-lora_001296_00_20250202181517.png filter=lfs diff=lfs merge=lfs -text
45
+ sample/voicemod-key-lora_001440_00_20250202182227.png filter=lfs diff=lfs merge=lfs -text
46
+ sample/voicemod-key-lora_001584_00_20250202182937.png filter=lfs diff=lfs merge=lfs -text
47
+ sample/voicemod-key-lora_001728_00_20250202183647.png filter=lfs diff=lfs merge=lfs -text
48
+ sample/voicemod-key-lora_001872_00_20250202184357.png filter=lfs diff=lfs merge=lfs -text
49
+ sample/voicemod-key-lora_002016_00_20250202185107.png filter=lfs diff=lfs merge=lfs -text
50
+ sample/voicemod-key-lora_002160_00_20250202185817.png filter=lfs diff=lfs merge=lfs -text
51
+ sample/voicemod-key-lora_002304_00_20250202190528.png filter=lfs diff=lfs merge=lfs -text
52
+ sample/voicemod-key-lora_002448_00_20250202191239.png filter=lfs diff=lfs merge=lfs -text
53
+ sample/voicemod-key-lora_002592_00_20250202191949.png filter=lfs diff=lfs merge=lfs -text
54
+ sample/voicemod-key-lora_002736_00_20250202192659.png filter=lfs diff=lfs merge=lfs -text
55
+ sample/voicemod-key-lora_002880_00_20250202193409.png filter=lfs diff=lfs merge=lfs -text
56
+ sample/voicemod-key-lora_003024_00_20250202194120.png filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - text-to-image
4
+ - flux
5
+ - lora
6
+ - diffusers
7
+ - template:sd-lora
8
+ - fluxgym
9
+ widget:
10
+ - output:
11
+     url: sample/voicemod-key-lora_003024_00_20250202194120.png
12
+   text: v01c3m0dk3y
13
+ base_model: black-forest-labs/FLUX.1-dev
14
+ instance_prompt: v01c3m0dk3y
15
+ license: other
16
+ license_name: flux-1-dev-non-commercial-license
17
+ license_link: https://huggingface.co/black-forest-labs/FLUX.1-dev/blob/main/LICENSE.md
18
+ ---
19
+
20
+ # voicemod-key-lora
21
+
22
+ A Flux LoRA trained on a local computer with [Fluxgym](https://github.com/cocktailpeanut/fluxgym)
23
+
24
+ <Gallery />
25
+
26
+ ## Trigger words
27
+
28
+ You should use `v01c3m0dk3y` to trigger the image generation.
29
+
30
+ ## Download model and use it with ComfyUI, AUTOMATIC1111, SD.Next, Invoke AI, Forge, etc.
31
+
32
+ Weights for this model are available in Safetensors format.
33
+
dataset.toml ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [general]
2
+ shuffle_caption = false
3
+ caption_extension = '.txt'
4
+ keep_tokens = 1
5
+
6
+ [[datasets]]
7
+ resolution = 1024
8
+ batch_size = 1
9
+ keep_tokens = 1
10
+
11
+ [[datasets.subsets]]
12
+ image_dir = '/workspace/fluxgym/datasets/voicemod-key-lora'
13
+ class_tokens = 'v01c3m0dk3y'
14
+ num_repeats = 10
sample/voicemod-key-lora_000144_00_20250202171752.png ADDED

Git LFS Details

  • SHA256: 7d3213442ea8ed2ca144348b4392dd12db3489d73ce38268a48a403e6070a923
  • Pointer size: 131 Bytes
  • Size of remote file: 366 kB
sample/voicemod-key-lora_000288_00_20250202172504.png ADDED

Git LFS Details

  • SHA256: 22eacc2bb6b5e047e764675f7db261fbad15062a659c41c30d605bb9e10bc730
  • Pointer size: 131 Bytes
  • Size of remote file: 391 kB
sample/voicemod-key-lora_000432_00_20250202173214.png ADDED

Git LFS Details

  • SHA256: 2eb3e8f5938f147ac03ec954d03238a00e391e6b23b17b13b758c000bf3f6ad9
  • Pointer size: 131 Bytes
  • Size of remote file: 293 kB
sample/voicemod-key-lora_000576_00_20250202173925.png ADDED

Git LFS Details

  • SHA256: 3acd953c3dff4974afe2d056d1515288a4c2a5c9315f01ac080bd51fc4b61112
  • Pointer size: 131 Bytes
  • Size of remote file: 271 kB
sample/voicemod-key-lora_000720_00_20250202174635.png ADDED

Git LFS Details

  • SHA256: a7c8e46965d2bbee0ef0d7d94e0a1340caef2887bcd33cf9b22ac1cd7f83c450
  • Pointer size: 131 Bytes
  • Size of remote file: 336 kB
sample/voicemod-key-lora_000864_00_20250202175346.png ADDED

Git LFS Details

  • SHA256: 30959398ff6c8da626d5e3a11e05e1e6bb56db9743da545c75722a817c7fd6aa
  • Pointer size: 131 Bytes
  • Size of remote file: 277 kB
sample/voicemod-key-lora_001008_00_20250202180056.png ADDED

Git LFS Details

  • SHA256: b94fd496c86eb11d99036b79067a1766ddbf96f846a3aa15804c1e1060d9bf7e
  • Pointer size: 131 Bytes
  • Size of remote file: 280 kB
sample/voicemod-key-lora_001152_00_20250202180806.png ADDED

Git LFS Details

  • SHA256: c43b0fed8c1ec95c69d565b68269135e1af9cfdabe26180b365fbc13660e7aa8
  • Pointer size: 131 Bytes
  • Size of remote file: 295 kB
sample/voicemod-key-lora_001296_00_20250202181517.png ADDED

Git LFS Details

  • SHA256: 1b5d09ef94b1cbb226503fe853e6aba2bb06c235bb0d968054eb10117799ca20
  • Pointer size: 131 Bytes
  • Size of remote file: 341 kB
sample/voicemod-key-lora_001440_00_20250202182227.png ADDED

Git LFS Details

  • SHA256: a3f713f17444de651b9ea2e8dd5309139005491bfde3d4e8f918183da8795658
  • Pointer size: 131 Bytes
  • Size of remote file: 312 kB
sample/voicemod-key-lora_001584_00_20250202182937.png ADDED

Git LFS Details

  • SHA256: f64f9ac9daa2cca1356df1b8f6ebd3555dd83aa5ddd906b28b579e3046fdae25
  • Pointer size: 131 Bytes
  • Size of remote file: 257 kB
sample/voicemod-key-lora_001728_00_20250202183647.png ADDED

Git LFS Details

  • SHA256: 62c8f7f2c14c183be646396f128883551056dcb5461ad12aac8f93b8f56430fd
  • Pointer size: 131 Bytes
  • Size of remote file: 321 kB
sample/voicemod-key-lora_001872_00_20250202184357.png ADDED

Git LFS Details

  • SHA256: c059c439cbae96ad14d71204237995ecb84d36d6b14d2e77c9c90d5204c94d4f
  • Pointer size: 131 Bytes
  • Size of remote file: 291 kB
sample/voicemod-key-lora_002016_00_20250202185107.png ADDED

Git LFS Details

  • SHA256: 41bcab719e0852f76fc78f00bce546611836189474dea0e8362e334315366052
  • Pointer size: 131 Bytes
  • Size of remote file: 307 kB
sample/voicemod-key-lora_002160_00_20250202185817.png ADDED

Git LFS Details

  • SHA256: a9a40628b74da510d804efd750189661beb67172a4682623b2f89357272b839b
  • Pointer size: 131 Bytes
  • Size of remote file: 336 kB
sample/voicemod-key-lora_002304_00_20250202190528.png ADDED

Git LFS Details

  • SHA256: 96b85ff5a3e8f6fc3e34aaf4ad21a8f8558091fe70692221ae151a8aaec37d7f
  • Pointer size: 131 Bytes
  • Size of remote file: 367 kB
sample/voicemod-key-lora_002448_00_20250202191239.png ADDED

Git LFS Details

  • SHA256: e91d8ad896a209c090770d4bb6774dbf2a46cc0ac512fc3d357dc0fc9de2a901
  • Pointer size: 131 Bytes
  • Size of remote file: 333 kB
sample/voicemod-key-lora_002592_00_20250202191949.png ADDED

Git LFS Details

  • SHA256: ffeb4c822623758e3998a88ea71fe1ebe477430bda1753dea1bdabcad51f7cc8
  • Pointer size: 131 Bytes
  • Size of remote file: 348 kB
sample/voicemod-key-lora_002736_00_20250202192659.png ADDED

Git LFS Details

  • SHA256: 1de7ef409f6ec57a36ebc6e558550b6feaa1c26d4ebb94ccd7d88a78f8426e44
  • Pointer size: 131 Bytes
  • Size of remote file: 383 kB
sample/voicemod-key-lora_002880_00_20250202193409.png ADDED

Git LFS Details

  • SHA256: 774410b3e51ee71f1971ecbfb681c861c117b7836c5d98d168451b7de7f805d9
  • Pointer size: 131 Bytes
  • Size of remote file: 278 kB
sample/voicemod-key-lora_003024_00_20250202194120.png ADDED

Git LFS Details

  • SHA256: 22e3035787c274d8954cdbf54f339859bd2d795ba539fdf8131d0921919afb37
  • Pointer size: 131 Bytes
  • Size of remote file: 265 kB
sample_prompts.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ v01c3m0dk3y
train.sh ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ accelerate launch \
2
+ --mixed_precision bf16 \
3
+ --num_cpu_threads_per_process 1 \
4
+ sd-scripts/flux_train_network.py \
5
+ --pretrained_model_name_or_path "/workspace/fluxgym/models/unet/flux1-dev.sft" \
6
+ --clip_l "/workspace/fluxgym/models/clip/clip_l.safetensors" \
7
+ --t5xxl "/workspace/fluxgym/models/clip/t5xxl_fp16.safetensors" \
8
+ --ae "/workspace/fluxgym/models/vae/ae.sft" \
9
+ --cache_latents_to_disk \
10
+ --save_model_as safetensors \
11
+ --sdpa --persistent_data_loader_workers \
12
+ --max_data_loader_n_workers 2 \
13
+ --seed 42 \
14
+ --gradient_checkpointing \
15
+ --mixed_precision bf16 \
16
+ --save_precision bf16 \
17
+ --network_module networks.lora_flux \
18
+ --network_dim 4 \
19
+ --optimizer_type adamw8bit \--sample_prompts="/workspace/fluxgym/outputs/voicemod-key-lora/sample_prompts.txt" --sample_every_n_steps="144" \
20
+ --learning_rate 8e-4 \
21
+ --cache_text_encoder_outputs \
22
+ --cache_text_encoder_outputs_to_disk \
23
+ --fp8_base \
24
+ --highvram \
25
+ --max_train_epochs 16 \
26
+ --save_every_n_epochs 4 \
27
+ --dataset_config "/workspace/fluxgym/outputs/voicemod-key-lora/dataset.toml" \
28
+ --output_dir "/workspace/fluxgym/outputs/voicemod-key-lora" \
29
+ --output_name voicemod-key-lora \
30
+ --timestep_sampling shift \
31
+ --discrete_flow_shift 3.1582 \
32
+ --model_prediction_type raw \
33
+ --guidance_scale 1 \
34
+ --loss_type l2 \
voicemod-key-lora-000004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d5924a71058939d8e8a00818f1e377e2e736aee476761a8f85038559b64883a
3
+ size 39757408
voicemod-key-lora-000008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5239e5cc5bc20d1871e4f0eed144361f0e1225622d73731d51117a426c1b7af8
3
+ size 39757416
voicemod-key-lora-000012.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51474b8c8c04b25df8bfde19f0f0cee38b55c335f04956fa7b9018da6dbc7b1c
3
+ size 39757416
voicemod-key-lora.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:796a25d8e39d74da4c25c52b5d70b0e033cd15041eb86e0f4e2a16949faa7b71
3
+ size 39757408