Upload folder using huggingface_hub
Browse files
- .gitattributes +21 -0
- README.md +33 -0
- dataset.toml +14 -0
- sample/voicemod-key-lora_000144_00_20250202171752.png +3 -0
- sample/voicemod-key-lora_000288_00_20250202172504.png +3 -0
- sample/voicemod-key-lora_000432_00_20250202173214.png +3 -0
- sample/voicemod-key-lora_000576_00_20250202173925.png +3 -0
- sample/voicemod-key-lora_000720_00_20250202174635.png +3 -0
- sample/voicemod-key-lora_000864_00_20250202175346.png +3 -0
- sample/voicemod-key-lora_001008_00_20250202180056.png +3 -0
- sample/voicemod-key-lora_001152_00_20250202180806.png +3 -0
- sample/voicemod-key-lora_001296_00_20250202181517.png +3 -0
- sample/voicemod-key-lora_001440_00_20250202182227.png +3 -0
- sample/voicemod-key-lora_001584_00_20250202182937.png +3 -0
- sample/voicemod-key-lora_001728_00_20250202183647.png +3 -0
- sample/voicemod-key-lora_001872_00_20250202184357.png +3 -0
- sample/voicemod-key-lora_002016_00_20250202185107.png +3 -0
- sample/voicemod-key-lora_002160_00_20250202185817.png +3 -0
- sample/voicemod-key-lora_002304_00_20250202190528.png +3 -0
- sample/voicemod-key-lora_002448_00_20250202191239.png +3 -0
- sample/voicemod-key-lora_002592_00_20250202191949.png +3 -0
- sample/voicemod-key-lora_002736_00_20250202192659.png +3 -0
- sample/voicemod-key-lora_002880_00_20250202193409.png +3 -0
- sample/voicemod-key-lora_003024_00_20250202194120.png +3 -0
- sample_prompts.txt +1 -0
- train.sh +34 -0
- voicemod-key-lora-000004.safetensors +3 -0
- voicemod-key-lora-000008.safetensors +3 -0
- voicemod-key-lora-000012.safetensors +3 -0
- voicemod-key-lora.safetensors +3 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,24 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
sample/voicemod-key-lora_000144_00_20250202171752.png filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
sample/voicemod-key-lora_000288_00_20250202172504.png filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
sample/voicemod-key-lora_000432_00_20250202173214.png filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
sample/voicemod-key-lora_000576_00_20250202173925.png filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
sample/voicemod-key-lora_000720_00_20250202174635.png filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
sample/voicemod-key-lora_000864_00_20250202175346.png filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
sample/voicemod-key-lora_001008_00_20250202180056.png filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
sample/voicemod-key-lora_001152_00_20250202180806.png filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
sample/voicemod-key-lora_001296_00_20250202181517.png filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
sample/voicemod-key-lora_001440_00_20250202182227.png filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
sample/voicemod-key-lora_001584_00_20250202182937.png filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
sample/voicemod-key-lora_001728_00_20250202183647.png filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
sample/voicemod-key-lora_001872_00_20250202184357.png filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
sample/voicemod-key-lora_002016_00_20250202185107.png filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
sample/voicemod-key-lora_002160_00_20250202185817.png filter=lfs diff=lfs merge=lfs -text
|
| 51 |
+
sample/voicemod-key-lora_002304_00_20250202190528.png filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
sample/voicemod-key-lora_002448_00_20250202191239.png filter=lfs diff=lfs merge=lfs -text
|
| 53 |
+
sample/voicemod-key-lora_002592_00_20250202191949.png filter=lfs diff=lfs merge=lfs -text
|
| 54 |
+
sample/voicemod-key-lora_002736_00_20250202192659.png filter=lfs diff=lfs merge=lfs -text
|
| 55 |
+
sample/voicemod-key-lora_002880_00_20250202193409.png filter=lfs diff=lfs merge=lfs -text
|
| 56 |
+
sample/voicemod-key-lora_003024_00_20250202194120.png filter=lfs diff=lfs merge=lfs -text
|
README.md
ADDED
|
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
tags:
|
| 3 |
+
- text-to-image
|
| 4 |
+
- flux
|
| 5 |
+
- lora
|
| 6 |
+
- diffusers
|
| 7 |
+
- template:sd-lora
|
| 8 |
+
- fluxgym
|
| 9 |
+
widget:
|
| 10 |
+
- output:
|
| 11 |
+
url: sample/voicemod-key-lora_003024_00_20250202194120.png
|
| 12 |
+
text: v01c3m0dk3y
|
| 13 |
+
base_model: black-forest-labs/FLUX.1-dev
|
| 14 |
+
instance_prompt: v01c3m0dk3y
|
| 15 |
+
license: other
|
| 16 |
+
license_name: flux-1-dev-non-commercial-license
|
| 17 |
+
license_link: https://huggingface.co/black-forest-labs/FLUX.1-dev/blob/main/LICENSE.md
|
| 18 |
+
---
|
| 19 |
+
|
| 20 |
+
# voicemod-key-lora
|
| 21 |
+
|
| 22 |
+
A Flux LoRA trained on a local computer with [Fluxgym](https://github.com/cocktailpeanut/fluxgym)
|
| 23 |
+
|
| 24 |
+
<Gallery />
|
| 25 |
+
|
| 26 |
+
## Trigger words
|
| 27 |
+
|
| 28 |
+
You should use `v01c3m0dk3y` to trigger the image generation.
|
| 29 |
+
|
| 30 |
+
## Download model and use it with ComfyUI, AUTOMATIC1111, SD.Next, Invoke AI, Forge, etc.
|
| 31 |
+
|
| 32 |
+
Weights for this model are available in Safetensors format.
|
| 33 |
+
|
dataset.toml
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[general]
|
| 2 |
+
shuffle_caption = false
|
| 3 |
+
caption_extension = '.txt'
|
| 4 |
+
keep_tokens = 1
|
| 5 |
+
|
| 6 |
+
[[datasets]]
|
| 7 |
+
resolution = 1024
|
| 8 |
+
batch_size = 1
|
| 9 |
+
keep_tokens = 1
|
| 10 |
+
|
| 11 |
+
[[datasets.subsets]]
|
| 12 |
+
image_dir = '/workspace/fluxgym/datasets/voicemod-key-lora'
|
| 13 |
+
class_tokens = 'v01c3m0dk3y'
|
| 14 |
+
num_repeats = 10
|
sample/voicemod-key-lora_000144_00_20250202171752.png
ADDED
|
Git LFS Details
|
sample/voicemod-key-lora_000288_00_20250202172504.png
ADDED
|
Git LFS Details
|
sample/voicemod-key-lora_000432_00_20250202173214.png
ADDED
|
Git LFS Details
|
sample/voicemod-key-lora_000576_00_20250202173925.png
ADDED
|
Git LFS Details
|
sample/voicemod-key-lora_000720_00_20250202174635.png
ADDED
|
Git LFS Details
|
sample/voicemod-key-lora_000864_00_20250202175346.png
ADDED
|
Git LFS Details
|
sample/voicemod-key-lora_001008_00_20250202180056.png
ADDED
|
Git LFS Details
|
sample/voicemod-key-lora_001152_00_20250202180806.png
ADDED
|
Git LFS Details
|
sample/voicemod-key-lora_001296_00_20250202181517.png
ADDED
|
Git LFS Details
|
sample/voicemod-key-lora_001440_00_20250202182227.png
ADDED
|
Git LFS Details
|
sample/voicemod-key-lora_001584_00_20250202182937.png
ADDED
|
Git LFS Details
|
sample/voicemod-key-lora_001728_00_20250202183647.png
ADDED
|
Git LFS Details
|
sample/voicemod-key-lora_001872_00_20250202184357.png
ADDED
|
Git LFS Details
|
sample/voicemod-key-lora_002016_00_20250202185107.png
ADDED
|
Git LFS Details
|
sample/voicemod-key-lora_002160_00_20250202185817.png
ADDED
|
Git LFS Details
|
sample/voicemod-key-lora_002304_00_20250202190528.png
ADDED
|
Git LFS Details
|
sample/voicemod-key-lora_002448_00_20250202191239.png
ADDED
|
Git LFS Details
|
sample/voicemod-key-lora_002592_00_20250202191949.png
ADDED
|
Git LFS Details
|
sample/voicemod-key-lora_002736_00_20250202192659.png
ADDED
|
Git LFS Details
|
sample/voicemod-key-lora_002880_00_20250202193409.png
ADDED
|
Git LFS Details
|
sample/voicemod-key-lora_003024_00_20250202194120.png
ADDED
|
Git LFS Details
|
sample_prompts.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
v01c3m0dk3y
|
train.sh
ADDED
|
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
accelerate launch \
|
| 2 |
+
--mixed_precision bf16 \
|
| 3 |
+
--num_cpu_threads_per_process 1 \
|
| 4 |
+
sd-scripts/flux_train_network.py \
|
| 5 |
+
--pretrained_model_name_or_path "/workspace/fluxgym/models/unet/flux1-dev.sft" \
|
| 6 |
+
--clip_l "/workspace/fluxgym/models/clip/clip_l.safetensors" \
|
| 7 |
+
--t5xxl "/workspace/fluxgym/models/clip/t5xxl_fp16.safetensors" \
|
| 8 |
+
--ae "/workspace/fluxgym/models/vae/ae.sft" \
|
| 9 |
+
--cache_latents_to_disk \
|
| 10 |
+
--save_model_as safetensors \
|
| 11 |
+
--sdpa --persistent_data_loader_workers \
|
| 12 |
+
--max_data_loader_n_workers 2 \
|
| 13 |
+
--seed 42 \
|
| 14 |
+
--gradient_checkpointing \
|
| 15 |
+
--mixed_precision bf16 \
|
| 16 |
+
--save_precision bf16 \
|
| 17 |
+
--network_module networks.lora_flux \
|
| 18 |
+
--network_dim 4 \
|
| 19 |
+
--optimizer_type adamw8bit \--sample_prompts="/workspace/fluxgym/outputs/voicemod-key-lora/sample_prompts.txt" --sample_every_n_steps="144" \
|
| 20 |
+
--learning_rate 8e-4 \
|
| 21 |
+
--cache_text_encoder_outputs \
|
| 22 |
+
--cache_text_encoder_outputs_to_disk \
|
| 23 |
+
--fp8_base \
|
| 24 |
+
--highvram \
|
| 25 |
+
--max_train_epochs 16 \
|
| 26 |
+
--save_every_n_epochs 4 \
|
| 27 |
+
--dataset_config "/workspace/fluxgym/outputs/voicemod-key-lora/dataset.toml" \
|
| 28 |
+
--output_dir "/workspace/fluxgym/outputs/voicemod-key-lora" \
|
| 29 |
+
--output_name voicemod-key-lora \
|
| 30 |
+
--timestep_sampling shift \
|
| 31 |
+
--discrete_flow_shift 3.1582 \
|
| 32 |
+
--model_prediction_type raw \
|
| 33 |
+
--guidance_scale 1 \
|
| 34 |
+
--loss_type l2 \
|
voicemod-key-lora-000004.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3d5924a71058939d8e8a00818f1e377e2e736aee476761a8f85038559b64883a
|
| 3 |
+
size 39757408
|
voicemod-key-lora-000008.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5239e5cc5bc20d1871e4f0eed144361f0e1225622d73731d51117a426c1b7af8
|
| 3 |
+
size 39757416
|
voicemod-key-lora-000012.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:51474b8c8c04b25df8bfde19f0f0cee38b55c335f04956fa7b9018da6dbc7b1c
|
| 3 |
+
size 39757416
|
voicemod-key-lora.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:796a25d8e39d74da4c25c52b5d70b0e033cd15041eb86e0f4e2a16949faa7b71
|
| 3 |
+
size 39757408
|