zhangyi617 committed on
Commit
1d49271
·
verified ·
1 Parent(s): 19c26b0

End of training

Browse files
.gitattributes CHANGED
@@ -33,3 +33,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ image_0.png filter=lfs diff=lfs merge=lfs -text
37
+ image_1.png filter=lfs diff=lfs merge=lfs -text
38
+ image_2.png filter=lfs diff=lfs merge=lfs -text
39
+ image_3.png filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: CompVis/stable-diffusion-v1-4
3
+ library_name: diffusers
4
+ license: creativeml-openrail-m
5
+ inference: true
6
+ tags:
7
+ - stable-diffusion
8
+ - stable-diffusion-diffusers
9
+ - text-to-image
10
+ - diffusers
11
+ - diffusers-training
12
+ - lora
13
+ ---
14
+
15
+ <!-- This model card has been generated automatically according to the information the training script had access to. You
16
+ should probably proofread and complete it, then remove this comment. -->
17
+
18
+
19
+ # LoRA text2image fine-tuning - zhangyi617/sd14_coco_lora
20
+ These are LoRA adaptation weights for CompVis/stable-diffusion-v1-4. The weights were fine-tuned on the zhangyi617/coco_fintune_1500 dataset. Some example images are shown below.
21
+
22
+ ![img_0](./image_0.png)
23
+ ![img_1](./image_1.png)
24
+ ![img_2](./image_2.png)
25
+ ![img_3](./image_3.png)
26
+
27
+
28
+
29
+ ## Intended uses & limitations
30
+
31
+ #### How to use
32
+
33
+ ```python
34
+ # TODO: add an example code snippet for running this diffusion pipeline
35
+ ```
36
+
37
+ #### Limitations and bias
38
+
39
+ [TODO: provide examples of latent issues and potential remediations]
40
+
41
+ ## Training details
42
+
43
+ [TODO: describe the data used to train the model]
checkpoint-7500/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a1b0c72ef2c937dd683c8d05b9a60efe7eb95aefacc6208bfcac49d2f0848b1
3
+ size 1722353544
checkpoint-7500/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a76c27ff2a7c79316637edf4462e7944ffe2c5d2efaeb89135b3a3e41946c19c
3
+ size 6592523
checkpoint-7500/pytorch_lora_weights.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d20691f7cff6edeee63f6396c286d054bb3a30553ca52b1731ecb2436e2e163
3
+ size 3226184
checkpoint-7500/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2bd41d95da40a8de3f6e6733aeeffef92e4f9fa8a33ad2e1a6328e9fe483fb64
3
+ size 14821
checkpoint-7500/scaler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:642827d515e7c3d88d20c04224822701abbbc9250deb1d366045f974d08b8258
3
+ size 1383
checkpoint-7500/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d281af8a60239e76b15e1d2e343babbafc26161bae5b5b6d52289b7c39a95994
3
+ size 1401
image_0.png ADDED

Git LFS Details

  • SHA256: de3e6965b3661395d1fea2b99508c95f175f6b98843fd542e6bcb62e99fdb9e9
  • Pointer size: 131 Bytes
  • Size of remote file: 468 kB
image_1.png ADDED

Git LFS Details

  • SHA256: cee552541ff8a1d9126af07a07982cd7681947282d63e1c3b68a3746ea7acb21
  • Pointer size: 131 Bytes
  • Size of remote file: 489 kB
image_2.png ADDED

Git LFS Details

  • SHA256: c7052d1bb8709a5ccd89c48baf2a2bfa0f2020a027ee000f2903de9d69ce3fc5
  • Pointer size: 131 Bytes
  • Size of remote file: 451 kB
image_3.png ADDED

Git LFS Details

  • SHA256: 596651f62780a000210ac88306ae49f5430458da1ee050a9ea913819545d203d
  • Pointer size: 131 Bytes
  • Size of remote file: 480 kB
logs/text2image-fine-tune/1770933519.1858947/events.out.tfevents.1770933519.wmgubws17.wmgds.wmg.warwick.ac.uk.3526251.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3582b7478ea2da29754caae67e5f6797ee901059b8b9884932a21394b1c53eb5
3
+ size 2439
logs/text2image-fine-tune/1770933519.1873183/hparams.yml ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ cache_dir: null
7
+ caption_column: text
8
+ center_crop: true
9
+ checkpointing_steps: 4000
10
+ checkpoints_total_limit: null
11
+ dataloader_num_workers: 8
12
+ dataset_config_name: null
13
+ dataset_name: zhangyi617/coco_fintune_1500
14
+ enable_xformers_memory_efficient_attention: false
15
+ gradient_accumulation_steps: 1
16
+ gradient_checkpointing: false
17
+ hub_model_id: sd14_coco_lora
18
+ hub_token: null
19
+ image_column: image
20
+ image_interpolation_mode: lanczos
21
+ learning_rate: 0.0001
22
+ local_rank: -1
23
+ logging_dir: logs
24
+ lr_scheduler: cosine
25
+ lr_warmup_steps: 0
26
+ max_grad_norm: 4.0
27
+ max_train_samples: null
28
+ max_train_steps: 7500
29
+ mixed_precision: fp16
30
+ noise_offset: 0
31
+ num_train_epochs: 20
32
+ num_validation_images: 4
33
+ output_dir: output_models/sd14_coco_lora
34
+ prediction_type: null
35
+ pretrained_model_name_or_path: CompVis/stable-diffusion-v1-4
36
+ push_to_hub: true
37
+ random_flip: true
38
+ rank: 4
39
+ report_to: tensorboard
40
+ resolution: 512
41
+ resume_from_checkpoint: null
42
+ revision: null
43
+ scale_lr: false
44
+ seed: 42
45
+ snr_gamma: null
46
+ train_batch_size: 4
47
+ train_data_dir: null
48
+ use_8bit_adam: false
49
+ validation_epochs: 1
50
+ validation_prompt: a car is driving down the road with another car
51
+ variant: null
logs/text2image-fine-tune/1770933561.5664878/events.out.tfevents.1770933561.wmgubws17.wmgds.wmg.warwick.ac.uk.3527609.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a29c6efda4aecbe42d3a8be60ec96875b1b31ac61b78b65b3f448d777abc0d5f
3
+ size 2439
logs/text2image-fine-tune/1770933561.567896/hparams.yml ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ cache_dir: null
7
+ caption_column: text
8
+ center_crop: true
9
+ checkpointing_steps: 7500
10
+ checkpoints_total_limit: null
11
+ dataloader_num_workers: 8
12
+ dataset_config_name: null
13
+ dataset_name: zhangyi617/coco_fintune_1500
14
+ enable_xformers_memory_efficient_attention: false
15
+ gradient_accumulation_steps: 1
16
+ gradient_checkpointing: false
17
+ hub_model_id: sd14_coco_lora
18
+ hub_token: null
19
+ image_column: image
20
+ image_interpolation_mode: lanczos
21
+ learning_rate: 0.0001
22
+ local_rank: -1
23
+ logging_dir: logs
24
+ lr_scheduler: cosine
25
+ lr_warmup_steps: 0
26
+ max_grad_norm: 4.0
27
+ max_train_samples: null
28
+ max_train_steps: 7500
29
+ mixed_precision: fp16
30
+ noise_offset: 0
31
+ num_train_epochs: 20
32
+ num_validation_images: 4
33
+ output_dir: output_models/sd14_coco_lora
34
+ prediction_type: null
35
+ pretrained_model_name_or_path: CompVis/stable-diffusion-v1-4
36
+ push_to_hub: true
37
+ random_flip: true
38
+ rank: 4
39
+ report_to: tensorboard
40
+ resolution: 512
41
+ resume_from_checkpoint: null
42
+ revision: null
43
+ scale_lr: false
44
+ seed: 42
45
+ snr_gamma: null
46
+ train_batch_size: 4
47
+ train_data_dir: null
48
+ use_8bit_adam: false
49
+ validation_epochs: 1
50
+ validation_prompt: a car is driving down the road with another car
51
+ variant: null
logs/text2image-fine-tune/events.out.tfevents.1770933519.wmgubws17.wmgds.wmg.warwick.ac.uk.3526251.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78bff893ec0d464343418450af330d1302daa6b78b07484987587ac256d9a289
3
+ size 952
logs/text2image-fine-tune/events.out.tfevents.1770933561.wmgubws17.wmgds.wmg.warwick.ac.uk.3527609.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30a6a8840584f20f6e445561294c3b246e18b7507e900675ccc23d58824e5fe9
3
+ size 40505980
pytorch_lora_weights.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d20691f7cff6edeee63f6396c286d054bb3a30553ca52b1731ecb2436e2e163
3
+ size 3226184