briannlongzhao committed on
Commit
e34e691
·
verified ·
1 Parent(s): e7212f4

End of training

Browse files
README.md CHANGED
@@ -2,21 +2,16 @@
2
  ---
3
  license: creativeml-openrail-m
4
  base_model: stabilityai/stable-diffusion-2-1
5
- instance_prompt: a photo of <new1> carbonara
6
  tags:
7
  - stable-diffusion
8
  - stable-diffusion-diffusers
9
  - text-to-image
10
  - diffusers
11
- - custom-diffusion
12
  inference: true
13
  ---
14
 
15
- # Custom Diffusion - briannlongzhao/96
 
16
 
17
- These are Custom Diffusion adaption weights for stabilityai/stable-diffusion-2-1. The weights were trained on a photo of <new1> carbonara using [Custom Diffusion](https://www.cs.cmu.edu/~custom-diffusion). You can find some example images in the following.
18
 
19
-
20
-
21
-
22
- For more details on the training, please follow [this link](https://github.com/huggingface/diffusers/blob/main/examples/custom_diffusion).
 
2
  ---
3
  license: creativeml-openrail-m
4
  base_model: stabilityai/stable-diffusion-2-1
 
5
  tags:
6
  - stable-diffusion
7
  - stable-diffusion-diffusers
8
  - text-to-image
9
  - diffusers
10
+ - textual_inversion
11
  inference: true
12
  ---
13
 
14
+ # Textual inversion text2image fine-tuning - briannlongzhao/96
15
+ These are textual inversion adaptation weights for stabilityai/stable-diffusion-2-1. You can find some example images below.
16
 
 
17
 
 
 
 
 
learned_embeds.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:779e05eac8faafa7c15d052416e15008fb31e0f936bb0a5ed50461759615524e
3
  size 4208
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17ec9350a010d249c0d37b75ea513bbeaed5a1736fb7e80735058f6daa352174
3
  size 4208
logs/textual_inversion/1706461856.3066196/events.out.tfevents.1706461856.node-0.2648.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b75c09bc3c79c2e4fa04c34c928a9447ee5d2de42059078eb4db67e7e69f8ec
3
+ size 2508
logs/textual_inversion/1706461857.2446911/hparams.yml ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ center_crop: false
7
+ checkpointing_steps: 500
8
+ checkpoints_total_limit: null
9
+ class_name: carbonara
10
+ dataloader_num_workers: 0
11
+ enable_xformers_memory_efficient_attention: true
12
+ gradient_accumulation_steps: 4
13
+ gradient_checkpointing: false
14
+ hub_model_id: null
15
+ hub_token: null
16
+ idx: 96
17
+ initializer_token: carbonara
18
+ learnable_property: object
19
+ learning_rate: 0.008
20
+ local_rank: -1
21
+ logging_dir: logs
22
+ lr_num_cycles: 1
23
+ lr_scheduler: constant
24
+ lr_warmup_steps: 0
25
+ max_train_steps: 35
26
+ mixed_precision: fp16
27
+ no_safe_serialization: false
28
+ num_train_epochs: 5
29
+ num_validation_images: 4
30
+ num_vectors: 1
31
+ output_dir: /mnt/default/textual_inversion_models_medium/96
32
+ placeholder_token: <carbonara>
33
+ pretrained_model_name_or_path: stabilityai/stable-diffusion-2-1
34
+ push_to_hub: true
35
+ repeats: 1
36
+ report_to: tensorboard
37
+ resolution: 512
38
+ resume_from_checkpoint: null
39
+ revision: null
40
+ save_as_full_pipeline: false
41
+ save_steps: 500
42
+ scale_lr: true
43
+ seed: null
44
+ tokenizer_name: null
45
+ train_batch_size: 4
46
+ train_data_dir: /mnt/default/imagenet/images/train_medium/n07831146
47
+ validation_epochs: null
48
+ validation_prompt: null
49
+ validation_steps: 100
50
+ wnid: n07831146
logs/textual_inversion/1706473796.846059/events.out.tfevents.1706473797.node-0.2625.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0eaae73deba2bd66e96e3e5b6014b3ada0d915067d9b7aff2ed68070ccec8475
3
+ size 2508
logs/textual_inversion/1706473797.790008/hparams.yml ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ center_crop: false
7
+ checkpointing_steps: 500
8
+ checkpoints_total_limit: null
9
+ class_name: carbonara
10
+ dataloader_num_workers: 0
11
+ enable_xformers_memory_efficient_attention: true
12
+ gradient_accumulation_steps: 4
13
+ gradient_checkpointing: false
14
+ hub_model_id: null
15
+ hub_token: null
16
+ idx: 96
17
+ initializer_token: carbonara
18
+ learnable_property: object
19
+ learning_rate: 0.008
20
+ local_rank: -1
21
+ logging_dir: logs
22
+ lr_num_cycles: 1
23
+ lr_scheduler: constant
24
+ lr_warmup_steps: 0
25
+ max_train_steps: 35
26
+ mixed_precision: fp16
27
+ no_safe_serialization: false
28
+ num_train_epochs: 5
29
+ num_validation_images: 4
30
+ num_vectors: 1
31
+ output_dir: /mnt/default/textual_inversion_models_medium/96
32
+ placeholder_token: <carbonara>
33
+ pretrained_model_name_or_path: stabilityai/stable-diffusion-2-1
34
+ push_to_hub: true
35
+ repeats: 1
36
+ report_to: tensorboard
37
+ resolution: 512
38
+ resume_from_checkpoint: null
39
+ revision: null
40
+ save_as_full_pipeline: false
41
+ save_steps: 500
42
+ scale_lr: true
43
+ seed: null
44
+ tokenizer_name: null
45
+ train_batch_size: 4
46
+ train_data_dir: /mnt/default/imagenet/images/train_medium/n07831146
47
+ validation_epochs: null
48
+ validation_prompt: null
49
+ validation_steps: 100
50
+ wnid: n07831146
logs/textual_inversion/events.out.tfevents.1706461856.node-0.2648.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3dc88fa392d6b4c2eb68c8cdb7c38a7a8be03e1d1bafe5385fdbffd49dee74e1
3
+ size 4176
logs/textual_inversion/events.out.tfevents.1706473796.node-0.2625.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0261c1da4428b02ae5ad7dab9e5a13d6422ee934b02673ba55e1cb7153b994f
3
+ size 10326
text_encoder/config.json CHANGED
@@ -19,7 +19,7 @@
19
  "num_hidden_layers": 23,
20
  "pad_token_id": 1,
21
  "projection_dim": 512,
22
- "torch_dtype": "float16",
23
  "transformers_version": "4.28.1",
24
- "vocab_size": 49408
25
  }
 
19
  "num_hidden_layers": 23,
20
  "pad_token_id": 1,
21
  "projection_dim": 512,
22
+ "torch_dtype": "float32",
23
  "transformers_version": "4.28.1",
24
+ "vocab_size": 49409
25
  }
text_encoder/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:681c555376658c81dc273f2d737a2aeb23ddb6d1d8e5b3a7064636d359a22668
3
- size 680821096
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ff6c66e9a2e3643e99726f04c94013374241edce3ab717dc12302650aaa003d
3
+ size 1361601112
unet/diffusion_pytorch_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c16c85ca4d0ee5c42bcf07c63ba4670db0b4cb55e65ecf80ac37da8ab6fdba41
3
- size 3463726504
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a3a4d7978884c5e4ef00b62641b1b544b257be2f6715d984188610ad6475ad2
3
+ size 1731904736
vae/config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "_class_name": "AutoencoderKL",
3
  "_diffusers_version": "0.25.1",
4
- "_name_or_path": "/home/aiscuser/.cache/huggingface/hub/models--stabilityai--stable-diffusion-2-1/snapshots/5cae40e6a2745ae2b01ad92ae5043f95f23644d6/vae",
5
  "act_fn": "silu",
6
  "block_out_channels": [
7
  128,
 
1
  {
2
  "_class_name": "AutoencoderKL",
3
  "_diffusers_version": "0.25.1",
4
+ "_name_or_path": "stabilityai/stable-diffusion-2-1",
5
  "act_fn": "silu",
6
  "block_out_channels": [
7
  128,
vae/diffusion_pytorch_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2aa1f43011b553a4cba7f37456465cdbd48aab7b54b9348b890e8058ea7683ec
3
- size 334643268
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e4c08995484ee61270175e9e7a072b66a6e4eeb5f0c266667fe1f45b90daf9a
3
+ size 167335342