Trkkk committed on Oct 28, 2024

Commit

43fa641

verified ·

1 Parent(s): e9802b9

End of training

Browse files

Files changed (24) hide show

checkpoint-2500/optimizer.bin +3 -0
checkpoint-2500/random_states_0.pkl +3 -0
checkpoint-2500/scaler.pt +3 -0
checkpoint-2500/scheduler.bin +3 -0
checkpoint-2500/unet/config.json +68 -0
checkpoint-2500/unet/diffusion_pytorch_model.safetensors +3 -0
checkpoint-2500/unet_ema/config.json +75 -0
checkpoint-2500/unet_ema/diffusion_pytorch_model.safetensors +3 -0
checkpoint-3000/optimizer.bin +3 -0
checkpoint-3000/random_states_0.pkl +3 -0
checkpoint-3000/scaler.pt +3 -0
checkpoint-3000/scheduler.bin +3 -0
checkpoint-3000/unet/config.json +68 -0
checkpoint-3000/unet/diffusion_pytorch_model.safetensors +3 -0
checkpoint-3000/unet_ema/config.json +75 -0
checkpoint-3000/unet_ema/diffusion_pytorch_model.safetensors +3 -0
logs/text2image-fine-tune/1730072866.6577718/events.out.tfevents.1730072866.IPEG-WS-008.21260.1 +3 -0
logs/text2image-fine-tune/1730072866.6947837/hparams.yml +55 -0
logs/text2image-fine-tune/1730073089.0494921/events.out.tfevents.1730073089.IPEG-WS-008.18144.1 +3 -0
logs/text2image-fine-tune/1730073089.0918372/hparams.yml +55 -0
logs/text2image-fine-tune/events.out.tfevents.1730072866.IPEG-WS-008.21260.0 +3 -0
logs/text2image-fine-tune/events.out.tfevents.1730073089.IPEG-WS-008.18144.0 +3 -0
unet/diffusion_pytorch_model.safetensors +1 -1
val_imgs_grid.png +0 -0

checkpoint-2500/optimizer.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ffe6385d8a76688a1d2ccb46bbe9c30fffbf575af9bfea2d8b92b9f1f1bce84e
+size 6876750164

checkpoint-2500/random_states_0.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d9d915da7f02a86e31ee6f75b8849f0950863ba8994f67a7fc9e9194e604c03e
+size 14408

checkpoint-2500/scaler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2abcdcf339ec48efe17ec29ff331c8a500302e54c8dc37756e2c01a35c6025f4
+size 988

checkpoint-2500/scheduler.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:87a49c4a26f62f0aa84f4b656eef4c3465103beed2061780e76c86467dbea981
+size 1000

checkpoint-2500/unet/config.json ADDED Viewed

	@@ -0,0 +1,68 @@

+{
+  "_class_name": "UNet2DConditionModel",
+  "_diffusers_version": "0.32.0.dev0",
+  "_name_or_path": "CompVis/stable-diffusion-v1-4",
+  "act_fn": "silu",
+  "addition_embed_type": null,
+  "addition_embed_type_num_heads": 64,
+  "addition_time_embed_dim": null,
+  "attention_head_dim": 8,
+  "attention_type": "default",
+  "block_out_channels": [
+    320,
+    640,
+    1280,
+    1280
+  ],
+  "center_input_sample": false,
+  "class_embed_type": null,
+  "class_embeddings_concat": false,
+  "conv_in_kernel": 3,
+  "conv_out_kernel": 3,
+  "cross_attention_dim": 768,
+  "cross_attention_norm": null,
+  "down_block_types": [
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "DownBlock2D"
+  ],
+  "downsample_padding": 1,
+  "dropout": 0.0,
+  "dual_cross_attention": false,
+  "encoder_hid_dim": null,
+  "encoder_hid_dim_type": null,
+  "flip_sin_to_cos": true,
+  "freq_shift": 0,
+  "in_channels": 4,
+  "layers_per_block": 2,
+  "mid_block_only_cross_attention": null,
+  "mid_block_scale_factor": 1,
+  "mid_block_type": "UNetMidBlock2DCrossAttn",
+  "norm_eps": 1e-05,
+  "norm_num_groups": 32,
+  "num_attention_heads": null,
+  "num_class_embeds": null,
+  "only_cross_attention": false,
+  "out_channels": 4,
+  "projection_class_embeddings_input_dim": null,
+  "resnet_out_scale_factor": 1.0,
+  "resnet_skip_time_act": false,
+  "resnet_time_scale_shift": "default",
+  "reverse_transformer_layers_per_block": null,
+  "sample_size": 64,
+  "time_cond_proj_dim": null,
+  "time_embedding_act_fn": null,
+  "time_embedding_dim": null,
+  "time_embedding_type": "positional",
+  "timestep_post_act": null,
+  "transformer_layers_per_block": 1,
+  "up_block_types": [
+    "UpBlock2D",
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D"
+  ],
+  "upcast_attention": false,
+  "use_linear_projection": false
+}

checkpoint-2500/unet/diffusion_pytorch_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e416d3f63a01d1690f5b5fc995ca8b4de4c7b4bd338850b62598b49f3e0b947a
+size 3438167536

checkpoint-2500/unet_ema/config.json ADDED Viewed

	@@ -0,0 +1,75 @@

+{
+  "_class_name": "UNet2DConditionModel",
+  "_diffusers_version": "0.32.0.dev0",
+  "_name_or_path": "CompVis/stable-diffusion-v1-4",
+  "act_fn": "silu",
+  "addition_embed_type": null,
+  "addition_embed_type_num_heads": 64,
+  "addition_time_embed_dim": null,
+  "attention_head_dim": 8,
+  "attention_type": "default",
+  "block_out_channels": [
+    320,
+    640,
+    1280,
+    1280
+  ],
+  "center_input_sample": false,
+  "class_embed_type": null,
+  "class_embeddings_concat": false,
+  "conv_in_kernel": 3,
+  "conv_out_kernel": 3,
+  "cross_attention_dim": 768,
+  "cross_attention_norm": null,
+  "decay": 0.9999,
+  "down_block_types": [
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "DownBlock2D"
+  ],
+  "downsample_padding": 1,
+  "dropout": 0.0,
+  "dual_cross_attention": false,
+  "encoder_hid_dim": null,
+  "encoder_hid_dim_type": null,
+  "flip_sin_to_cos": true,
+  "freq_shift": 0,
+  "in_channels": 4,
+  "inv_gamma": 1.0,
+  "layers_per_block": 2,
+  "mid_block_only_cross_attention": null,
+  "mid_block_scale_factor": 1,
+  "mid_block_type": "UNetMidBlock2DCrossAttn",
+  "min_decay": 0.0,
+  "norm_eps": 1e-05,
+  "norm_num_groups": 32,
+  "num_attention_heads": null,
+  "num_class_embeds": null,
+  "only_cross_attention": false,
+  "optimization_step": 2500,
+  "out_channels": 4,
+  "power": 0.6666666666666666,
+  "projection_class_embeddings_input_dim": null,
+  "resnet_out_scale_factor": 1.0,
+  "resnet_skip_time_act": false,
+  "resnet_time_scale_shift": "default",
+  "reverse_transformer_layers_per_block": null,
+  "sample_size": 64,
+  "time_cond_proj_dim": null,
+  "time_embedding_act_fn": null,
+  "time_embedding_dim": null,
+  "time_embedding_type": "positional",
+  "timestep_post_act": null,
+  "transformer_layers_per_block": 1,
+  "up_block_types": [
+    "UpBlock2D",
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D"
+  ],
+  "upcast_attention": false,
+  "update_after_step": 0,
+  "use_ema_warmup": false,
+  "use_linear_projection": false
+}

checkpoint-2500/unet_ema/diffusion_pytorch_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d303a986868bb1669669824555d32dc7c570cb93cc0c5246b1a2cf933ad35cf6
+size 3438167536

checkpoint-3000/optimizer.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ae99e0b8f5f1f60ce1a9006dbf2f7ec9fd98eb84cfbec0bfc7bd55434153b4b7
+size 6876750164

checkpoint-3000/random_states_0.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:96e3020305e5f7def3f4f8486056afad3a29127a881e8b01294ef39b1a59b78b
+size 14408

checkpoint-3000/scaler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5a69396ad64f717c1fe9ac5ae1dc4b1de2873fe7d50a35b2ee41044e4ffdfc3d
+size 988

checkpoint-3000/scheduler.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9cd157c3e520fe67f80ed2bb1dc152730c79b5ece6a75d207b88cbe9517b4bf7
+size 1000

checkpoint-3000/unet/config.json ADDED Viewed

	@@ -0,0 +1,68 @@

+{
+  "_class_name": "UNet2DConditionModel",
+  "_diffusers_version": "0.32.0.dev0",
+  "_name_or_path": "CompVis/stable-diffusion-v1-4",
+  "act_fn": "silu",
+  "addition_embed_type": null,
+  "addition_embed_type_num_heads": 64,
+  "addition_time_embed_dim": null,
+  "attention_head_dim": 8,
+  "attention_type": "default",
+  "block_out_channels": [
+    320,
+    640,
+    1280,
+    1280
+  ],
+  "center_input_sample": false,
+  "class_embed_type": null,
+  "class_embeddings_concat": false,
+  "conv_in_kernel": 3,
+  "conv_out_kernel": 3,
+  "cross_attention_dim": 768,
+  "cross_attention_norm": null,
+  "down_block_types": [
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "DownBlock2D"
+  ],
+  "downsample_padding": 1,
+  "dropout": 0.0,
+  "dual_cross_attention": false,
+  "encoder_hid_dim": null,
+  "encoder_hid_dim_type": null,
+  "flip_sin_to_cos": true,
+  "freq_shift": 0,
+  "in_channels": 4,
+  "layers_per_block": 2,
+  "mid_block_only_cross_attention": null,
+  "mid_block_scale_factor": 1,
+  "mid_block_type": "UNetMidBlock2DCrossAttn",
+  "norm_eps": 1e-05,
+  "norm_num_groups": 32,
+  "num_attention_heads": null,
+  "num_class_embeds": null,
+  "only_cross_attention": false,
+  "out_channels": 4,
+  "projection_class_embeddings_input_dim": null,
+  "resnet_out_scale_factor": 1.0,
+  "resnet_skip_time_act": false,
+  "resnet_time_scale_shift": "default",
+  "reverse_transformer_layers_per_block": null,
+  "sample_size": 64,
+  "time_cond_proj_dim": null,
+  "time_embedding_act_fn": null,
+  "time_embedding_dim": null,
+  "time_embedding_type": "positional",
+  "timestep_post_act": null,
+  "transformer_layers_per_block": 1,
+  "up_block_types": [
+    "UpBlock2D",
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D"
+  ],
+  "upcast_attention": false,
+  "use_linear_projection": false
+}

checkpoint-3000/unet/diffusion_pytorch_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:495c7cf4d59488e75c91360559bd8b9b2e99de21300c50db482985810051c98a
+size 3438167536

checkpoint-3000/unet_ema/config.json ADDED Viewed

	@@ -0,0 +1,75 @@

+{
+  "_class_name": "UNet2DConditionModel",
+  "_diffusers_version": "0.32.0.dev0",
+  "_name_or_path": "CompVis/stable-diffusion-v1-4",
+  "act_fn": "silu",
+  "addition_embed_type": null,
+  "addition_embed_type_num_heads": 64,
+  "addition_time_embed_dim": null,
+  "attention_head_dim": 8,
+  "attention_type": "default",
+  "block_out_channels": [
+    320,
+    640,
+    1280,
+    1280
+  ],
+  "center_input_sample": false,
+  "class_embed_type": null,
+  "class_embeddings_concat": false,
+  "conv_in_kernel": 3,
+  "conv_out_kernel": 3,
+  "cross_attention_dim": 768,
+  "cross_attention_norm": null,
+  "decay": 0.9999,
+  "down_block_types": [
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "DownBlock2D"
+  ],
+  "downsample_padding": 1,
+  "dropout": 0.0,
+  "dual_cross_attention": false,
+  "encoder_hid_dim": null,
+  "encoder_hid_dim_type": null,
+  "flip_sin_to_cos": true,
+  "freq_shift": 0,
+  "in_channels": 4,
+  "inv_gamma": 1.0,
+  "layers_per_block": 2,
+  "mid_block_only_cross_attention": null,
+  "mid_block_scale_factor": 1,
+  "mid_block_type": "UNetMidBlock2DCrossAttn",
+  "min_decay": 0.0,
+  "norm_eps": 1e-05,
+  "norm_num_groups": 32,
+  "num_attention_heads": null,
+  "num_class_embeds": null,
+  "only_cross_attention": false,
+  "optimization_step": 3000,
+  "out_channels": 4,
+  "power": 0.6666666666666666,
+  "projection_class_embeddings_input_dim": null,
+  "resnet_out_scale_factor": 1.0,
+  "resnet_skip_time_act": false,
+  "resnet_time_scale_shift": "default",
+  "reverse_transformer_layers_per_block": null,
+  "sample_size": 64,
+  "time_cond_proj_dim": null,
+  "time_embedding_act_fn": null,
+  "time_embedding_dim": null,
+  "time_embedding_type": "positional",
+  "timestep_post_act": null,
+  "transformer_layers_per_block": 1,
+  "up_block_types": [
+    "UpBlock2D",
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D"
+  ],
+  "upcast_attention": false,
+  "update_after_step": 0,
+  "use_ema_warmup": false,
+  "use_linear_projection": false
+}

checkpoint-3000/unet_ema/diffusion_pytorch_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:52899fbeea249abae4130e5fc0cc69337da1cce17cffda3d783d6775fe2f393f
+size 3438167536

logs/text2image-fine-tune/1730072866.6577718/events.out.tfevents.1730072866.IPEG-WS-008.21260.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:aeed22324bcb8baa8ee680485ce253ad5050c189c968f8b625c48764132309e0
+size 2527

logs/text2image-fine-tune/1730072866.6947837/hparams.yml ADDED Viewed

	@@ -0,0 +1,55 @@

+adam_beta1: 0.9
+adam_beta2: 0.999
+adam_epsilon: 1.0e-08
+adam_weight_decay: 0.01
+allow_tf32: false
+cache_dir: null
+caption_column: caption
+center_crop: true
+checkpointing_steps: 500
+checkpoints_total_limit: null
+dataloader_num_workers: 0
+dataset_config_name: null
+dataset_name: Trkkk/hannover_text_img
+dream_detail_preservation: 1.0
+dream_training: false
+enable_xformers_memory_efficient_attention: false
+foreach_ema: false
+gradient_accumulation_steps: 4
+gradient_checkpointing: true
+hub_model_id: Trkkk/stable_diffusion
+hub_token: null
+image_column: image
+input_perturbation: 0
+learning_rate: 1.0e-05
+local_rank: -1
+logging_dir: logs
+lr_scheduler: constant
+lr_warmup_steps: 0
+max_grad_norm: 1.0
+max_train_samples: null
+max_train_steps: 3000
+mixed_precision: fp16
+noise_offset: 0
+non_ema_revision: null
+num_train_epochs: 108
+offload_ema: false
+output_dir: ./fine_tuned_model_v4
+prediction_type: null
+pretrained_model_name_or_path: CompVis/stable-diffusion-v1-4
+push_to_hub: false
+random_flip: true
+report_to: tensorboard
+resolution: 256
+resume_from_checkpoint: null
+revision: null
+scale_lr: false
+seed: null
+snr_gamma: null
+tracker_project_name: text2image-fine-tune
+train_batch_size: 1
+train_data_dir: null
+use_8bit_adam: false
+use_ema: true
+validation_epochs: 5
+variant: null

logs/text2image-fine-tune/1730073089.0494921/events.out.tfevents.1730073089.IPEG-WS-008.18144.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:de47fd277a0e3a7bea37703ee94d62e976fedb3977361d8ab71172e37bd84f1a
+size 2527

logs/text2image-fine-tune/1730073089.0918372/hparams.yml ADDED Viewed

	@@ -0,0 +1,55 @@

+adam_beta1: 0.9
+adam_beta2: 0.999
+adam_epsilon: 1.0e-08
+adam_weight_decay: 0.01
+allow_tf32: false
+cache_dir: null
+caption_column: caption
+center_crop: true
+checkpointing_steps: 500
+checkpoints_total_limit: null
+dataloader_num_workers: 0
+dataset_config_name: null
+dataset_name: Trkkk/hannover_text_img
+dream_detail_preservation: 1.0
+dream_training: false
+enable_xformers_memory_efficient_attention: false
+foreach_ema: false
+gradient_accumulation_steps: 4
+gradient_checkpointing: true
+hub_model_id: Trkkk/stable_diffusion
+hub_token: null
+image_column: image
+input_perturbation: 0
+learning_rate: 1.0e-05
+local_rank: -1
+logging_dir: logs
+lr_scheduler: constant
+lr_warmup_steps: 0
+max_grad_norm: 1.0
+max_train_samples: null
+max_train_steps: 3000
+mixed_precision: fp16
+noise_offset: 0
+non_ema_revision: null
+num_train_epochs: 108
+offload_ema: false
+output_dir: ./fine_tuned_model_v4
+prediction_type: null
+pretrained_model_name_or_path: CompVis/stable-diffusion-v1-4
+push_to_hub: true
+random_flip: true
+report_to: tensorboard
+resolution: 256
+resume_from_checkpoint: null
+revision: null
+scale_lr: false
+seed: null
+snr_gamma: null
+tracker_project_name: text2image-fine-tune
+train_batch_size: 1
+train_data_dir: null
+use_8bit_adam: false
+use_ema: true
+validation_epochs: 5
+variant: null

logs/text2image-fine-tune/events.out.tfevents.1730072866.IPEG-WS-008.21260.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5e77338f9e3cc2f54236d0369b1a1b2682edfd4d35e0c376b655490a9b475fac
+size 1432

logs/text2image-fine-tune/events.out.tfevents.1730073089.IPEG-WS-008.18144.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:249ee64f3d2ef325ecc9702b82704de992603ba7399695aac733614d1cf99cf0
+size 9505698

unet/diffusion_pytorch_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d6f0ed9d8f70206585f5c5fe4b7471e32db4cb22cb8c9cf5fe3334d291a7e786
+oid sha256:52899fbeea249abae4130e5fc0cc69337da1cce17cffda3d783d6775fe2f393f
 size 3438167536

val_imgs_grid.png CHANGED Viewed