kwanY committed on Apr 8, 2025

Commit

59e0fe9

verified ·

1 Parent(s): 8ecd882

End of training

Browse files

Files changed (23) hide show

.gitattributes +2 -0
README.md +45 -0
checkpoint-10000/controlnet/config.json +57 -0
checkpoint-10000/controlnet/diffusion_pytorch_model.safetensors +3 -0
checkpoint-10000/optimizer.bin +3 -0
checkpoint-10000/random_states_0.pkl +3 -0
checkpoint-10000/scaler.pt +3 -0
checkpoint-10000/scheduler.bin +3 -0
checkpoint-20000/controlnet/config.json +57 -0
checkpoint-20000/controlnet/diffusion_pytorch_model.safetensors +3 -0
checkpoint-20000/optimizer.bin +3 -0
checkpoint-20000/random_states_0.pkl +3 -0
checkpoint-20000/scaler.pt +3 -0
checkpoint-20000/scheduler.bin +3 -0
config.json +57 -0
diffusion_pytorch_model.safetensors +3 -0
image_control.png +0 -0
images_0.png +3 -0
images_1.png +3 -0
logs/CTRL/1744013281.7752044/events.out.tfevents.1744013281.workspace-zd8unyjaj5q9-0.7332.1 +3 -0
logs/CTRL/1744013281.7773879/hparams.yml +54 -0
logs/CTRL/events-Copy1.out.tfevents.1744013281.workspace-zd8unyjaj5q9-0.7332.0 +3 -0
logs/CTRL/events.out.tfevents.1744013281.workspace-zd8unyjaj5q9-0.7332.0 +3 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+images_0.png filter=lfs diff=lfs merge=lfs -text
+images_1.png filter=lfs diff=lfs merge=lfs -text

README.md ADDED Viewed

	@@ -0,0 +1,45 @@

+---
+base_model: SG161222/RealVisXL_V3.0
+library_name: diffusers
+license: openrail++
+inference: true
+tags:
+- stable-diffusion-xl
+- stable-diffusion-xl-diffusers
+- text-to-image
+- diffusers
+- controlnet
+- diffusers-training
+---
+<!-- This model card has been generated automatically according to the information the training script had access to. You
+should probably proofread and complete it, then remove this comment. -->
+# controlnet-kwanY/CTRL
+These are controlnet weights trained on SG161222/RealVisXL_V3.0 with a new type of conditioning.
+You can find some example images below.
+prompt: A render of a head of Disney character
+![images_0](./images_0.png)
+prompt: a FHD head of an Orc
+![images_1](./images_1.png)
+## Intended uses & limitations
+#### How to use
+```python
+# TODO: add an example code snippet for running this diffusion pipeline
+```
+#### Limitations and bias
+[TODO: provide examples of latent issues and potential remediations]
+## Training details
+[TODO: describe the data used to train the model]

checkpoint-10000/controlnet/config.json ADDED Viewed

	@@ -0,0 +1,57 @@

+{
+  "_class_name": "ControlNetModel",
+  "_diffusers_version": "0.31.0",
+  "act_fn": "silu",
+  "addition_embed_type": "text_time",
+  "addition_embed_type_num_heads": 64,
+  "addition_time_embed_dim": 256,
+  "attention_head_dim": [
+    5,
+    10,
+    20
+  ],
+  "block_out_channels": [
+    320,
+    640,
+    1280
+  ],
+  "class_embed_type": null,
+  "conditioning_channels": 3,
+  "conditioning_embedding_out_channels": [
+    16,
+    32,
+    96,
+    256
+  ],
+  "controlnet_conditioning_channel_order": "rgb",
+  "cross_attention_dim": 2048,
+  "down_block_types": [
+    "DownBlock2D",
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D"
+  ],
+  "downsample_padding": 1,
+  "encoder_hid_dim": null,
+  "encoder_hid_dim_type": null,
+  "flip_sin_to_cos": true,
+  "freq_shift": 0,
+  "global_pool_conditions": false,
+  "in_channels": 4,
+  "layers_per_block": 2,
+  "mid_block_scale_factor": 1,
+  "mid_block_type": "UNetMidBlock2DCrossAttn",
+  "norm_eps": 1e-05,
+  "norm_num_groups": 32,
+  "num_attention_heads": null,
+  "num_class_embeds": null,
+  "only_cross_attention": false,
+  "projection_class_embeddings_input_dim": 2816,
+  "resnet_time_scale_shift": "default",
+  "transformer_layers_per_block": [
+    1,
+    2,
+    10
+  ],
+  "upcast_attention": null,
+  "use_linear_projection": true
+}

checkpoint-10000/controlnet/diffusion_pytorch_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ff22233d994ec5b44893c18ca2b143d19c5ffcb38adb01cef6a3d36e28f671c3
+size 5004167864

checkpoint-10000/optimizer.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0b90e749a3e95507df52e80c746c64a73728f8d2b871b5d834b8d91342fcd9c2
+size 10008840997

checkpoint-10000/random_states_0.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7068776a2fb4656f53670363771caebc1bedd82676c9f5a1a1b53315ff1be2d2
+size 14663

checkpoint-10000/scaler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9be2ad76dcbc923b00e6a142f6db62aad4a46c47bb83864ccb68ddc899d0ce78
+size 557

checkpoint-10000/scheduler.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e6bcd4cb37625cab1478c5f801ecf8dcfe8513c2acdf383cd99f5bc953b5e8a3
+size 563

checkpoint-20000/controlnet/config.json ADDED Viewed

	@@ -0,0 +1,57 @@

+{
+  "_class_name": "ControlNetModel",
+  "_diffusers_version": "0.31.0",
+  "act_fn": "silu",
+  "addition_embed_type": "text_time",
+  "addition_embed_type_num_heads": 64,
+  "addition_time_embed_dim": 256,
+  "attention_head_dim": [
+    5,
+    10,
+    20
+  ],
+  "block_out_channels": [
+    320,
+    640,
+    1280
+  ],
+  "class_embed_type": null,
+  "conditioning_channels": 3,
+  "conditioning_embedding_out_channels": [
+    16,
+    32,
+    96,
+    256
+  ],
+  "controlnet_conditioning_channel_order": "rgb",
+  "cross_attention_dim": 2048,
+  "down_block_types": [
+    "DownBlock2D",
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D"
+  ],
+  "downsample_padding": 1,
+  "encoder_hid_dim": null,
+  "encoder_hid_dim_type": null,
+  "flip_sin_to_cos": true,
+  "freq_shift": 0,
+  "global_pool_conditions": false,
+  "in_channels": 4,
+  "layers_per_block": 2,
+  "mid_block_scale_factor": 1,
+  "mid_block_type": "UNetMidBlock2DCrossAttn",
+  "norm_eps": 1e-05,
+  "norm_num_groups": 32,
+  "num_attention_heads": null,
+  "num_class_embeds": null,
+  "only_cross_attention": false,
+  "projection_class_embeddings_input_dim": 2816,
+  "resnet_time_scale_shift": "default",
+  "transformer_layers_per_block": [
+    1,
+    2,
+    10
+  ],
+  "upcast_attention": null,
+  "use_linear_projection": true
+}

checkpoint-20000/controlnet/diffusion_pytorch_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7b89450e0c2275fb5be5693606a50fc6589142ba63f502b2989112eee882d3c5
+size 5004167864

checkpoint-20000/optimizer.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b98d922d7e755bf47288027677d341a89a5c7b56ced4036732e241cf8054fb00
+size 10008840997

checkpoint-20000/random_states_0.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:36e2c45dcf5a1f98eb8a0682c5841167a0b3a50e2ca629f34feaa92fc012595b
+size 14663

checkpoint-20000/scaler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a4786ac513887705dfbc8aa8e25c9a017b3fc72fd4e6c2df34c0644ac662b7c4
+size 557

checkpoint-20000/scheduler.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d6af40fe1d26f16a16476a6515b0cb875814a602dabb7d83b4f2ad749c139b74
+size 563

config.json ADDED Viewed

	@@ -0,0 +1,57 @@

+{
+  "_class_name": "ControlNetModel",
+  "_diffusers_version": "0.31.0",
+  "act_fn": "silu",
+  "addition_embed_type": "text_time",
+  "addition_embed_type_num_heads": 64,
+  "addition_time_embed_dim": 256,
+  "attention_head_dim": [
+    5,
+    10,
+    20
+  ],
+  "block_out_channels": [
+    320,
+    640,
+    1280
+  ],
+  "class_embed_type": null,
+  "conditioning_channels": 3,
+  "conditioning_embedding_out_channels": [
+    16,
+    32,
+    96,
+    256
+  ],
+  "controlnet_conditioning_channel_order": "rgb",
+  "cross_attention_dim": 2048,
+  "down_block_types": [
+    "DownBlock2D",
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D"
+  ],
+  "downsample_padding": 1,
+  "encoder_hid_dim": null,
+  "encoder_hid_dim_type": null,
+  "flip_sin_to_cos": true,
+  "freq_shift": 0,
+  "global_pool_conditions": false,
+  "in_channels": 4,
+  "layers_per_block": 2,
+  "mid_block_scale_factor": 1,
+  "mid_block_type": "UNetMidBlock2DCrossAttn",
+  "norm_eps": 1e-05,
+  "norm_num_groups": 32,
+  "num_attention_heads": null,
+  "num_class_embeds": null,
+  "only_cross_attention": false,
+  "projection_class_embeddings_input_dim": 2816,
+  "resnet_time_scale_shift": "default",
+  "transformer_layers_per_block": [
+    1,
+    2,
+    10
+  ],
+  "upcast_attention": null,
+  "use_linear_projection": true
+}

diffusion_pytorch_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7b89450e0c2275fb5be5693606a50fc6589142ba63f502b2989112eee882d3c5
+size 5004167864

image_control.png ADDED Viewed

images_0.png ADDED Viewed

Git LFS Details

SHA256: 74329dabd99a294081cf2532f7ae5aa7adfc565fe1d96192c053ea720e65474b
Pointer size: 131 Bytes
Size of remote file: 800 kB

images_1.png ADDED Viewed

Git LFS Details

SHA256: 9ca71309e87b2fdef1d7d139fe97edcc04ffb0bb44f6ed821e2031e953755df9
Pointer size: 131 Bytes
Size of remote file: 761 kB

logs/CTRL/1744013281.7752044/events.out.tfevents.1744013281.workspace-zd8unyjaj5q9-0.7332.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7bc3858d13b1dfcfcbab6983eb3750b464594870d18fd5cc4281a7b507535d94
+size 2542

logs/CTRL/1744013281.7773879/hparams.yml ADDED Viewed

	@@ -0,0 +1,54 @@

+adam_beta1: 0.9
+adam_beta2: 0.999
+adam_epsilon: 1.0e-08
+adam_weight_decay: 0.01
+allow_tf32: false
+cache_dir: ./cache
+caption_column: image_caption
+checkpointing_steps: 10000
+checkpoints_total_limit: null
+conditioning_image_column: lmk_img
+controlnet_model_name_or_path: null
+crops_coords_top_left_h: 0
+crops_coords_top_left_w: 0
+dataloader_num_workers: 0
+dataset_config_name: null
+dataset_name: kwanY/EAS_data2
+enable_npu_flash_attention: false
+enable_xformers_memory_efficient_attention: true
+gradient_accumulation_steps: 4
+gradient_checkpointing: true
+hub_model_id: null
+hub_token: null
+image_column: image
+learning_rate: 1.0e-05
+logging_dir: logs
+lr_num_cycles: 1
+lr_power: 1.0
+lr_scheduler: constant
+lr_warmup_steps: 500
+max_grad_norm: 1.0
+max_train_samples: null
+max_train_steps: 20000
+mixed_precision: fp16
+num_train_epochs: 16
+num_validation_images: 4
+output_dir: CTRL
+pretrained_model_name_or_path: SG161222/RealVisXL_V3.0
+pretrained_vae_model_name_or_path: null
+proportion_empty_prompts: 0
+push_to_hub: true
+report_to: tensorboard
+resolution: 512
+resume_from_checkpoint: null
+revision: null
+scale_lr: false
+seed: null
+set_grads_to_none: false
+tokenizer_name: null
+tracker_project_name: CTRL
+train_batch_size: 4
+train_data_dir: null
+use_8bit_adam: false
+validation_steps: 3000
+variant: null

logs/CTRL/events-Copy1.out.tfevents.1744013281.workspace-zd8unyjaj5q9-0.7332.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f55f10d49fbccdc76ce1bdf608dab109b6cae446828544a7e5855ac74fd44242
+size 13495277

logs/CTRL/events.out.tfevents.1744013281.workspace-zd8unyjaj5q9-0.7332.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4e2b6948d277cbd6a54d69b6cdab6340e43087ec6f4a12874a1774f427e3ee85
+size 18050566