diff --git a/.gitattributes b/.gitattributes index c7d9f3332a950355d5a77d85000f05e6f45435ea..2b3390966e1fe27f8df90996c30703599b0a34a8 100644 --- a/.gitattributes +++ b/.gitattributes @@ -32,3 +32,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +images_0.png filter=lfs diff=lfs merge=lfs -text +images_1.png filter=lfs diff=lfs merge=lfs -text +images_2.png filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000000000000000000000000000000000000..5522b71205407ce5bcbca13ab054d68f1fec66ae --- /dev/null +++ b/README.md @@ -0,0 +1,24 @@ + +--- +license: creativeml-openrail-m +base_model: stabilityai/stable-diffusion-2-1-base +tags: +- stable-diffusion +- stable-diffusion-diffusers +- text-to-image +- diffusers +- controlnet +inference: true +--- + +# controlnet-killah-t-cell/boxes_cn + +These are controlnet weights trained on stabilityai/stable-diffusion-2-1-base with new type of conditioning. +You can find some example images below. +prompt: Two men wearing hats with trees in the background +![images_0)](./images_0.png) +prompt: Two Girls smiling, professional dslr photograph, dark background, studio lights, high quality +![images_1)](./images_1.png) +prompt: a clown, oil on canvas, bittersweet expression +![images_2)](./images_2.png) + diff --git a/checkpoint-10/controlnet/config.json b/checkpoint-10/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..53b3d3e22340c0e0c4cf0028c244ac2e3bef6b33 --- /dev/null +++ b/checkpoint-10/controlnet/config.json @@ -0,0 +1,47 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.18.0.dev0", + "act_fn": "silu", + "attention_head_dim": [ + 5, + 10, + 20, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "class_embed_type": null, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 1024, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "upcast_attention": false, + "use_linear_projection": true +} diff --git a/checkpoint-10/controlnet/diffusion_pytorch_model.bin b/checkpoint-10/controlnet/diffusion_pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..4457d531f3ca9ac5c998ed3f947732e358689c99 --- /dev/null +++ b/checkpoint-10/controlnet/diffusion_pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e1b839df77004959d160081a17b0c4eb7f52e183d4fe2ab5e03b846f9fa1280 +size 1457056057 diff --git a/checkpoint-10/optimizer.bin b/checkpoint-10/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..a1c99259d1212d4f1919c98614ea2c6c1e30b6ab --- /dev/null +++ b/checkpoint-10/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:335643b7a3aedfcad0907730e33dcc9dc63ff594e6c3c2196368d5cdf3699f4c +size 2914110681 diff --git a/checkpoint-10/random_states_0.pkl b/checkpoint-10/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..1c223fdfec7ac6d5d4b8d59c69da2b4f6db45f8c --- /dev/null +++ b/checkpoint-10/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b81ebaa34b14ef0dc6caa6f36b837df041efc1c067f8aaeb40177fc22052255f +size 14791 diff --git a/checkpoint-10/scheduler.bin b/checkpoint-10/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..ddbf152cb78531f1974f4c9ad4496474e5b193fd --- /dev/null +++ b/checkpoint-10/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40d0b17e9c9b0baf0c44a59b9d7e8b78aed0545d5ab2b9d9d9dbb13aed8db9e8 +size 563 diff --git a/checkpoint-10000/controlnet/config.json b/checkpoint-10000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..53b3d3e22340c0e0c4cf0028c244ac2e3bef6b33 --- /dev/null +++ b/checkpoint-10000/controlnet/config.json @@ -0,0 +1,47 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.18.0.dev0", + "act_fn": "silu", + "attention_head_dim": [ + 5, + 10, + 20, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "class_embed_type": null, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 1024, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "upcast_attention": false, + "use_linear_projection": true +} diff --git a/checkpoint-10000/controlnet/diffusion_pytorch_model.bin b/checkpoint-10000/controlnet/diffusion_pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..4f8935e01841f672b315b06cad59846c976484f3 --- /dev/null +++ b/checkpoint-10000/controlnet/diffusion_pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01df5dc8bbe168f8aa6139648390cc6085a52c3d1458794aaa1dffe2019a40b8 +size 1457056057 diff --git a/checkpoint-10000/optimizer.bin b/checkpoint-10000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..90dea53d7a9d3cbc2c88ed9dd3fb8f0ec543d3f4 --- /dev/null +++ b/checkpoint-10000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5167d154a7eb89dc88cfd64579c30d3537ab9fabf69d894296a1b8ff2c827e54 +size 2914110681 diff --git a/checkpoint-10000/random_states_0.pkl b/checkpoint-10000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..f4fd9bb766ad7623de67a27dbcbf8efd65063e3f --- /dev/null +++ b/checkpoint-10000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10db186535e4379766ed74cda594992fc675e2796f796a132bde91acaefdfb49 +size 14663 diff --git a/checkpoint-10000/scheduler.bin b/checkpoint-10000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..dfea8b103660873f57a0b99214cb9acb641ced7b --- /dev/null +++ b/checkpoint-10000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6bcd4cb37625cab1478c5f801ecf8dcfe8513c2acdf383cd99f5bc953b5e8a3 +size 563 diff --git a/checkpoint-12000/controlnet/config.json b/checkpoint-12000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..53b3d3e22340c0e0c4cf0028c244ac2e3bef6b33 --- /dev/null +++ b/checkpoint-12000/controlnet/config.json @@ -0,0 +1,47 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.18.0.dev0", + "act_fn": "silu", + "attention_head_dim": [ + 5, + 10, + 20, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "class_embed_type": null, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 1024, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "upcast_attention": false, + "use_linear_projection": true +} diff --git a/checkpoint-12000/controlnet/diffusion_pytorch_model.bin b/checkpoint-12000/controlnet/diffusion_pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..b6f808a8da45a466478d3d124bc9775addf82ab6 --- /dev/null +++ b/checkpoint-12000/controlnet/diffusion_pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:774a78ac3a36684e6eaeaa6c1a7af4657f876ab86127900e62c0185dfd266082 +size 1457056057 diff --git a/checkpoint-12000/optimizer.bin b/checkpoint-12000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..9741e4f51c92fe63608b8753bb49c3b43f8e9f47 --- /dev/null +++ b/checkpoint-12000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:448f5cbef0ed524ff2fe99fe95dc692edb0430fdfce2311e9f2f8730a96f5aa6 +size 2914110681 diff --git a/checkpoint-12000/random_states_0.pkl b/checkpoint-12000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..1bd4e75dd21d0f0798dda0a1ccf8798643470d35 --- /dev/null +++ b/checkpoint-12000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51d294a310f23b082a7c13cb8b27dcb7b7737b3c6d6744b466c0ed97b4f801dc +size 14663 diff --git a/checkpoint-12000/scheduler.bin b/checkpoint-12000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..e6243fe8b64a7112d637d0f1a8abdad6968fc7e8 --- /dev/null +++ b/checkpoint-12000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9855aba5ac021cfcebb517ce8e7c056e6a3e01548a489078133809249c0000db +size 563 diff --git a/checkpoint-20/controlnet/config.json b/checkpoint-20/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..53b3d3e22340c0e0c4cf0028c244ac2e3bef6b33 --- /dev/null +++ b/checkpoint-20/controlnet/config.json @@ -0,0 +1,47 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.18.0.dev0", + "act_fn": "silu", + "attention_head_dim": [ + 5, + 10, + 20, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "class_embed_type": null, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 1024, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "upcast_attention": false, + "use_linear_projection": true +} diff --git a/checkpoint-20/controlnet/diffusion_pytorch_model.bin b/checkpoint-20/controlnet/diffusion_pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..9e73d2128725a8fccd0a391eb9a7505b5a778100 --- /dev/null +++ b/checkpoint-20/controlnet/diffusion_pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a6f578a7f0b5f63c69ae31d9765f8d28917706e5b36754989f779db58c25ae0 +size 1457056057 diff --git a/checkpoint-20/optimizer.bin b/checkpoint-20/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..78e8ee2710cf2eb187e59bbeab5d65e46320943e --- /dev/null +++ b/checkpoint-20/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7de0bbcb219f343eecf5862e8bd388760273028829d94cb82b9d3edf1cd72d3 +size 2914110681 diff --git a/checkpoint-20/random_states_0.pkl b/checkpoint-20/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..cea3e7f4b7f83db853d16cda397454fea0b2abef --- /dev/null +++ b/checkpoint-20/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f165526ba2a23f9980a8001e55eea7e6dad863926ba01e79d5f3a3b4161508a +size 14791 diff --git a/checkpoint-20/scheduler.bin b/checkpoint-20/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..07000351facc107c206fb4dc6ac02fc2ce8d77ef --- /dev/null +++ b/checkpoint-20/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86a75911787b041c041f381c3e28503763c6aad82e7a6c622f01430ef08131df +size 563 diff --git a/checkpoint-2000/controlnet/config.json b/checkpoint-2000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..53b3d3e22340c0e0c4cf0028c244ac2e3bef6b33 --- /dev/null +++ b/checkpoint-2000/controlnet/config.json @@ -0,0 +1,47 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.18.0.dev0", + "act_fn": "silu", + "attention_head_dim": [ + 5, + 10, + 20, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "class_embed_type": null, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 1024, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "upcast_attention": false, + "use_linear_projection": true +} diff --git a/checkpoint-2000/controlnet/diffusion_pytorch_model.bin b/checkpoint-2000/controlnet/diffusion_pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..88a8809c6623c2db691deb7a9862f2a284bb7ec4 --- /dev/null +++ b/checkpoint-2000/controlnet/diffusion_pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cafff2c2b43d48134e1b740a56061e84b6cdb35a3652cec6caebaa6b5cada01 +size 1457056057 diff --git a/checkpoint-2000/optimizer.bin b/checkpoint-2000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..a579f34080fe8d4bca587b688fc9ca97eb15cd88 --- /dev/null +++ b/checkpoint-2000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e684e37f37e4f9ae167bc2a40c326365fcbbef342b897a46387ebeb6ea0a5fea +size 2914110681 diff --git a/checkpoint-2000/random_states_0.pkl b/checkpoint-2000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..5ae4a9f39a8655e9a0fe22db98fb787ba7529954 --- /dev/null +++ b/checkpoint-2000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d21181e3f0a1106d895fc027646f0e2941c04a67a64092310a324efb028c41c9 +size 14663 diff --git a/checkpoint-2000/scheduler.bin b/checkpoint-2000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..64373fe7f87efc1d992d705ae49aa37ba7ddd6b1 --- /dev/null +++ b/checkpoint-2000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfe94afd21b04fe331bf93a36e6de4869425c4da4a32303493f7f8b96dd6ca61 +size 563 diff --git a/checkpoint-4000/controlnet/config.json b/checkpoint-4000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..53b3d3e22340c0e0c4cf0028c244ac2e3bef6b33 --- /dev/null +++ b/checkpoint-4000/controlnet/config.json @@ -0,0 +1,47 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.18.0.dev0", + "act_fn": "silu", + "attention_head_dim": [ + 5, + 10, + 20, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "class_embed_type": null, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 1024, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "upcast_attention": false, + "use_linear_projection": true +} diff --git a/checkpoint-4000/controlnet/diffusion_pytorch_model.bin b/checkpoint-4000/controlnet/diffusion_pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..d7079052b6d3ca08f29eed09cefa1193c1d31628 --- /dev/null +++ b/checkpoint-4000/controlnet/diffusion_pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83c35a86740708615dcc6575ac2c8b9edbc49e3038412f2ce4093e7bbacd014b +size 1457056057 diff --git a/checkpoint-4000/optimizer.bin b/checkpoint-4000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..985826ec1cba26f46383225ce4103b46e26f331a --- /dev/null +++ b/checkpoint-4000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:673f16de14ece3a579a49fd87f6e85fa5ac5a9d1a73f7736f76eb2322943ee70 +size 2914110681 diff --git a/checkpoint-4000/random_states_0.pkl b/checkpoint-4000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..0a69e5ac210177c26743c28f5c38c10c87ea3b88 --- /dev/null +++ b/checkpoint-4000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fed6e24d24a0334da266a7924e615b8edd93d87704c5e4943b9e8d46392d87d +size 14663 diff --git a/checkpoint-4000/scheduler.bin b/checkpoint-4000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..313279d03cea02360a7b766639ab1649570431af --- /dev/null +++ b/checkpoint-4000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7edd8082ac389d0c946c2ac507fc3e4d21eaad8a44fcb3f7b57ebbd1b62363dc +size 563 diff --git a/checkpoint-5000/controlnet/config.json b/checkpoint-5000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..53b3d3e22340c0e0c4cf0028c244ac2e3bef6b33 --- /dev/null +++ b/checkpoint-5000/controlnet/config.json @@ -0,0 +1,47 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.18.0.dev0", + "act_fn": "silu", + "attention_head_dim": [ + 5, + 10, + 20, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "class_embed_type": null, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 1024, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "upcast_attention": false, + "use_linear_projection": true +} diff --git a/checkpoint-5000/controlnet/diffusion_pytorch_model.bin b/checkpoint-5000/controlnet/diffusion_pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..50a7bdd2b401257cf4f7e5567f70c25985261fc4 --- /dev/null +++ b/checkpoint-5000/controlnet/diffusion_pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ff212b02b6a5bab57dc69e67348f324c7e99eb5225d513f9123680a3cb707dc +size 1457056057 diff --git a/checkpoint-5000/optimizer.bin b/checkpoint-5000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..441859f1e372916baf8188c3966a0f75f3fc8b9a --- /dev/null +++ b/checkpoint-5000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75d84050bc1a15dd68bfc77d3f2094912f97419ecde82e943273d06ce2d5e711 +size 2914110681 diff --git a/checkpoint-5000/random_states_0.pkl b/checkpoint-5000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..44e781abe7b4cab3db1f2c4b771a18238cc75837 --- /dev/null +++ b/checkpoint-5000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00f1d0b5a28175b6f61a46b0eee3c06d28902b51790db398c0bcb28e93ac927d +size 14727 diff --git a/checkpoint-5000/scheduler.bin b/checkpoint-5000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..c37dd5f1ba284353140794600e68bbd00f948e8b --- /dev/null +++ b/checkpoint-5000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00b6b035e89b3f614d8a7babea59ef588908ea69ffc4eb871a24c002d6356cdc +size 563 diff --git a/checkpoint-6000/controlnet/config.json b/checkpoint-6000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..53b3d3e22340c0e0c4cf0028c244ac2e3bef6b33 --- /dev/null +++ b/checkpoint-6000/controlnet/config.json @@ -0,0 +1,47 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.18.0.dev0", + "act_fn": "silu", + "attention_head_dim": [ + 5, + 10, + 20, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "class_embed_type": null, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 1024, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "upcast_attention": false, + "use_linear_projection": true +} diff --git a/checkpoint-6000/controlnet/diffusion_pytorch_model.bin b/checkpoint-6000/controlnet/diffusion_pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..ea5e25f1bde75dad3018164b5e26e20e6900abf0 --- /dev/null +++ b/checkpoint-6000/controlnet/diffusion_pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fc103000db7a68813523b804b97d63b106b5a529a6605fd8f466dee0a546e29 +size 1457056057 diff --git a/checkpoint-6000/optimizer.bin b/checkpoint-6000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..ac55e78e93412ba7698ca1e4b050dc61f190474d --- /dev/null +++ b/checkpoint-6000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4847c704d2250b6c4e7aae8abde414846163f1ec4fbf63d73827bef9741ef84a +size 2914110681 diff --git a/checkpoint-6000/random_states_0.pkl b/checkpoint-6000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..913872645d9610d4aaa01019d33286b2cee4f5ab --- /dev/null +++ b/checkpoint-6000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf2d3d5e5df3d7cafc42875e3147e740c8875449c2d0329b314dc28f909e7eee +size 14663 diff --git a/checkpoint-6000/scheduler.bin b/checkpoint-6000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..7413abefc4f8286274da3243afd962fa1696fff1 --- /dev/null +++ b/checkpoint-6000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a0df2dffc0559ef6134e0571ccfecb406ec3a612efe566ae6f1c62bcf1ab353 +size 563 diff --git a/checkpoint-8000/controlnet/config.json b/checkpoint-8000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..53b3d3e22340c0e0c4cf0028c244ac2e3bef6b33 --- /dev/null +++ b/checkpoint-8000/controlnet/config.json @@ -0,0 +1,47 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.18.0.dev0", + "act_fn": "silu", + "attention_head_dim": [ + 5, + 10, + 20, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "class_embed_type": null, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 1024, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "upcast_attention": false, + "use_linear_projection": true +} diff --git a/checkpoint-8000/controlnet/diffusion_pytorch_model.bin b/checkpoint-8000/controlnet/diffusion_pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..5aa058219ab894ad9b9284547641520b25282ae9 --- /dev/null +++ b/checkpoint-8000/controlnet/diffusion_pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44582a20461ff087100df2a77ad55fe991dcfb917c9dbc9d1e6fd11d8c4acaa6 +size 1457056057 diff --git a/checkpoint-8000/optimizer.bin b/checkpoint-8000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..12266100d5ac3202f7beb72269777c9913655903 --- /dev/null +++ b/checkpoint-8000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2068d7219fd717bc7cbe19b2fa57cc66187783e033b2657d8d08f18292a19524 +size 2914110681 diff --git a/checkpoint-8000/random_states_0.pkl b/checkpoint-8000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..b4414a48142d6e342d9b0129ba65c590bc117286 --- /dev/null +++ b/checkpoint-8000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fad684947aff459619dbbb6389d5d70c892ae1c097eff6768fe5feffe63297a1 +size 14663 diff --git a/checkpoint-8000/scheduler.bin b/checkpoint-8000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..3474e1011e1462a8eab544164dfbd39366ca4da4 --- /dev/null +++ b/checkpoint-8000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:630cc19a3cb4ed5f1d67a0d535bfec489c348a6a88102d8fe945e1a1baf47eb6 +size 563 diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..53b3d3e22340c0e0c4cf0028c244ac2e3bef6b33 --- /dev/null +++ b/config.json @@ -0,0 +1,47 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.18.0.dev0", + "act_fn": "silu", + "attention_head_dim": [ + 5, + 10, + 20, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "class_embed_type": null, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 1024, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "upcast_attention": false, + "use_linear_projection": true +} diff --git a/diffusion_pytorch_model.bin b/diffusion_pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..fc60cf07f7106e741abfdfbc5b58a13ae4ccd5c2 --- /dev/null +++ b/diffusion_pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac644575fc6dbf001f3d9836209ae77145040cbb9d54cbb8a932c17d635b3898 +size 1457056057 diff --git a/image_control.png b/image_control.png new file mode 100644 index 0000000000000000000000000000000000000000..2886ac967b0293e8f23f20aaaea8316130d840a7 Binary files /dev/null and b/image_control.png differ diff --git a/images_0.png b/images_0.png new file mode 100644 index 0000000000000000000000000000000000000000..b8cc9e14228ea1f51fd463ef55300006582a8629 --- /dev/null +++ b/images_0.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ef7a9ae6803c893b662ced0a4df0a277a5c9842e605d6248b1ed6423e9b9b87 +size 1923448 diff --git a/images_1.png b/images_1.png new file mode 100644 index 0000000000000000000000000000000000000000..38539812cf48a6f7c9e16fbb94236543e52e6144 --- /dev/null +++ b/images_1.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:665379a56285f7becc1a188a9a89d39a0188b39a94dccf6f1bbcf575bbeea251 +size 1591066 diff --git a/images_2.png b/images_2.png new file mode 100644 index 0000000000000000000000000000000000000000..3fd0d4e1ececc53c879b06655a19cfe8a488f5b3 --- /dev/null +++ b/images_2.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40dcb771e737292a354b897a47c7f84ab31fc63b6dc65d014396019ef8fc8ff1 +size 1734464