diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..27f9ad3400e04dbc449df227bbf12df7696a54df 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +images_0.png filter=lfs diff=lfs merge=lfs -text diff --git a/.ipynb_checkpoints/Untitled-checkpoint.ipynb b/.ipynb_checkpoints/Untitled-checkpoint.ipynb new file mode 100644 index 0000000000000000000000000000000000000000..363fcab7ed6e9634e198cf5555ceb88932c9a245 --- /dev/null +++ b/.ipynb_checkpoints/Untitled-checkpoint.ipynb @@ -0,0 +1,6 @@ +{ + "cells": [], + "metadata": {}, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/README.md b/README.md new file mode 100644 index 0000000000000000000000000000000000000000..21095a7a02e45be12f1c8c39e7aaef0a98e6f085 --- /dev/null +++ b/README.md @@ -0,0 +1,43 @@ +--- +license: openrail++ +library_name: diffusers +tags: +- stable-diffusion-xl +- stable-diffusion-xl-diffusers +- text-to-image +- diffusers +- controlnet +- diffusers-training +base_model: stabilityai/stable-diffusion-xl-base-1.0 +inference: true +--- + + + + +# controlnet-sylviam00/output + +These are controlnet weights trained on stabilityai/stable-diffusion-xl-base-1.0 with new type of conditioning. +You can find some example images below. + +prompt: baby with black hair +![images_0)](./images_0.png) + + + +## Intended uses & limitations + +#### How to use + +```python +# TODO: add an example code snippet for running this diffusion pipeline +``` + +#### Limitations and bias + +[TODO: provide examples of latent issues and potential remediations] + +## Training details + +[TODO: describe the data used to train the model] \ No newline at end of file diff --git a/Untitled.ipynb b/Untitled.ipynb new file mode 100644 index 0000000000000000000000000000000000000000..1eb8dfbf8a8b3c9257f416ce5f0647a41e1801e7 --- /dev/null +++ b/Untitled.ipynb @@ -0,0 +1,159 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 2, + "id": "afd90476-00e7-49ca-a2e0-11276cdb5f2c", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "/home/ubuntu/ControlNet-xl/diffusers/src\n" + ] + } + ], + "source": [ + "%cd ~/ControlNet-xl/diffusers/src" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "756973fb-a3a3-4893-b269-0de115ca5782", + "metadata": {}, + "outputs": [], + "source": [ + "from diffusers import StableDiffusionControlNetPipeline, ControlNetModel, UniPCMultistepScheduler\n", + "from diffusers.utils import load_image\n", + "import torch" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "504793ad-e2c8-4b65-bf64-afb10d899d81", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "/home/ubuntu/ControlNet-xl/diffusers/examples/controlnet\n" + ] + } + ], + "source": [ + "%cd ~/ControlNet-xl/diffusers/examples/controlnet" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "id": "72a40359-e9ca-492b-b28c-d69ec88b5d30", + "metadata": {}, + "outputs": [ + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "b4e02de11c7243cfa566d271f41f293a", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "Loading pipeline components...: 0%| | 0/5 [00:00\u001b[0;34m\u001b[0m\n\u001b[1;32m 19\u001b[0m \u001b[0;31m# generate image\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 20\u001b[0m \u001b[0mgenerator\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mtorch\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mmanual_seed\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 21\u001b[0;31m image = pipe(\n\u001b[0m\u001b[1;32m 22\u001b[0m \u001b[0mprompt\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mnum_inference_steps\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;36m20\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mgenerator\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mgenerator\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mimage\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mcontrol_image\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 23\u001b[0m ).images[0]\n", + "\u001b[0;32m/usr/lib/python3/dist-packages/torch/utils/_contextlib.py\u001b[0m in \u001b[0;36mdecorate_context\u001b[0;34m(*args, **kwargs)\u001b[0m\n\u001b[1;32m 113\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0mdecorate_context\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 114\u001b[0m \u001b[0;32mwith\u001b[0m \u001b[0mctx_factory\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 115\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mfunc\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 116\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 117\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0mdecorate_context\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/ControlNet-xl/diffusers/src/diffusers/pipelines/controlnet/pipeline_controlnet.py\u001b[0m in \u001b[0;36m__call__\u001b[0;34m(self, prompt, image, height, width, num_inference_steps, timesteps, sigmas, guidance_scale, negative_prompt, num_images_per_prompt, eta, generator, latents, prompt_embeds, negative_prompt_embeds, ip_adapter_image, ip_adapter_image_embeds, output_type, return_dict, cross_attention_kwargs, controlnet_conditioning_scale, guess_mode, control_guidance_start, control_guidance_end, clip_skip, callback_on_step_end, callback_on_step_end_tensor_inputs, **kwargs)\u001b[0m\n\u001b[1;32m 1267\u001b[0m \u001b[0mcond_scale\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mcontrolnet_cond_scale\u001b[0m \u001b[0;34m*\u001b[0m \u001b[0mcontrolnet_keep\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mi\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1268\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 1269\u001b[0;31m down_block_res_samples, mid_block_res_sample = self.controlnet(\n\u001b[0m\u001b[1;32m 1270\u001b[0m \u001b[0mcontrol_model_input\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1271\u001b[0m \u001b[0mt\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m/usr/lib/python3/dist-packages/torch/nn/modules/module.py\u001b[0m in \u001b[0;36m_call_impl\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 1499\u001b[0m \u001b[0;32mor\u001b[0m \u001b[0m_global_backward_pre_hooks\u001b[0m \u001b[0;32mor\u001b[0m \u001b[0m_global_backward_hooks\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1500\u001b[0m or _global_forward_hooks or _global_forward_pre_hooks):\n\u001b[0;32m-> 1501\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mforward_call\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 1502\u001b[0m \u001b[0;31m# Do not call functions when jit is used\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1503\u001b[0m \u001b[0mfull_backward_hooks\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mnon_full_backward_hooks\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/.local/lib/python3.10/site-packages/accelerate/hooks.py\u001b[0m in \u001b[0;36mnew_forward\u001b[0;34m(module, *args, **kwargs)\u001b[0m\n\u001b[1;32m 164\u001b[0m \u001b[0moutput\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mmodule\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_old_forward\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 165\u001b[0m \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 166\u001b[0;31m \u001b[0moutput\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mmodule\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_old_forward\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 167\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0mmodule\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_hf_hook\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mpost_forward\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mmodule\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0moutput\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 168\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/ControlNet-xl/diffusers/src/diffusers/models/controlnet.py\u001b[0m in \u001b[0;36mforward\u001b[0;34m(self, sample, timestep, encoder_hidden_states, controlnet_cond, conditioning_scale, class_labels, timestep_cond, attention_mask, added_cond_kwargs, cross_attention_kwargs, guess_mode, return_dict)\u001b[0m\n\u001b[1;32m 776\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 777\u001b[0m \u001b[0;32melif\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mconfig\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0maddition_embed_type\u001b[0m \u001b[0;34m==\u001b[0m \u001b[0;34m\"text_time\"\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 778\u001b[0;31m \u001b[0;32mif\u001b[0m \u001b[0;34m\"text_embeds\"\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0;32min\u001b[0m \u001b[0madded_cond_kwargs\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 779\u001b[0m raise ValueError(\n\u001b[1;32m 780\u001b[0m \u001b[0;34mf\"{self.__class__} has the config param `addition_embed_type` set to 'text_time' which requires the keyword argument `text_embeds` to be passed in `added_cond_kwargs`\"\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;31mTypeError\u001b[0m: argument of type 'NoneType' is not iterable" + ] + } + ], + "source": [ + "base_model_path = \"stabilityai/stable-diffusion-xl-base-1.0\"\n", + "#controlnet_path = \"georgefen/Face-Landmark-ControlNet\"\n", + "controlnet_path = \"./output\"\n", + "\n", + "controlnet = ControlNetModel.from_pretrained(controlnet_path, torch_dtype=torch.float16)\n", + "pipe = StableDiffusionControlNetPipeline.from_pretrained(\n", + " base_model_path, controlnet=controlnet, torch_dtype=torch.float16, safety_checker = None,\n", + " requires_safety_checker = False\n", + ")\n", + "\n", + "# speed up diffusion process with faster scheduler and memory optimization\n", + "pipe.scheduler = UniPCMultistepScheduler.from_config(pipe.scheduler.config)\n", + "# memory optimization.\n", + "pipe.enable_model_cpu_offload()\n", + "\n", + "control_image = load_image(\"./00000_con.png\")\n", + "prompt = \"baby\"\n", + "\n", + "# generate image\n", + "generator = torch.manual_seed(0)\n", + "image = pipe(\n", + " prompt, num_inference_steps=20, generator=generator, image=control_image\n", + ").images[0]\n", + "image.save(\"./00000_out.png\")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "4cda01b0-228e-4f52-94cd-ca803fa5a9af", + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.10.12" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/checkpoint-1000/controlnet/config.json b/checkpoint-1000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/checkpoint-1000/controlnet/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/checkpoint-1000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-1000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2e183ba17cec2d2b9bb914915127d4c41cf4a6e7 --- /dev/null +++ b/checkpoint-1000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aec114504c12a891debe7532773f2c1545b13515b7877c152d424241b597d609 +size 5004167864 diff --git a/checkpoint-1000/optimizer.bin b/checkpoint-1000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..2a41b75ae506f0ca17ae5038b5c305fea9dcebe4 --- /dev/null +++ b/checkpoint-1000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dc8ef72fb8c3d1d32e13fb835c79fee88c6385cbeaa8e3a501dd3951ec0ce08 +size 10008840997 diff --git a/checkpoint-1000/random_states_0.pkl b/checkpoint-1000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..a6264c0b21e751c82e19ed8bd2ac773393401acd --- /dev/null +++ b/checkpoint-1000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f77328309e5aafb22c9ca4e36d9e20c8e775493690f48de77f0ce4d62613e15 +size 14599 diff --git a/checkpoint-1000/scaler.pt b/checkpoint-1000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..efdbd3c795f6b0d4144e68355e99c220ccdedd09 --- /dev/null +++ b/checkpoint-1000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68cff80b680ddf6e7abbef98b5f336b97f9b5963e2209307f639383870e8cc71 +size 557 diff --git a/checkpoint-1000/scheduler.bin b/checkpoint-1000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..2948b016ab3f41add89fdea0efa6587d63a96d23 --- /dev/null +++ b/checkpoint-1000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f34912fa092355c5a950e4967ea28cbb3556238a7857baa5999d228cde0ae4c3 +size 563 diff --git a/checkpoint-10000/controlnet/config.json b/checkpoint-10000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/checkpoint-10000/controlnet/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/checkpoint-10000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-10000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..60125c95e44c32c35e4c8ce853a119494e1aafee --- /dev/null +++ b/checkpoint-10000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c833f0c159e1e84a7684b3013f0bec5f0ae1cb47aa65a23e6e1e3df925af97e7 +size 5004167864 diff --git a/checkpoint-10000/optimizer.bin b/checkpoint-10000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..0fdd4e06f4111a27af66643c73730898bb027265 --- /dev/null +++ b/checkpoint-10000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3efa7f81870edec59aad6d8ff8807dace1111e92d44764c73c70df4b605399c1 +size 10008840997 diff --git a/checkpoint-10000/random_states_0.pkl b/checkpoint-10000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..8b0e814bd1d1740627f9283de07693c1c5c037c6 --- /dev/null +++ b/checkpoint-10000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6094ebf87697c597a09756d8d36fe3bfb9e91abb3a6dda294a55003ea9ead779 +size 14599 diff --git a/checkpoint-10000/scaler.pt b/checkpoint-10000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..b345659e084dfa08f03a221d79b2e302a4748dfe --- /dev/null +++ b/checkpoint-10000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9be2ad76dcbc923b00e6a142f6db62aad4a46c47bb83864ccb68ddc899d0ce78 +size 557 diff --git a/checkpoint-10000/scheduler.bin b/checkpoint-10000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..dfea8b103660873f57a0b99214cb9acb641ced7b --- /dev/null +++ b/checkpoint-10000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6bcd4cb37625cab1478c5f801ecf8dcfe8513c2acdf383cd99f5bc953b5e8a3 +size 563 diff --git a/checkpoint-2000/controlnet/config.json b/checkpoint-2000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/checkpoint-2000/controlnet/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/checkpoint-2000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-2000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3ee728c05b2a4019ac7c2a6197ccf2ed907a2363 --- /dev/null +++ b/checkpoint-2000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f220b03bce8265377c851382dee85a92dd5e2cc3fadb277f51e59ce09bb0141 +size 5004167864 diff --git a/checkpoint-2000/optimizer.bin b/checkpoint-2000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..71e86bef997dd39bc2dffb280a345f540f260cef --- /dev/null +++ b/checkpoint-2000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4d548a8ca5fb62e0e8b89f04272bb3299244a6432abb5a0d70f1c71234241ca +size 10008840997 diff --git a/checkpoint-2000/random_states_0.pkl b/checkpoint-2000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..cd0527d2a90d56b8bf30ad743bf80582f48d1647 --- /dev/null +++ b/checkpoint-2000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81eaf5c921fa2d7cbab8071dc0301b2ec15fdab95596daf172b8166f981bbf7 +size 14599 diff --git a/checkpoint-2000/scaler.pt b/checkpoint-2000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..21ece35416ce79724d347155f11cfa297b97cabc --- /dev/null +++ b/checkpoint-2000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd2de9749828adacdf103bf6e9592702bb7067a2c1df27dd62ab38c1eb8c070f +size 557 diff --git a/checkpoint-2000/scheduler.bin b/checkpoint-2000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..64373fe7f87efc1d992d705ae49aa37ba7ddd6b1 --- /dev/null +++ b/checkpoint-2000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfe94afd21b04fe331bf93a36e6de4869425c4da4a32303493f7f8b96dd6ca61 +size 563 diff --git a/checkpoint-3000/controlnet/config.json b/checkpoint-3000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/checkpoint-3000/controlnet/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/checkpoint-3000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-3000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..94d123a875a4e7ebadac3740a13d93bf9a2c36d7 --- /dev/null +++ b/checkpoint-3000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a8dccb8dcb05f91a03c30645f958bdfb71c21626da4c144dacc54c3fcbb7492 +size 5004167864 diff --git a/checkpoint-3000/optimizer.bin b/checkpoint-3000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..bbc3e7f2e104bb9e7ecd6c330e9add5a863c7da9 --- /dev/null +++ b/checkpoint-3000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dd032af0679caa70a46f4d43a60aaa524662dc53d6525b6239448c4f77f92b5 +size 10008840997 diff --git a/checkpoint-3000/random_states_0.pkl b/checkpoint-3000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..849afa8986b4e90c91dc808ab39f66a7af8a5ba2 --- /dev/null +++ b/checkpoint-3000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e361dda8a471a9752db230d2b3d76af21805f3ec40939a068a3463a562ab209c +size 14599 diff --git a/checkpoint-3000/scaler.pt b/checkpoint-3000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..2888c9ddc2c30e6b47ce0e6abcc8e2d1303aab00 --- /dev/null +++ b/checkpoint-3000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb1f9398b77268202e8e1465734a63d123b1ef11c27f20f2473677e9883a6869 +size 557 diff --git a/checkpoint-3000/scheduler.bin b/checkpoint-3000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..0b6eaa6a5a88bbc1e19c9479751f75698e848c9d --- /dev/null +++ b/checkpoint-3000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d6ec0338061ab706b1805a9e2966ca126b26619cd90bb73133127681b9de370 +size 563 diff --git a/checkpoint-4000/controlnet/config.json b/checkpoint-4000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/checkpoint-4000/controlnet/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/checkpoint-4000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-4000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..69e737cc019c61b315020d0fd221fc0e4ebb5428 --- /dev/null +++ b/checkpoint-4000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ab9b3831cfa71debce180e161926e87c3fcf3529c647042940964af9fd55c70 +size 5004167864 diff --git a/checkpoint-4000/optimizer.bin b/checkpoint-4000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..604c8fdd48b7fd209d051afb8ce872f3b6720c0e --- /dev/null +++ b/checkpoint-4000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0a412c5ee466eb02dc29d962d624605893c492d61d0e65c4ff7f343ed4ea48e +size 10008840997 diff --git a/checkpoint-4000/random_states_0.pkl b/checkpoint-4000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..158ab9b568cecff79997d0550905e26c50e8fea0 --- /dev/null +++ b/checkpoint-4000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39e927ecbaa140716d50566200ca64b673c5829e96d06087bb4b2e3b797c88da +size 14599 diff --git a/checkpoint-4000/scaler.pt b/checkpoint-4000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6dfc1dc5fe962ebf4423f5d584aeb4e90dc01be --- /dev/null +++ b/checkpoint-4000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09a61ecdaa4a69ba865e0b9e19169660549c34c60a83537ab5ece413678520ab +size 557 diff --git a/checkpoint-4000/scheduler.bin b/checkpoint-4000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..313279d03cea02360a7b766639ab1649570431af --- /dev/null +++ b/checkpoint-4000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7edd8082ac389d0c946c2ac507fc3e4d21eaad8a44fcb3f7b57ebbd1b62363dc +size 563 diff --git a/checkpoint-5000/controlnet/config.json b/checkpoint-5000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/checkpoint-5000/controlnet/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/checkpoint-5000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-5000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..215c0c01d2357de724950741a6bdc98b4da5f496 --- /dev/null +++ b/checkpoint-5000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3e3b43c0b6abcf94df69d0cae78082383d1ed619ad0b8bf0abc7fdd5f45e97e +size 5004167864 diff --git a/checkpoint-5000/optimizer.bin b/checkpoint-5000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..4fa57f605bd18a4923f01f08448d22ab5a84f99f --- /dev/null +++ b/checkpoint-5000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de68397a0018cced56ca9571fbe7d04c89c43f2649d5c25ba940062df806539c +size 10008840997 diff --git a/checkpoint-5000/random_states_0.pkl b/checkpoint-5000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..ab4742e82d8384cae1a87731f7b1263b017351aa --- /dev/null +++ b/checkpoint-5000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ceaa85cbd30c99b8a99dec89078c36df5402a5b069636f7379f2289df89b0124 +size 14599 diff --git a/checkpoint-5000/scaler.pt b/checkpoint-5000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a0a5a2d6700d39df12b85e2a8ee02926333f46a --- /dev/null +++ b/checkpoint-5000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a41313b6733b65c1acca917a7c2ced06503c11b898e6cd5de1e6a9f13bfb54ef +size 557 diff --git a/checkpoint-5000/scheduler.bin b/checkpoint-5000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..c37dd5f1ba284353140794600e68bbd00f948e8b --- /dev/null +++ b/checkpoint-5000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00b6b035e89b3f614d8a7babea59ef588908ea69ffc4eb871a24c002d6356cdc +size 563 diff --git a/checkpoint-6000/controlnet/config.json b/checkpoint-6000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/checkpoint-6000/controlnet/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/checkpoint-6000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-6000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c8b1d555ed8086c166b665dbec1af6e555a2cb45 --- /dev/null +++ b/checkpoint-6000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47364f1693f3765122cbb5d8b37bd3c9f749f6c47781feb398467ed315c34f6e +size 5004167864 diff --git a/checkpoint-6000/optimizer.bin b/checkpoint-6000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..17d15da0fc5fa3f15cede1948e297bc89842b7b1 --- /dev/null +++ b/checkpoint-6000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8bed8dcf81c967258251fef1fa6fdf906ba83f22d389bccb2a04f63a38d99ed +size 10008840997 diff --git a/checkpoint-6000/random_states_0.pkl b/checkpoint-6000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..0d2acc228a6c3994ddb37a7d7cb4114dd31091fd --- /dev/null +++ b/checkpoint-6000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1c1c6f7e064c8200fccac9ad3f6a7b7dc6e871c4056fa4b9ea847b8581bc36d +size 14599 diff --git a/checkpoint-6000/scaler.pt b/checkpoint-6000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fd17ac3026715d5a68d70922df4742631319059 --- /dev/null +++ b/checkpoint-6000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a00ef97fc41c0d653df466126d855f16646dd10726d3ac99a23f55ca70ec19a +size 557 diff --git a/checkpoint-6000/scheduler.bin b/checkpoint-6000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..7413abefc4f8286274da3243afd962fa1696fff1 --- /dev/null +++ b/checkpoint-6000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a0df2dffc0559ef6134e0571ccfecb406ec3a612efe566ae6f1c62bcf1ab353 +size 563 diff --git a/checkpoint-7000/controlnet/config.json b/checkpoint-7000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/checkpoint-7000/controlnet/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/checkpoint-7000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-7000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a503c5c77bde7d77aef151382a61553a45b01f30 --- /dev/null +++ b/checkpoint-7000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84ad26c41c69645235529088e7ddc5486fe11992f1ba38eacd77899b3f325bae +size 5004167864 diff --git a/checkpoint-7000/optimizer.bin b/checkpoint-7000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..453e101549830426ef65d8a5710478f983b8194f --- /dev/null +++ b/checkpoint-7000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36d3b2a7a2aa8db83e10055d14cf0764fed6ddf9bfc69a0b8b4228c4679cc220 +size 10008840997 diff --git a/checkpoint-7000/random_states_0.pkl b/checkpoint-7000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..6b7815252ed98401ae52ed84a01104e66f204f71 --- /dev/null +++ b/checkpoint-7000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a45a5926d9a6a8352d5f769a6a8990c22e4039d6f1dee9898b04542abed01db4 +size 14599 diff --git a/checkpoint-7000/scaler.pt b/checkpoint-7000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ceac8d008df631f48c13ff48e83da859977ff02 --- /dev/null +++ b/checkpoint-7000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d22aed3a858ee389297b2101bb2ed7ee9e37744f1a1f75273dbdf045d65b041a +size 557 diff --git a/checkpoint-7000/scheduler.bin b/checkpoint-7000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..5d3f4d330277dbbc7bdd2058db7f7c8331323e27 --- /dev/null +++ b/checkpoint-7000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0e6cbbd05427cb09a990f303190d8f0051084080c856964101f9aea5e481068 +size 563 diff --git a/checkpoint-8000/controlnet/config.json b/checkpoint-8000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/checkpoint-8000/controlnet/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/checkpoint-8000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-8000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..138ebef58c56c7753fbe3842160c5529edfe7eee --- /dev/null +++ b/checkpoint-8000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7da0d28f7dab991e4a987f4bac29a7c4eb332cc3a723f8e58856aa1f4fa7e4e2 +size 5004167864 diff --git a/checkpoint-8000/optimizer.bin b/checkpoint-8000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..542371e4b59e9cc9e9cd2160776d6a64849a1ce3 --- /dev/null +++ b/checkpoint-8000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d1d9b3c82dc21ade498b64810f524a8a38d476b651e756a1ecb0c71f159c9f6 +size 10008840997 diff --git a/checkpoint-8000/random_states_0.pkl b/checkpoint-8000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..7af4bd7d91c3d5a4fa555c58ee9a45bcb352ed1f --- /dev/null +++ b/checkpoint-8000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3334ab6cc5485796d375c2c774e7f6d03cc6e388e9cff13487e59300a640b282 +size 14599 diff --git a/checkpoint-8000/scaler.pt b/checkpoint-8000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd25dc8bd6a1a15851636b4ebafe829cb0ed1b0d --- /dev/null +++ b/checkpoint-8000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b278cd6e09360f31a3d837f80dee4c2ce4d9c9d186a939ecf157e1a0deb793f3 +size 557 diff --git a/checkpoint-8000/scheduler.bin b/checkpoint-8000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..3474e1011e1462a8eab544164dfbd39366ca4da4 --- /dev/null +++ b/checkpoint-8000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:630cc19a3cb4ed5f1d67a0d535bfec489c348a6a88102d8fe945e1a1baf47eb6 +size 563 diff --git a/checkpoint-9000/controlnet/config.json b/checkpoint-9000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/checkpoint-9000/controlnet/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/checkpoint-9000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-9000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2e5a826eab59be9328416a828f7783ec0ce469d1 --- /dev/null +++ b/checkpoint-9000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43fcf91dd4ec72ffe88107939863fee6f8d24dda3b9bc9bdd4d76d46e5c7032f +size 5004167864 diff --git a/checkpoint-9000/optimizer.bin b/checkpoint-9000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..1e4a6ab1d41804a4c1fe7f23c12afaff7576c955 --- /dev/null +++ b/checkpoint-9000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ebdd36153c916ca9308eea430ab2d310349b7b8c1185bb04cb5df9dce0c77e1 +size 10008840997 diff --git a/checkpoint-9000/random_states_0.pkl b/checkpoint-9000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..a8ffabe1b786f7ced5a19d5ba9a927593d133197 --- /dev/null +++ b/checkpoint-9000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e24b1e895c71c638d2a0b0a010fddd50866ca3a8c6de64fb0abf286879be2b62 +size 14599 diff --git a/checkpoint-9000/scaler.pt b/checkpoint-9000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c7306b1b0e5b21e2fec7bb12b5a46cc7b66591f --- /dev/null +++ b/checkpoint-9000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4be7a7b56cfc3e79d33648a4c49d4f11c6593d8d653b129207b2e38f2684a284 +size 557 diff --git a/checkpoint-9000/scheduler.bin b/checkpoint-9000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..441f03705c86ea73ba155600524d371b9ec283e5 --- /dev/null +++ b/checkpoint-9000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c13d19a790c3b70de0c58d8be6eda53cbc852819b276ffcfe81fcb4f0bbdb79a +size 563 diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/diffusion_pytorch_model.safetensors b/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..60125c95e44c32c35e4c8ce853a119494e1aafee --- /dev/null +++ b/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c833f0c159e1e84a7684b3013f0bec5f0ae1cb47aa65a23e6e1e3df925af97e7 +size 5004167864 diff --git a/image_control.png b/image_control.png new file mode 100644 index 0000000000000000000000000000000000000000..e4f5e7a95df58a9561713fda98f465a869740d32 Binary files /dev/null and b/image_control.png differ diff --git a/images_0.png b/images_0.png new file mode 100644 index 0000000000000000000000000000000000000000..573ec563060b089dbaa89fd0b36f1ab48d68f1fb --- /dev/null +++ b/images_0.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f96f942541ee30077203e346ccb13410dd6785ab949ee20b9ecd7056e51d008 +size 1384259 diff --git a/logs/sd_xl_train_controlnet/1715654774.1921992/events.out.tfevents.1715654774.132-145-137-145.3057.1 b/logs/sd_xl_train_controlnet/1715654774.1921992/events.out.tfevents.1715654774.132-145-137-145.3057.1 new file mode 100644 index 0000000000000000000000000000000000000000..a5d6ab0b4bd135f5d021b44812021ecd740241b7 --- /dev/null +++ b/logs/sd_xl_train_controlnet/1715654774.1921992/events.out.tfevents.1715654774.132-145-137-145.3057.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7577e1e2d1693f3397d0cc099ef552c0148c75012a288159799b91b1540d11d1 +size 2591 diff --git a/logs/sd_xl_train_controlnet/1715654774.2111096/hparams.yml b/logs/sd_xl_train_controlnet/1715654774.2111096/hparams.yml new file mode 100644 index 0000000000000000000000000000000000000000..ecfcc78af7347038e106468cacbacb68baab61d5 --- /dev/null +++ b/logs/sd_xl_train_controlnet/1715654774.2111096/hparams.yml @@ -0,0 +1,54 @@ +adam_beta1: 0.9 +adam_beta2: 0.999 +adam_epsilon: 1.0e-08 +adam_weight_decay: 0.01 +allow_tf32: false +cache_dir: null +caption_column: caption +checkpointing_steps: 1000 +checkpoints_total_limit: null +conditioning_image_column: condition_img +controlnet_model_name_or_path: null +crops_coords_top_left_h: 0 +crops_coords_top_left_w: 0 +dataloader_num_workers: 0 +dataset_config_name: null +dataset_name: cld07/captioned_ffhq_50k_512 +enable_npu_flash_attention: false +enable_xformers_memory_efficient_attention: false +gradient_accumulation_steps: 1 +gradient_checkpointing: false +hub_model_id: null +hub_token: null +image_column: source_image +learning_rate: 1.0e-05 +logging_dir: logs +lr_num_cycles: 1 +lr_power: 1.0 +lr_scheduler: constant +lr_warmup_steps: 500 +max_grad_norm: 1.0 +max_train_samples: null +max_train_steps: 10000 +mixed_precision: fp16 +num_train_epochs: 1 +num_validation_images: 4 +output_dir: ./output +pretrained_model_name_or_path: stabilityai/stable-diffusion-xl-base-1.0 +pretrained_vae_model_name_or_path: null +proportion_empty_prompts: 0 +push_to_hub: true +report_to: tensorboard +resolution: 512 +resume_from_checkpoint: null +revision: null +scale_lr: false +seed: 42 +set_grads_to_none: false +tokenizer_name: null +tracker_project_name: sd_xl_train_controlnet +train_batch_size: 4 +train_data_dir: null +use_8bit_adam: false +validation_steps: 1000 +variant: null diff --git a/logs/sd_xl_train_controlnet/events.out.tfevents.1715654774.132-145-137-145.3057.0 b/logs/sd_xl_train_controlnet/events.out.tfevents.1715654774.132-145-137-145.3057.0 new file mode 100644 index 0000000000000000000000000000000000000000..8d976e9ab79d381b116eb1224360e8e876c327d8 --- /dev/null +++ b/logs/sd_xl_train_controlnet/events.out.tfevents.1715654774.132-145-137-145.3057.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26e87f08f41ad0120c05878a40012142fce4a1addf0c4ae603164a998ad8f0e6 +size 2372327