update model

Files changed (3) hide show

README.md CHANGED Viewed

@@ -1,3 +1,43 @@
 ---
 license: apache-2.0
 ---

 ---
 license: apache-2.0
+tags:
+- pytorch
+- diffusers
+- text-to-image
 ---
+# Chinese Latent Diffusion Model
+我们开源了适配模型 `alibaba-pai/pai-diffusion-general-large-zh` 的 ControlNet。该 ControlNet 以输入图像的 Canny 边缘特征作为条件，实现可控的图像生成。
+* GitHub: [EasyNLP](https://github.com/alibaba/EasyNLP)
+```python
+from diffusers import StableDiffusionControlNetPipeline, ControlNetModel
+from PIL import Image
+import numpy as np
+import cv2
+def to_canny(image):
+    low_threshold = 100
+    high_threshold = 200
+    image = np.array(image)
+    image = cv2.Canny(image, low_threshold, high_threshold)
+    image = image[:, :, None]
+    image = np.concatenate([image, image, image], axis=2)
+    image = Image.fromarray(image)
+    return image
+controlnet_id = "alibaba-pai/pai-diffusion-general-large-zh-controlnet-canny"
+controlnet = ControlNetModel.from_pretrained(controlnet_id)
+model_id = "alibaba-pai/pai-diffusion-general-large-zh"
+pipe = StableDiffusionControlNetPipeline.from_pretrained(model_id, controlnet=controlnet)
+pipe = pipe.to("cuda")
+image = Image.open("bird.png")
+image_canny = to_canny(image)
+prompt = "白色羽毛的小鸟"
+image = pipe(prompt, image_canny).images[0]
+image.save("result.png")
+```

config.json ADDED Viewed

+{
+  "_class_name": "ControlNetModel",
+  "_diffusers_version": "0.15.0.dev0",
+  "act_fn": "silu",
+  "attention_head_dim": 8,
+  "block_out_channels": [
+    320,
+    640,
+    1280,
+    1280
+  ],
+  "class_embed_type": null,
+  "conditioning_embedding_out_channels": [
+    16,
+    32,
+    96,
+    256
+  ],
+  "controlnet_conditioning_channel_order": "rgb",
+  "cross_attention_dim": 768,
+  "down_block_types": [
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "DownBlock2D"
+  ],
+  "downsample_padding": 1,
+  "flip_sin_to_cos": true,
+  "freq_shift": 0,
+  "in_channels": 4,
+  "layers_per_block": 2,
+  "mid_block_scale_factor": 1,
+  "norm_eps": 1e-05,
+  "norm_num_groups": 32,
+  "num_class_embeds": null,
+  "only_cross_attention": false,
+  "projection_class_embeddings_input_dim": null,
+  "resnet_time_scale_shift": "default",
+  "upcast_attention": false,
+  "use_linear_projection": false
+}

diffusion_pytorch_model.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:1eaf3fbae4cdb6c2ab909c12c85b5aa695a7b58157903730ab0fa74b8a0142a7
+size 1445248857