Upload StableCascadeDecoderPipeline
Browse files
- decoder/config.json +15 -15
- decoder/diffusion_pytorch_model.safetensors +2 -2
- model_index.json +8 -12
- text_encoder/config.json +1 -1
- text_encoder/model.safetensors +1 -1
decoder/config.json
CHANGED
|
@@ -1,12 +1,12 @@
|
|
| 1 |
{
|
| 2 |
"_class_name": "StableCascadeUNet",
|
| 3 |
"_diffusers_version": "0.30.2",
|
| 4 |
-
"_name_or_path": "
|
| 5 |
"block_out_channels": [
|
| 6 |
320,
|
| 7 |
-
|
| 8 |
-
|
| 9 |
-
|
| 10 |
],
|
| 11 |
"block_types_per_layer": [
|
| 12 |
[
|
|
@@ -41,9 +41,9 @@
|
|
| 41 |
],
|
| 42 |
"down_num_layers_per_block": [
|
| 43 |
2,
|
| 44 |
-
|
| 45 |
-
|
| 46 |
-
|
| 47 |
],
|
| 48 |
"dropout": [
|
| 49 |
0,
|
|
@@ -56,9 +56,9 @@
|
|
| 56 |
"kernel_size": 3,
|
| 57 |
"num_attention_heads": [
|
| 58 |
0,
|
| 59 |
-
|
| 60 |
-
|
| 61 |
-
|
| 62 |
],
|
| 63 |
"out_channels": 4,
|
| 64 |
"patch_size": 2,
|
|
@@ -70,15 +70,15 @@
|
|
| 70 |
],
|
| 71 |
"timestep_ratio_embedding_dim": 64,
|
| 72 |
"up_blocks_repeat_mappers": [
|
| 73 |
-
|
| 74 |
-
|
| 75 |
2,
|
| 76 |
2
|
| 77 |
],
|
| 78 |
"up_num_layers_per_block": [
|
| 79 |
-
|
| 80 |
-
|
| 81 |
-
|
| 82 |
2
|
| 83 |
]
|
| 84 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"_class_name": "StableCascadeUNet",
|
| 3 |
"_diffusers_version": "0.30.2",
|
| 4 |
+
"_name_or_path": "stabilityai/stable-cascade",
|
| 5 |
"block_out_channels": [
|
| 6 |
320,
|
| 7 |
+
576,
|
| 8 |
+
1152,
|
| 9 |
+
1152
|
| 10 |
],
|
| 11 |
"block_types_per_layer": [
|
| 12 |
[
|
|
|
|
| 41 |
],
|
| 42 |
"down_num_layers_per_block": [
|
| 43 |
2,
|
| 44 |
+
4,
|
| 45 |
+
14,
|
| 46 |
+
4
|
| 47 |
],
|
| 48 |
"dropout": [
|
| 49 |
0,
|
|
|
|
| 56 |
"kernel_size": 3,
|
| 57 |
"num_attention_heads": [
|
| 58 |
0,
|
| 59 |
+
9,
|
| 60 |
+
18,
|
| 61 |
+
18
|
| 62 |
],
|
| 63 |
"out_channels": 4,
|
| 64 |
"patch_size": 2,
|
|
|
|
| 70 |
],
|
| 71 |
"timestep_ratio_embedding_dim": 64,
|
| 72 |
"up_blocks_repeat_mappers": [
|
| 73 |
+
2,
|
| 74 |
+
2,
|
| 75 |
2,
|
| 76 |
2
|
| 77 |
],
|
| 78 |
"up_num_layers_per_block": [
|
| 79 |
+
4,
|
| 80 |
+
14,
|
| 81 |
+
4,
|
| 82 |
2
|
| 83 |
]
|
| 84 |
}
|
decoder/diffusion_pytorch_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7dcb3fc8b1e3f2a1756503472043a7d6810003a418b60b08674633b20b452ffb
|
| 3 |
+
size 2797989648
|
model_index.json
CHANGED
|
@@ -1,20 +1,12 @@
|
|
| 1 |
{
|
| 2 |
-
"_class_name": "
|
| 3 |
"_diffusers_version": "0.30.2",
|
| 4 |
-
"_name_or_path": "stabilityai/stable-cascade
|
| 5 |
-
"
|
| 6 |
-
"transformers",
|
| 7 |
-
"CLIPImageProcessor"
|
| 8 |
-
],
|
| 9 |
-
"image_encoder": [
|
| 10 |
-
"transformers",
|
| 11 |
-
"CLIPVisionModelWithProjection"
|
| 12 |
-
],
|
| 13 |
-
"prior": [
|
| 14 |
"diffusers",
|
| 15 |
"StableCascadeUNet"
|
| 16 |
],
|
| 17 |
-
"
|
| 18 |
"scheduler": [
|
| 19 |
"diffusers",
|
| 20 |
"DDPMWuerstchenScheduler"
|
|
@@ -26,5 +18,9 @@
|
|
| 26 |
"tokenizer": [
|
| 27 |
"transformers",
|
| 28 |
"CLIPTokenizerFast"
|
|
|
|
|
|
|
|
|
|
|
|
|
| 29 |
]
|
| 30 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"_class_name": "StableCascadeDecoderPipeline",
|
| 3 |
"_diffusers_version": "0.30.2",
|
| 4 |
+
"_name_or_path": "stabilityai/stable-cascade",
|
| 5 |
+
"decoder": [
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 6 |
"diffusers",
|
| 7 |
"StableCascadeUNet"
|
| 8 |
],
|
| 9 |
+
"latent_dim_scale": 10.67,
|
| 10 |
"scheduler": [
|
| 11 |
"diffusers",
|
| 12 |
"DDPMWuerstchenScheduler"
|
|
|
|
| 18 |
"tokenizer": [
|
| 19 |
"transformers",
|
| 20 |
"CLIPTokenizerFast"
|
| 21 |
+
],
|
| 22 |
+
"vqgan": [
|
| 23 |
+
"wuerstchen",
|
| 24 |
+
"PaellaVQModel"
|
| 25 |
]
|
| 26 |
}
|
text_encoder/config.json
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
{
|
| 2 |
-
"_name_or_path": "/root/.cache/huggingface/hub/models--stabilityai--stable-cascade
|
| 3 |
"architectures": [
|
| 4 |
"CLIPTextModelWithProjection"
|
| 5 |
],
|
|
|
|
| 1 |
{
|
| 2 |
+
"_name_or_path": "/root/.cache/huggingface/hub/models--stabilityai--stable-cascade/snapshots/a89f66d459ae653e3b4d4f992a7c3789d0dc4d16/text_encoder",
|
| 3 |
"architectures": [
|
| 4 |
"CLIPTextModelWithProjection"
|
| 5 |
],
|
text_encoder/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2778702264
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:30e7a50f59884f068ac6bdc41b0ade553f23c0cbe2eaf3bac76369d2c39bfa37
|
| 3 |
size 2778702264
|