add vae encoder component
Browse files- README.md +3 -2
- model_index.json +5 -1
- scheduler/scheduler_config.json +1 -1
- tokenizer/tokenizer_config.json +1 -1
- unet/openvino_model.xml +15 -15
- vae_encoder/openvino_model.bin +3 -0
- vae_encoder/openvino_model.xml +0 -0
README.md
CHANGED
|
@@ -3,8 +3,9 @@ license: apache-2.0
|
|
| 3 |
---
|
| 4 |
|
| 5 |
```python
|
| 6 |
-
from optimum.intel.openvino
|
| 7 |
|
| 8 |
-
|
|
|
|
| 9 |
```
|
| 10 |
|
|
|
|
| 3 |
---
|
| 4 |
|
| 5 |
```python
|
| 6 |
+
from optimum.intel.openvino import OVStableDiffusionPipeline
|
| 7 |
|
| 8 |
+
model_id = "hf-internal-testing/tiny-stable-diffusion-openvino"
|
| 9 |
+
pipe = OVStableDiffusionPipeline.from_pretrained(model_id)
|
| 10 |
```
|
| 11 |
|
model_index.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"_class_name": "OVStableDiffusionPipeline",
|
| 3 |
-
"_diffusers_version": "0.
|
| 4 |
"feature_extractor": [
|
| 5 |
"transformers",
|
| 6 |
"CLIPFeatureExtractor"
|
|
@@ -28,5 +28,9 @@
|
|
| 28 |
"vae_decoder": [
|
| 29 |
"optimum",
|
| 30 |
"OVModelVaeDecoder"
|
|
|
|
|
|
|
|
|
|
|
|
|
| 31 |
]
|
| 32 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"_class_name": "OVStableDiffusionPipeline",
|
| 3 |
+
"_diffusers_version": "0.14.0",
|
| 4 |
"feature_extractor": [
|
| 5 |
"transformers",
|
| 6 |
"CLIPFeatureExtractor"
|
|
|
|
| 28 |
"vae_decoder": [
|
| 29 |
"optimum",
|
| 30 |
"OVModelVaeDecoder"
|
| 31 |
+
],
|
| 32 |
+
"vae_encoder": [
|
| 33 |
+
"optimum",
|
| 34 |
+
"OVModelVaeEncoder"
|
| 35 |
]
|
| 36 |
}
|
scheduler/scheduler_config.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"_class_name": "PNDMScheduler",
|
| 3 |
-
"_diffusers_version": "0.
|
| 4 |
"beta_end": 0.012,
|
| 5 |
"beta_schedule": "scaled_linear",
|
| 6 |
"beta_start": 0.00085,
|
|
|
|
| 1 |
{
|
| 2 |
"_class_name": "PNDMScheduler",
|
| 3 |
+
"_diffusers_version": "0.14.0",
|
| 4 |
"beta_end": 0.012,
|
| 5 |
"beta_schedule": "scaled_linear",
|
| 6 |
"beta_start": 0.00085,
|
tokenizer/tokenizer_config.json
CHANGED
|
@@ -19,7 +19,7 @@
|
|
| 19 |
},
|
| 20 |
"errors": "replace",
|
| 21 |
"model_max_length": 77,
|
| 22 |
-
"name_or_path": "/tmp/
|
| 23 |
"pad_token": "<|endoftext|>",
|
| 24 |
"special_tokens_map_file": "/home/lysandre/.cache/huggingface/transformers/18a566598f286c9139f88160c99f84eec492a26bd22738fa9cb44d5b7e0a5c76.cce1206abbad28826f000510f22f354e53e66a97f7c23745a7dfe27609cc07f5",
|
| 25 |
"tokenizer_class": "CLIPTokenizer",
|
|
|
|
| 19 |
},
|
| 20 |
"errors": "replace",
|
| 21 |
"model_max_length": 77,
|
| 22 |
+
"name_or_path": "/tmp/tmp6i7rva3d/tokenizer",
|
| 23 |
"pad_token": "<|endoftext|>",
|
| 24 |
"special_tokens_map_file": "/home/lysandre/.cache/huggingface/transformers/18a566598f286c9139f88160c99f84eec492a26bd22738fa9cb44d5b7e0a5c76.cce1206abbad28826f000510f22f354e53e66a97f7c23745a7dfe27609cc07f5",
|
| 25 |
"tokenizer_class": "CLIPTokenizer",
|
unet/openvino_model.xml
CHANGED
|
@@ -27,7 +27,7 @@
|
|
| 27 |
</output>
|
| 28 |
</layer>
|
| 29 |
<layer id="0" name="encoder_hidden_states" type="Parameter" version="opset1">
|
| 30 |
-
<data shape="?,77
|
| 31 |
<rt_info>
|
| 32 |
<attribute name="fused_names" version="0" value="encoder_hidden_states" />
|
| 33 |
</rt_info>
|
|
@@ -35,7 +35,7 @@
|
|
| 35 |
<port id="0" precision="FP32" names="encoder_hidden_states">
|
| 36 |
<dim>-1</dim>
|
| 37 |
<dim>77</dim>
|
| 38 |
-
<dim
|
| 39 |
</port>
|
| 40 |
</output>
|
| 41 |
</layer>
|
|
@@ -1436,7 +1436,7 @@
|
|
| 1436 |
</port>
|
| 1437 |
</output>
|
| 1438 |
</layer>
|
| 1439 |
-
<layer id="92" name="
|
| 1440 |
<data element_type="i64" shape="1" offset="58936" size="8" />
|
| 1441 |
<rt_info>
|
| 1442 |
<attribute name="fused_names" version="0" value="/Reshape" />
|
|
@@ -12418,7 +12418,7 @@
|
|
| 12418 |
<port id="0" precision="FP32">
|
| 12419 |
<dim>-1</dim>
|
| 12420 |
<dim>77</dim>
|
| 12421 |
-
<dim
|
| 12422 |
</port>
|
| 12423 |
<port id="1" precision="FP32">
|
| 12424 |
<dim>32</dim>
|
|
@@ -13418,7 +13418,7 @@
|
|
| 13418 |
<port id="0" precision="FP32">
|
| 13419 |
<dim>-1</dim>
|
| 13420 |
<dim>77</dim>
|
| 13421 |
-
<dim
|
| 13422 |
</port>
|
| 13423 |
<port id="1" precision="FP32">
|
| 13424 |
<dim>32</dim>
|
|
@@ -22714,7 +22714,7 @@
|
|
| 22714 |
<port id="0" precision="FP32">
|
| 22715 |
<dim>-1</dim>
|
| 22716 |
<dim>77</dim>
|
| 22717 |
-
<dim
|
| 22718 |
</port>
|
| 22719 |
<port id="1" precision="FP32">
|
| 22720 |
<dim>32</dim>
|
|
@@ -23714,7 +23714,7 @@
|
|
| 23714 |
<port id="0" precision="FP32">
|
| 23715 |
<dim>-1</dim>
|
| 23716 |
<dim>77</dim>
|
| 23717 |
-
<dim
|
| 23718 |
</port>
|
| 23719 |
<port id="1" precision="FP32">
|
| 23720 |
<dim>32</dim>
|
|
@@ -33010,7 +33010,7 @@
|
|
| 33010 |
<port id="0" precision="FP32">
|
| 33011 |
<dim>-1</dim>
|
| 33012 |
<dim>77</dim>
|
| 33013 |
-
<dim
|
| 33014 |
</port>
|
| 33015 |
<port id="1" precision="FP32">
|
| 33016 |
<dim>32</dim>
|
|
@@ -34010,7 +34010,7 @@
|
|
| 34010 |
<port id="0" precision="FP32">
|
| 34011 |
<dim>-1</dim>
|
| 34012 |
<dim>77</dim>
|
| 34013 |
-
<dim
|
| 34014 |
</port>
|
| 34015 |
<port id="1" precision="FP32">
|
| 34016 |
<dim>32</dim>
|
|
@@ -45425,7 +45425,7 @@
|
|
| 45425 |
<port id="0" precision="FP32">
|
| 45426 |
<dim>-1</dim>
|
| 45427 |
<dim>77</dim>
|
| 45428 |
-
<dim
|
| 45429 |
</port>
|
| 45430 |
<port id="1" precision="FP32">
|
| 45431 |
<dim>32</dim>
|
|
@@ -46425,7 +46425,7 @@
|
|
| 46425 |
<port id="0" precision="FP32">
|
| 46426 |
<dim>-1</dim>
|
| 46427 |
<dim>77</dim>
|
| 46428 |
-
<dim
|
| 46429 |
</port>
|
| 46430 |
<port id="1" precision="FP32">
|
| 46431 |
<dim>32</dim>
|
|
@@ -55980,7 +55980,7 @@
|
|
| 55980 |
<port id="0" precision="FP32">
|
| 55981 |
<dim>-1</dim>
|
| 55982 |
<dim>77</dim>
|
| 55983 |
-
<dim
|
| 55984 |
</port>
|
| 55985 |
<port id="1" precision="FP32">
|
| 55986 |
<dim>32</dim>
|
|
@@ -56980,7 +56980,7 @@
|
|
| 56980 |
<port id="0" precision="FP32">
|
| 56981 |
<dim>-1</dim>
|
| 56982 |
<dim>77</dim>
|
| 56983 |
-
<dim
|
| 56984 |
</port>
|
| 56985 |
<port id="1" precision="FP32">
|
| 56986 |
<dim>32</dim>
|
|
@@ -66561,7 +66561,7 @@
|
|
| 66561 |
<port id="0" precision="FP32">
|
| 66562 |
<dim>-1</dim>
|
| 66563 |
<dim>77</dim>
|
| 66564 |
-
<dim
|
| 66565 |
</port>
|
| 66566 |
<port id="1" precision="FP32">
|
| 66567 |
<dim>32</dim>
|
|
@@ -67561,7 +67561,7 @@
|
|
| 67561 |
<port id="0" precision="FP32">
|
| 67562 |
<dim>-1</dim>
|
| 67563 |
<dim>77</dim>
|
| 67564 |
-
<dim
|
| 67565 |
</port>
|
| 67566 |
<port id="1" precision="FP32">
|
| 67567 |
<dim>32</dim>
|
|
|
|
| 27 |
</output>
|
| 28 |
</layer>
|
| 29 |
<layer id="0" name="encoder_hidden_states" type="Parameter" version="opset1">
|
| 30 |
+
<data shape="?,77,32" element_type="f32" />
|
| 31 |
<rt_info>
|
| 32 |
<attribute name="fused_names" version="0" value="encoder_hidden_states" />
|
| 33 |
</rt_info>
|
|
|
|
| 35 |
<port id="0" precision="FP32" names="encoder_hidden_states">
|
| 36 |
<dim>-1</dim>
|
| 37 |
<dim>77</dim>
|
| 38 |
+
<dim>32</dim>
|
| 39 |
</port>
|
| 40 |
</output>
|
| 41 |
</layer>
|
|
|
|
| 1436 |
</port>
|
| 1437 |
</output>
|
| 1438 |
</layer>
|
| 1439 |
+
<layer id="92" name="Constant_274101" type="Const" version="opset1">
|
| 1440 |
<data element_type="i64" shape="1" offset="58936" size="8" />
|
| 1441 |
<rt_info>
|
| 1442 |
<attribute name="fused_names" version="0" value="/Reshape" />
|
|
|
|
| 12418 |
<port id="0" precision="FP32">
|
| 12419 |
<dim>-1</dim>
|
| 12420 |
<dim>77</dim>
|
| 12421 |
+
<dim>32</dim>
|
| 12422 |
</port>
|
| 12423 |
<port id="1" precision="FP32">
|
| 12424 |
<dim>32</dim>
|
|
|
|
| 13418 |
<port id="0" precision="FP32">
|
| 13419 |
<dim>-1</dim>
|
| 13420 |
<dim>77</dim>
|
| 13421 |
+
<dim>32</dim>
|
| 13422 |
</port>
|
| 13423 |
<port id="1" precision="FP32">
|
| 13424 |
<dim>32</dim>
|
|
|
|
| 22714 |
<port id="0" precision="FP32">
|
| 22715 |
<dim>-1</dim>
|
| 22716 |
<dim>77</dim>
|
| 22717 |
+
<dim>32</dim>
|
| 22718 |
</port>
|
| 22719 |
<port id="1" precision="FP32">
|
| 22720 |
<dim>32</dim>
|
|
|
|
| 23714 |
<port id="0" precision="FP32">
|
| 23715 |
<dim>-1</dim>
|
| 23716 |
<dim>77</dim>
|
| 23717 |
+
<dim>32</dim>
|
| 23718 |
</port>
|
| 23719 |
<port id="1" precision="FP32">
|
| 23720 |
<dim>32</dim>
|
|
|
|
| 33010 |
<port id="0" precision="FP32">
|
| 33011 |
<dim>-1</dim>
|
| 33012 |
<dim>77</dim>
|
| 33013 |
+
<dim>32</dim>
|
| 33014 |
</port>
|
| 33015 |
<port id="1" precision="FP32">
|
| 33016 |
<dim>32</dim>
|
|
|
|
| 34010 |
<port id="0" precision="FP32">
|
| 34011 |
<dim>-1</dim>
|
| 34012 |
<dim>77</dim>
|
| 34013 |
+
<dim>32</dim>
|
| 34014 |
</port>
|
| 34015 |
<port id="1" precision="FP32">
|
| 34016 |
<dim>32</dim>
|
|
|
|
| 45425 |
<port id="0" precision="FP32">
|
| 45426 |
<dim>-1</dim>
|
| 45427 |
<dim>77</dim>
|
| 45428 |
+
<dim>32</dim>
|
| 45429 |
</port>
|
| 45430 |
<port id="1" precision="FP32">
|
| 45431 |
<dim>32</dim>
|
|
|
|
| 46425 |
<port id="0" precision="FP32">
|
| 46426 |
<dim>-1</dim>
|
| 46427 |
<dim>77</dim>
|
| 46428 |
+
<dim>32</dim>
|
| 46429 |
</port>
|
| 46430 |
<port id="1" precision="FP32">
|
| 46431 |
<dim>32</dim>
|
|
|
|
| 55980 |
<port id="0" precision="FP32">
|
| 55981 |
<dim>-1</dim>
|
| 55982 |
<dim>77</dim>
|
| 55983 |
+
<dim>32</dim>
|
| 55984 |
</port>
|
| 55985 |
<port id="1" precision="FP32">
|
| 55986 |
<dim>32</dim>
|
|
|
|
| 56980 |
<port id="0" precision="FP32">
|
| 56981 |
<dim>-1</dim>
|
| 56982 |
<dim>77</dim>
|
| 56983 |
+
<dim>32</dim>
|
| 56984 |
</port>
|
| 56985 |
<port id="1" precision="FP32">
|
| 56986 |
<dim>32</dim>
|
|
|
|
| 66561 |
<port id="0" precision="FP32">
|
| 66562 |
<dim>-1</dim>
|
| 66563 |
<dim>77</dim>
|
| 66564 |
+
<dim>32</dim>
|
| 66565 |
</port>
|
| 66566 |
<port id="1" precision="FP32">
|
| 66567 |
<dim>32</dim>
|
|
|
|
| 67561 |
<port id="0" precision="FP32">
|
| 67562 |
<dim>-1</dim>
|
| 67563 |
<dim>77</dim>
|
| 67564 |
+
<dim>32</dim>
|
| 67565 |
</port>
|
| 67566 |
<port id="1" precision="FP32">
|
| 67567 |
<dim>32</dim>
|
vae_encoder/openvino_model.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:14509b2db28c5e75866ae3795e5e636db33ec5d47bdefa836f1bf97b5bfceba7
|
| 3 |
+
size 1021864
|
vae_encoder/openvino_model.xml
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|