add vae encoder component
Browse files- README.md +3 -2
- model_index.json +5 -1
- scheduler/scheduler_config.json +1 -1
- tokenizer/tokenizer_config.json +1 -1
- unet/openvino_model.xml +15 -15
- vae_encoder/openvino_model.bin +3 -0
- vae_encoder/openvino_model.xml +0 -0
README.md
CHANGED
@@ -3,8 +3,9 @@ license: apache-2.0
|
|
3 |
---
|
4 |
|
5 |
```python
|
6 |
-
from optimum.intel.openvino
|
7 |
|
8 |
-
|
|
|
9 |
```
|
10 |
|
|
|
3 |
---
|
4 |
|
5 |
```python
|
6 |
+
from optimum.intel.openvino import OVStableDiffusionPipeline
|
7 |
|
8 |
+
model_id = "hf-internal-testing/tiny-stable-diffusion-openvino"
|
9 |
+
pipe = OVStableDiffusionPipeline.from_pretrained(model_id)
|
10 |
```
|
11 |
|
model_index.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
"_class_name": "OVStableDiffusionPipeline",
|
3 |
-
"_diffusers_version": "0.
|
4 |
"feature_extractor": [
|
5 |
"transformers",
|
6 |
"CLIPFeatureExtractor"
|
@@ -28,5 +28,9 @@
|
|
28 |
"vae_decoder": [
|
29 |
"optimum",
|
30 |
"OVModelVaeDecoder"
|
|
|
|
|
|
|
|
|
31 |
]
|
32 |
}
|
|
|
1 |
{
|
2 |
"_class_name": "OVStableDiffusionPipeline",
|
3 |
+
"_diffusers_version": "0.14.0",
|
4 |
"feature_extractor": [
|
5 |
"transformers",
|
6 |
"CLIPFeatureExtractor"
|
|
|
28 |
"vae_decoder": [
|
29 |
"optimum",
|
30 |
"OVModelVaeDecoder"
|
31 |
+
],
|
32 |
+
"vae_encoder": [
|
33 |
+
"optimum",
|
34 |
+
"OVModelVaeEncoder"
|
35 |
]
|
36 |
}
|
scheduler/scheduler_config.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
"_class_name": "PNDMScheduler",
|
3 |
-
"_diffusers_version": "0.
|
4 |
"beta_end": 0.012,
|
5 |
"beta_schedule": "scaled_linear",
|
6 |
"beta_start": 0.00085,
|
|
|
1 |
{
|
2 |
"_class_name": "PNDMScheduler",
|
3 |
+
"_diffusers_version": "0.14.0",
|
4 |
"beta_end": 0.012,
|
5 |
"beta_schedule": "scaled_linear",
|
6 |
"beta_start": 0.00085,
|
tokenizer/tokenizer_config.json
CHANGED
@@ -19,7 +19,7 @@
|
|
19 |
},
|
20 |
"errors": "replace",
|
21 |
"model_max_length": 77,
|
22 |
-
"name_or_path": "/tmp/
|
23 |
"pad_token": "<|endoftext|>",
|
24 |
"special_tokens_map_file": "/home/lysandre/.cache/huggingface/transformers/18a566598f286c9139f88160c99f84eec492a26bd22738fa9cb44d5b7e0a5c76.cce1206abbad28826f000510f22f354e53e66a97f7c23745a7dfe27609cc07f5",
|
25 |
"tokenizer_class": "CLIPTokenizer",
|
|
|
19 |
},
|
20 |
"errors": "replace",
|
21 |
"model_max_length": 77,
|
22 |
+
"name_or_path": "/tmp/tmp6i7rva3d/tokenizer",
|
23 |
"pad_token": "<|endoftext|>",
|
24 |
"special_tokens_map_file": "/home/lysandre/.cache/huggingface/transformers/18a566598f286c9139f88160c99f84eec492a26bd22738fa9cb44d5b7e0a5c76.cce1206abbad28826f000510f22f354e53e66a97f7c23745a7dfe27609cc07f5",
|
25 |
"tokenizer_class": "CLIPTokenizer",
|
unet/openvino_model.xml
CHANGED
@@ -27,7 +27,7 @@
|
|
27 |
</output>
|
28 |
</layer>
|
29 |
<layer id="0" name="encoder_hidden_states" type="Parameter" version="opset1">
|
30 |
-
<data shape="?,77
|
31 |
<rt_info>
|
32 |
<attribute name="fused_names" version="0" value="encoder_hidden_states" />
|
33 |
</rt_info>
|
@@ -35,7 +35,7 @@
|
|
35 |
<port id="0" precision="FP32" names="encoder_hidden_states">
|
36 |
<dim>-1</dim>
|
37 |
<dim>77</dim>
|
38 |
-
<dim
|
39 |
</port>
|
40 |
</output>
|
41 |
</layer>
|
@@ -1436,7 +1436,7 @@
|
|
1436 |
</port>
|
1437 |
</output>
|
1438 |
</layer>
|
1439 |
-
<layer id="92" name="
|
1440 |
<data element_type="i64" shape="1" offset="58936" size="8" />
|
1441 |
<rt_info>
|
1442 |
<attribute name="fused_names" version="0" value="/Reshape" />
|
@@ -12418,7 +12418,7 @@
|
|
12418 |
<port id="0" precision="FP32">
|
12419 |
<dim>-1</dim>
|
12420 |
<dim>77</dim>
|
12421 |
-
<dim
|
12422 |
</port>
|
12423 |
<port id="1" precision="FP32">
|
12424 |
<dim>32</dim>
|
@@ -13418,7 +13418,7 @@
|
|
13418 |
<port id="0" precision="FP32">
|
13419 |
<dim>-1</dim>
|
13420 |
<dim>77</dim>
|
13421 |
-
<dim
|
13422 |
</port>
|
13423 |
<port id="1" precision="FP32">
|
13424 |
<dim>32</dim>
|
@@ -22714,7 +22714,7 @@
|
|
22714 |
<port id="0" precision="FP32">
|
22715 |
<dim>-1</dim>
|
22716 |
<dim>77</dim>
|
22717 |
-
<dim
|
22718 |
</port>
|
22719 |
<port id="1" precision="FP32">
|
22720 |
<dim>32</dim>
|
@@ -23714,7 +23714,7 @@
|
|
23714 |
<port id="0" precision="FP32">
|
23715 |
<dim>-1</dim>
|
23716 |
<dim>77</dim>
|
23717 |
-
<dim
|
23718 |
</port>
|
23719 |
<port id="1" precision="FP32">
|
23720 |
<dim>32</dim>
|
@@ -33010,7 +33010,7 @@
|
|
33010 |
<port id="0" precision="FP32">
|
33011 |
<dim>-1</dim>
|
33012 |
<dim>77</dim>
|
33013 |
-
<dim
|
33014 |
</port>
|
33015 |
<port id="1" precision="FP32">
|
33016 |
<dim>32</dim>
|
@@ -34010,7 +34010,7 @@
|
|
34010 |
<port id="0" precision="FP32">
|
34011 |
<dim>-1</dim>
|
34012 |
<dim>77</dim>
|
34013 |
-
<dim
|
34014 |
</port>
|
34015 |
<port id="1" precision="FP32">
|
34016 |
<dim>32</dim>
|
@@ -45425,7 +45425,7 @@
|
|
45425 |
<port id="0" precision="FP32">
|
45426 |
<dim>-1</dim>
|
45427 |
<dim>77</dim>
|
45428 |
-
<dim
|
45429 |
</port>
|
45430 |
<port id="1" precision="FP32">
|
45431 |
<dim>32</dim>
|
@@ -46425,7 +46425,7 @@
|
|
46425 |
<port id="0" precision="FP32">
|
46426 |
<dim>-1</dim>
|
46427 |
<dim>77</dim>
|
46428 |
-
<dim
|
46429 |
</port>
|
46430 |
<port id="1" precision="FP32">
|
46431 |
<dim>32</dim>
|
@@ -55980,7 +55980,7 @@
|
|
55980 |
<port id="0" precision="FP32">
|
55981 |
<dim>-1</dim>
|
55982 |
<dim>77</dim>
|
55983 |
-
<dim
|
55984 |
</port>
|
55985 |
<port id="1" precision="FP32">
|
55986 |
<dim>32</dim>
|
@@ -56980,7 +56980,7 @@
|
|
56980 |
<port id="0" precision="FP32">
|
56981 |
<dim>-1</dim>
|
56982 |
<dim>77</dim>
|
56983 |
-
<dim
|
56984 |
</port>
|
56985 |
<port id="1" precision="FP32">
|
56986 |
<dim>32</dim>
|
@@ -66561,7 +66561,7 @@
|
|
66561 |
<port id="0" precision="FP32">
|
66562 |
<dim>-1</dim>
|
66563 |
<dim>77</dim>
|
66564 |
-
<dim
|
66565 |
</port>
|
66566 |
<port id="1" precision="FP32">
|
66567 |
<dim>32</dim>
|
@@ -67561,7 +67561,7 @@
|
|
67561 |
<port id="0" precision="FP32">
|
67562 |
<dim>-1</dim>
|
67563 |
<dim>77</dim>
|
67564 |
-
<dim
|
67565 |
</port>
|
67566 |
<port id="1" precision="FP32">
|
67567 |
<dim>32</dim>
|
|
|
27 |
</output>
|
28 |
</layer>
|
29 |
<layer id="0" name="encoder_hidden_states" type="Parameter" version="opset1">
|
30 |
+
<data shape="?,77,32" element_type="f32" />
|
31 |
<rt_info>
|
32 |
<attribute name="fused_names" version="0" value="encoder_hidden_states" />
|
33 |
</rt_info>
|
|
|
35 |
<port id="0" precision="FP32" names="encoder_hidden_states">
|
36 |
<dim>-1</dim>
|
37 |
<dim>77</dim>
|
38 |
+
<dim>32</dim>
|
39 |
</port>
|
40 |
</output>
|
41 |
</layer>
|
|
|
1436 |
</port>
|
1437 |
</output>
|
1438 |
</layer>
|
1439 |
+
<layer id="92" name="Constant_274101" type="Const" version="opset1">
|
1440 |
<data element_type="i64" shape="1" offset="58936" size="8" />
|
1441 |
<rt_info>
|
1442 |
<attribute name="fused_names" version="0" value="/Reshape" />
|
|
|
12418 |
<port id="0" precision="FP32">
|
12419 |
<dim>-1</dim>
|
12420 |
<dim>77</dim>
|
12421 |
+
<dim>32</dim>
|
12422 |
</port>
|
12423 |
<port id="1" precision="FP32">
|
12424 |
<dim>32</dim>
|
|
|
13418 |
<port id="0" precision="FP32">
|
13419 |
<dim>-1</dim>
|
13420 |
<dim>77</dim>
|
13421 |
+
<dim>32</dim>
|
13422 |
</port>
|
13423 |
<port id="1" precision="FP32">
|
13424 |
<dim>32</dim>
|
|
|
22714 |
<port id="0" precision="FP32">
|
22715 |
<dim>-1</dim>
|
22716 |
<dim>77</dim>
|
22717 |
+
<dim>32</dim>
|
22718 |
</port>
|
22719 |
<port id="1" precision="FP32">
|
22720 |
<dim>32</dim>
|
|
|
23714 |
<port id="0" precision="FP32">
|
23715 |
<dim>-1</dim>
|
23716 |
<dim>77</dim>
|
23717 |
+
<dim>32</dim>
|
23718 |
</port>
|
23719 |
<port id="1" precision="FP32">
|
23720 |
<dim>32</dim>
|
|
|
33010 |
<port id="0" precision="FP32">
|
33011 |
<dim>-1</dim>
|
33012 |
<dim>77</dim>
|
33013 |
+
<dim>32</dim>
|
33014 |
</port>
|
33015 |
<port id="1" precision="FP32">
|
33016 |
<dim>32</dim>
|
|
|
34010 |
<port id="0" precision="FP32">
|
34011 |
<dim>-1</dim>
|
34012 |
<dim>77</dim>
|
34013 |
+
<dim>32</dim>
|
34014 |
</port>
|
34015 |
<port id="1" precision="FP32">
|
34016 |
<dim>32</dim>
|
|
|
45425 |
<port id="0" precision="FP32">
|
45426 |
<dim>-1</dim>
|
45427 |
<dim>77</dim>
|
45428 |
+
<dim>32</dim>
|
45429 |
</port>
|
45430 |
<port id="1" precision="FP32">
|
45431 |
<dim>32</dim>
|
|
|
46425 |
<port id="0" precision="FP32">
|
46426 |
<dim>-1</dim>
|
46427 |
<dim>77</dim>
|
46428 |
+
<dim>32</dim>
|
46429 |
</port>
|
46430 |
<port id="1" precision="FP32">
|
46431 |
<dim>32</dim>
|
|
|
55980 |
<port id="0" precision="FP32">
|
55981 |
<dim>-1</dim>
|
55982 |
<dim>77</dim>
|
55983 |
+
<dim>32</dim>
|
55984 |
</port>
|
55985 |
<port id="1" precision="FP32">
|
55986 |
<dim>32</dim>
|
|
|
56980 |
<port id="0" precision="FP32">
|
56981 |
<dim>-1</dim>
|
56982 |
<dim>77</dim>
|
56983 |
+
<dim>32</dim>
|
56984 |
</port>
|
56985 |
<port id="1" precision="FP32">
|
56986 |
<dim>32</dim>
|
|
|
66561 |
<port id="0" precision="FP32">
|
66562 |
<dim>-1</dim>
|
66563 |
<dim>77</dim>
|
66564 |
+
<dim>32</dim>
|
66565 |
</port>
|
66566 |
<port id="1" precision="FP32">
|
66567 |
<dim>32</dim>
|
|
|
67561 |
<port id="0" precision="FP32">
|
67562 |
<dim>-1</dim>
|
67563 |
<dim>77</dim>
|
67564 |
+
<dim>32</dim>
|
67565 |
</port>
|
67566 |
<port id="1" precision="FP32">
|
67567 |
<dim>32</dim>
|
vae_encoder/openvino_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:14509b2db28c5e75866ae3795e5e636db33ec5d47bdefa836f1bf97b5bfceba7
|
3 |
+
size 1021864
|
vae_encoder/openvino_model.xml
ADDED
The diff for this file is too large to render.
See raw diff
|
|