echarlaix HF Staff committed on
Commit
28c5fbe
·
1 Parent(s): 7bde0f7

add vae encoder component

Browse files
README.md CHANGED
@@ -3,8 +3,9 @@ license: apache-2.0
3
  ---
4
 
5
  ```python
6
- from optimum.intel.openvino.modeling_diffusion import OVStableDiffusionPipeline
7
 
8
- pipe = OVStableDiffusionPipeline.from_pretrained("hf-internal-testing/tiny-stable-diffusion-openvino")
 
9
  ```
10
 
 
3
  ---
4
 
5
  ```python
6
+ from optimum.intel.openvino import OVStableDiffusionPipeline
7
 
8
+ model_id = "hf-internal-testing/tiny-stable-diffusion-openvino"
9
+ pipe = OVStableDiffusionPipeline.from_pretrained(model_id)
10
  ```
11
 
model_index.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "_class_name": "OVStableDiffusionPipeline",
3
- "_diffusers_version": "0.13.1",
4
  "feature_extractor": [
5
  "transformers",
6
  "CLIPFeatureExtractor"
@@ -28,5 +28,9 @@
28
  "vae_decoder": [
29
  "optimum",
30
  "OVModelVaeDecoder"
 
 
 
 
31
  ]
32
  }
 
1
  {
2
  "_class_name": "OVStableDiffusionPipeline",
3
+ "_diffusers_version": "0.14.0",
4
  "feature_extractor": [
5
  "transformers",
6
  "CLIPFeatureExtractor"
 
28
  "vae_decoder": [
29
  "optimum",
30
  "OVModelVaeDecoder"
31
+ ],
32
+ "vae_encoder": [
33
+ "optimum",
34
+ "OVModelVaeEncoder"
35
  ]
36
  }
scheduler/scheduler_config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "_class_name": "PNDMScheduler",
3
- "_diffusers_version": "0.13.1",
4
  "beta_end": 0.012,
5
  "beta_schedule": "scaled_linear",
6
  "beta_start": 0.00085,
 
1
  {
2
  "_class_name": "PNDMScheduler",
3
+ "_diffusers_version": "0.14.0",
4
  "beta_end": 0.012,
5
  "beta_schedule": "scaled_linear",
6
  "beta_start": 0.00085,
tokenizer/tokenizer_config.json CHANGED
@@ -19,7 +19,7 @@
19
  },
20
  "errors": "replace",
21
  "model_max_length": 77,
22
- "name_or_path": "/tmp/tmp3si_ovlc/tokenizer",
23
  "pad_token": "<|endoftext|>",
24
  "special_tokens_map_file": "/home/lysandre/.cache/huggingface/transformers/18a566598f286c9139f88160c99f84eec492a26bd22738fa9cb44d5b7e0a5c76.cce1206abbad28826f000510f22f354e53e66a97f7c23745a7dfe27609cc07f5",
25
  "tokenizer_class": "CLIPTokenizer",
 
19
  },
20
  "errors": "replace",
21
  "model_max_length": 77,
22
+ "name_or_path": "/tmp/tmp6i7rva3d/tokenizer",
23
  "pad_token": "<|endoftext|>",
24
  "special_tokens_map_file": "/home/lysandre/.cache/huggingface/transformers/18a566598f286c9139f88160c99f84eec492a26bd22738fa9cb44d5b7e0a5c76.cce1206abbad28826f000510f22f354e53e66a97f7c23745a7dfe27609cc07f5",
25
  "tokenizer_class": "CLIPTokenizer",
unet/openvino_model.xml CHANGED
@@ -27,7 +27,7 @@
27
  </output>
28
  </layer>
29
  <layer id="0" name="encoder_hidden_states" type="Parameter" version="opset1">
30
- <data shape="?,77,?" element_type="f32" />
31
  <rt_info>
32
  <attribute name="fused_names" version="0" value="encoder_hidden_states" />
33
  </rt_info>
@@ -35,7 +35,7 @@
35
  <port id="0" precision="FP32" names="encoder_hidden_states">
36
  <dim>-1</dim>
37
  <dim>77</dim>
38
- <dim>-1</dim>
39
  </port>
40
  </output>
41
  </layer>
@@ -1436,7 +1436,7 @@
1436
  </port>
1437
  </output>
1438
  </layer>
1439
- <layer id="92" name="Constant_256350" type="Const" version="opset1">
1440
  <data element_type="i64" shape="1" offset="58936" size="8" />
1441
  <rt_info>
1442
  <attribute name="fused_names" version="0" value="/Reshape" />
@@ -12418,7 +12418,7 @@
12418
  <port id="0" precision="FP32">
12419
  <dim>-1</dim>
12420
  <dim>77</dim>
12421
- <dim>-1</dim>
12422
  </port>
12423
  <port id="1" precision="FP32">
12424
  <dim>32</dim>
@@ -13418,7 +13418,7 @@
13418
  <port id="0" precision="FP32">
13419
  <dim>-1</dim>
13420
  <dim>77</dim>
13421
- <dim>-1</dim>
13422
  </port>
13423
  <port id="1" precision="FP32">
13424
  <dim>32</dim>
@@ -22714,7 +22714,7 @@
22714
  <port id="0" precision="FP32">
22715
  <dim>-1</dim>
22716
  <dim>77</dim>
22717
- <dim>-1</dim>
22718
  </port>
22719
  <port id="1" precision="FP32">
22720
  <dim>32</dim>
@@ -23714,7 +23714,7 @@
23714
  <port id="0" precision="FP32">
23715
  <dim>-1</dim>
23716
  <dim>77</dim>
23717
- <dim>-1</dim>
23718
  </port>
23719
  <port id="1" precision="FP32">
23720
  <dim>32</dim>
@@ -33010,7 +33010,7 @@
33010
  <port id="0" precision="FP32">
33011
  <dim>-1</dim>
33012
  <dim>77</dim>
33013
- <dim>-1</dim>
33014
  </port>
33015
  <port id="1" precision="FP32">
33016
  <dim>32</dim>
@@ -34010,7 +34010,7 @@
34010
  <port id="0" precision="FP32">
34011
  <dim>-1</dim>
34012
  <dim>77</dim>
34013
- <dim>-1</dim>
34014
  </port>
34015
  <port id="1" precision="FP32">
34016
  <dim>32</dim>
@@ -45425,7 +45425,7 @@
45425
  <port id="0" precision="FP32">
45426
  <dim>-1</dim>
45427
  <dim>77</dim>
45428
- <dim>-1</dim>
45429
  </port>
45430
  <port id="1" precision="FP32">
45431
  <dim>32</dim>
@@ -46425,7 +46425,7 @@
46425
  <port id="0" precision="FP32">
46426
  <dim>-1</dim>
46427
  <dim>77</dim>
46428
- <dim>-1</dim>
46429
  </port>
46430
  <port id="1" precision="FP32">
46431
  <dim>32</dim>
@@ -55980,7 +55980,7 @@
55980
  <port id="0" precision="FP32">
55981
  <dim>-1</dim>
55982
  <dim>77</dim>
55983
- <dim>-1</dim>
55984
  </port>
55985
  <port id="1" precision="FP32">
55986
  <dim>32</dim>
@@ -56980,7 +56980,7 @@
56980
  <port id="0" precision="FP32">
56981
  <dim>-1</dim>
56982
  <dim>77</dim>
56983
- <dim>-1</dim>
56984
  </port>
56985
  <port id="1" precision="FP32">
56986
  <dim>32</dim>
@@ -66561,7 +66561,7 @@
66561
  <port id="0" precision="FP32">
66562
  <dim>-1</dim>
66563
  <dim>77</dim>
66564
- <dim>-1</dim>
66565
  </port>
66566
  <port id="1" precision="FP32">
66567
  <dim>32</dim>
@@ -67561,7 +67561,7 @@
67561
  <port id="0" precision="FP32">
67562
  <dim>-1</dim>
67563
  <dim>77</dim>
67564
- <dim>-1</dim>
67565
  </port>
67566
  <port id="1" precision="FP32">
67567
  <dim>32</dim>
 
27
  </output>
28
  </layer>
29
  <layer id="0" name="encoder_hidden_states" type="Parameter" version="opset1">
30
+ <data shape="?,77,32" element_type="f32" />
31
  <rt_info>
32
  <attribute name="fused_names" version="0" value="encoder_hidden_states" />
33
  </rt_info>
 
35
  <port id="0" precision="FP32" names="encoder_hidden_states">
36
  <dim>-1</dim>
37
  <dim>77</dim>
38
+ <dim>32</dim>
39
  </port>
40
  </output>
41
  </layer>
 
1436
  </port>
1437
  </output>
1438
  </layer>
1439
+ <layer id="92" name="Constant_274101" type="Const" version="opset1">
1440
  <data element_type="i64" shape="1" offset="58936" size="8" />
1441
  <rt_info>
1442
  <attribute name="fused_names" version="0" value="/Reshape" />
 
12418
  <port id="0" precision="FP32">
12419
  <dim>-1</dim>
12420
  <dim>77</dim>
12421
+ <dim>32</dim>
12422
  </port>
12423
  <port id="1" precision="FP32">
12424
  <dim>32</dim>
 
13418
  <port id="0" precision="FP32">
13419
  <dim>-1</dim>
13420
  <dim>77</dim>
13421
+ <dim>32</dim>
13422
  </port>
13423
  <port id="1" precision="FP32">
13424
  <dim>32</dim>
 
22714
  <port id="0" precision="FP32">
22715
  <dim>-1</dim>
22716
  <dim>77</dim>
22717
+ <dim>32</dim>
22718
  </port>
22719
  <port id="1" precision="FP32">
22720
  <dim>32</dim>
 
23714
  <port id="0" precision="FP32">
23715
  <dim>-1</dim>
23716
  <dim>77</dim>
23717
+ <dim>32</dim>
23718
  </port>
23719
  <port id="1" precision="FP32">
23720
  <dim>32</dim>
 
33010
  <port id="0" precision="FP32">
33011
  <dim>-1</dim>
33012
  <dim>77</dim>
33013
+ <dim>32</dim>
33014
  </port>
33015
  <port id="1" precision="FP32">
33016
  <dim>32</dim>
 
34010
  <port id="0" precision="FP32">
34011
  <dim>-1</dim>
34012
  <dim>77</dim>
34013
+ <dim>32</dim>
34014
  </port>
34015
  <port id="1" precision="FP32">
34016
  <dim>32</dim>
 
45425
  <port id="0" precision="FP32">
45426
  <dim>-1</dim>
45427
  <dim>77</dim>
45428
+ <dim>32</dim>
45429
  </port>
45430
  <port id="1" precision="FP32">
45431
  <dim>32</dim>
 
46425
  <port id="0" precision="FP32">
46426
  <dim>-1</dim>
46427
  <dim>77</dim>
46428
+ <dim>32</dim>
46429
  </port>
46430
  <port id="1" precision="FP32">
46431
  <dim>32</dim>
 
55980
  <port id="0" precision="FP32">
55981
  <dim>-1</dim>
55982
  <dim>77</dim>
55983
+ <dim>32</dim>
55984
  </port>
55985
  <port id="1" precision="FP32">
55986
  <dim>32</dim>
 
56980
  <port id="0" precision="FP32">
56981
  <dim>-1</dim>
56982
  <dim>77</dim>
56983
+ <dim>32</dim>
56984
  </port>
56985
  <port id="1" precision="FP32">
56986
  <dim>32</dim>
 
66561
  <port id="0" precision="FP32">
66562
  <dim>-1</dim>
66563
  <dim>77</dim>
66564
+ <dim>32</dim>
66565
  </port>
66566
  <port id="1" precision="FP32">
66567
  <dim>32</dim>
 
67561
  <port id="0" precision="FP32">
67562
  <dim>-1</dim>
67563
  <dim>77</dim>
67564
+ <dim>32</dim>
67565
  </port>
67566
  <port id="1" precision="FP32">
67567
  <dim>32</dim>
vae_encoder/openvino_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14509b2db28c5e75866ae3795e5e636db33ec5d47bdefa836f1bf97b5bfceba7
3
+ size 1021864
vae_encoder/openvino_model.xml ADDED
The diff for this file is too large to render. See raw diff