bconsolvo committed on
Commit
8fadf70
·
2 Parent(s): 37bb883, 75bb598

Merge branch '1.7.1'

Browse files
Files changed (29) hide show
  1. .gitattributes +5 -0
  2. scheduler/scheduler_config.json +4 -3
  3. text_encoder/config.json +25 -25
  4. text_encoder/text_encoder_fp16.onnx +3 -0
  5. text_encoder_2/config.json +25 -25
  6. text_encoder_2/model.fp16.safetensors +3 -0
  7. text_encoder_2/text_encoder_2_fp16.onnx +3 -0
  8. text_encoder_2/text_encoder_2_fp16.onnx.data +3 -0
  9. unet/config.json +72 -72
  10. unet/dd/cache/NhwcConv_0-unetconv_inConv_meta.json +0 -0
  11. unet/dd/dd_metastate_SD15_Unet_NhwcConv_0-unetconv_inConv.ctrlpkt +2 -2
  12. unet/dd/dd_metastate_SD15_Unet_NhwcConv_0-unetconv_inConv.state +2 -2
  13. unet/dd/dd_metastate_SD15_Unet_NhwcConv_0-unetconv_inConv.super +2 -2
  14. unet/dd/onnx_report.txt +10 -10
  15. unet/dd/replaced.onnx +2 -2
  16. vae_decoder/dd/cache/NhwcConv_0-post_quant_convConv_meta.json +0 -0
  17. vae_decoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-post_quant_convConv.ctrlpkt +2 -2
  18. vae_decoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-post_quant_convConv.state +2 -2
  19. vae_decoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-post_quant_convConv.super +2 -2
  20. vae_decoder/dd/onnx_report.txt +3 -3
  21. vae_decoder/dd/replaced.onnx +2 -2
  22. vae_encoder/config.json +31 -0
  23. vae_encoder/dd/cache/NhwcConv_0-encoderconv_inConv_meta.json +0 -0
  24. vae_encoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-encoderconv_inConv.ctrlpkt +3 -0
  25. vae_encoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-encoderconv_inConv.fconst +3 -0
  26. vae_encoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-encoderconv_inConv.state +3 -0
  27. vae_encoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-encoderconv_inConv.super +3 -0
  28. vae_encoder/dd/onnx_report.txt +42 -0
  29. vae_encoder/dd/replaced.onnx +3 -0
.gitattributes CHANGED
@@ -41,3 +41,8 @@ vae_decoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-post_quant_convConv.ctrlpkt
41
  vae_decoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-post_quant_convConv.fconst filter=lfs diff=lfs merge=lfs -text
42
  vae_decoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-post_quant_convConv.state filter=lfs diff=lfs merge=lfs -text
43
  vae_decoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-post_quant_convConv.super filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
41
  vae_decoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-post_quant_convConv.fconst filter=lfs diff=lfs merge=lfs -text
42
  vae_decoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-post_quant_convConv.state filter=lfs diff=lfs merge=lfs -text
43
  vae_decoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-post_quant_convConv.super filter=lfs diff=lfs merge=lfs -text
44
+ *.onnx.data filter=lfs diff=lfs merge=lfs -text
45
+ vae_encoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-encoderconv_inConv.ctrlpkt filter=lfs diff=lfs merge=lfs -text
46
+ vae_encoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-encoderconv_inConv.fconst filter=lfs diff=lfs merge=lfs -text
47
+ vae_encoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-encoderconv_inConv.state filter=lfs diff=lfs merge=lfs -text
48
+ vae_encoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-encoderconv_inConv.super filter=lfs diff=lfs merge=lfs -text
scheduler/scheduler_config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_class_name": "EulerAncestralDiscreteScheduler",
3
  "_diffusers_version": "0.24.0.dev0",
4
  "beta_end": 0.012,
5
  "beta_schedule": "scaled_linear",
@@ -12,6 +12,7 @@
12
  "set_alpha_to_one": false,
13
  "skip_prk_steps": true,
14
  "steps_offset": 1,
15
- "timestep_spacing": "trailing",
16
- "trained_betas": null
 
17
  }
 
1
  {
2
+ "_class_name": "EulerDiscreteScheduler",
3
  "_diffusers_version": "0.24.0.dev0",
4
  "beta_end": 0.012,
5
  "beta_schedule": "scaled_linear",
 
12
  "set_alpha_to_one": false,
13
  "skip_prk_steps": true,
14
  "steps_offset": 1,
15
+ "timestep_spacing": "leading",
16
+ "trained_betas": null,
17
+ "use_karras_sigmas": false
18
  }
text_encoder/config.json CHANGED
@@ -1,25 +1,25 @@
1
- {
2
- "_name_or_path": "SSD-Tiny/text_encoder",
3
- "architectures": [
4
- "CLIPTextModel"
5
- ],
6
- "attention_dropout": 0.0,
7
- "bos_token_id": 0,
8
- "dropout": 0.0,
9
- "eos_token_id": 2,
10
- "hidden_act": "quick_gelu",
11
- "hidden_size": 768,
12
- "initializer_factor": 1.0,
13
- "initializer_range": 0.02,
14
- "intermediate_size": 3072,
15
- "layer_norm_eps": 1e-05,
16
- "max_position_embeddings": 77,
17
- "model_type": "clip_text_model",
18
- "num_attention_heads": 12,
19
- "num_hidden_layers": 12,
20
- "pad_token_id": 1,
21
- "projection_dim": 768,
22
- "torch_dtype": "float16",
23
- "transformers_version": "4.35.2",
24
- "vocab_size": 49408
25
- }
 
1
+ {
2
+ "_name_or_path": "SSD-Tiny/text_encoder",
3
+ "architectures": [
4
+ "CLIPTextModel"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 0,
8
+ "dropout": 0.0,
9
+ "eos_token_id": 2,
10
+ "hidden_act": "quick_gelu",
11
+ "hidden_size": 768,
12
+ "initializer_factor": 1.0,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 3072,
15
+ "layer_norm_eps": 1e-05,
16
+ "max_position_embeddings": 77,
17
+ "model_type": "clip_text_model",
18
+ "num_attention_heads": 12,
19
+ "num_hidden_layers": 12,
20
+ "pad_token_id": 1,
21
+ "projection_dim": 768,
22
+ "torch_dtype": "float16",
23
+ "transformers_version": "4.35.2",
24
+ "vocab_size": 49408
25
+ }
text_encoder/text_encoder_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2db887fa686e054d3594fbbe0bef482ec0714e7a57028f887e5c84ed54f956f
3
+ size 246387418
text_encoder_2/config.json CHANGED
@@ -1,25 +1,25 @@
1
- {
2
- "_name_or_path": "SSD-Tiny/text_encoder_2",
3
- "architectures": [
4
- "CLIPTextModelWithProjection"
5
- ],
6
- "attention_dropout": 0.0,
7
- "bos_token_id": 0,
8
- "dropout": 0.0,
9
- "eos_token_id": 2,
10
- "hidden_act": "gelu",
11
- "hidden_size": 1280,
12
- "initializer_factor": 1.0,
13
- "initializer_range": 0.02,
14
- "intermediate_size": 5120,
15
- "layer_norm_eps": 1e-05,
16
- "max_position_embeddings": 77,
17
- "model_type": "clip_text_model",
18
- "num_attention_heads": 20,
19
- "num_hidden_layers": 32,
20
- "pad_token_id": 1,
21
- "projection_dim": 1280,
22
- "torch_dtype": "float16",
23
- "transformers_version": "4.35.2",
24
- "vocab_size": 49408
25
- }
 
1
+ {
2
+ "_name_or_path": "SSD-Tiny/text_encoder_2",
3
+ "architectures": [
4
+ "CLIPTextModelWithProjection"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 0,
8
+ "dropout": 0.0,
9
+ "eos_token_id": 2,
10
+ "hidden_act": "gelu",
11
+ "hidden_size": 1280,
12
+ "initializer_factor": 1.0,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 5120,
15
+ "layer_norm_eps": 1e-05,
16
+ "max_position_embeddings": 77,
17
+ "model_type": "clip_text_model",
18
+ "num_attention_heads": 20,
19
+ "num_hidden_layers": 32,
20
+ "pad_token_id": 1,
21
+ "projection_dim": 1280,
22
+ "torch_dtype": "float16",
23
+ "transformers_version": "4.35.2",
24
+ "vocab_size": 49408
25
+ }
text_encoder_2/model.fp16.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b98e4a57a9292eeb819d67e2d2100f66f17db723cde4ecea27a7c3741160d0c
3
+ size 1389382176
text_encoder_2/text_encoder_2_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b38bebdcc0915847f3fffdd5cf87810284c254e5ea7d767f601ad47a30968365
3
+ size 756674
text_encoder_2/text_encoder_2_fp16.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aff1824430cc7d549adfb7f763cfbc6393495e35dcf8269004a9dd208d9ce22c
3
+ size 1389319680
unet/config.json CHANGED
@@ -1,72 +1,72 @@
1
- {
2
- "_class_name": "UNet2DConditionModel",
3
- "_diffusers_version": "0.24.0",
4
- "act_fn": "silu",
5
- "addition_embed_type": "text_time",
6
- "addition_embed_type_num_heads": 64,
7
- "addition_time_embed_dim": 256,
8
- "attention_head_dim": [
9
- 5,
10
- 10,
11
- 20
12
- ],
13
- "attention_type": "default",
14
- "block_out_channels": [
15
- 320,
16
- 640,
17
- 1280
18
- ],
19
- "center_input_sample": false,
20
- "class_embed_type": null,
21
- "class_embeddings_concat": false,
22
- "conv_in_kernel": 3,
23
- "conv_out_kernel": 3,
24
- "cross_attention_dim": 2048,
25
- "cross_attention_norm": null,
26
- "down_block_types": [
27
- "DownBlock2D",
28
- "CrossAttnDownBlock2D",
29
- "CrossAttnDownBlock2D"
30
- ],
31
- "downsample_padding": 1,
32
- "dropout": 0.0,
33
- "dual_cross_attention": false,
34
- "encoder_hid_dim": null,
35
- "encoder_hid_dim_type": null,
36
- "flip_sin_to_cos": true,
37
- "freq_shift": 0,
38
- "in_channels": 4,
39
- "layers_per_block": 2,
40
- "mid_block_only_cross_attention": null,
41
- "mid_block_scale_factor": 1,
42
- "mid_block_type": "UNetMidBlock2D",
43
- "norm_eps": 1e-05,
44
- "norm_num_groups": 32,
45
- "num_attention_heads": null,
46
- "num_class_embeds": null,
47
- "only_cross_attention": false,
48
- "out_channels": 4,
49
- "projection_class_embeddings_input_dim": 2816,
50
- "resnet_out_scale_factor": 1.0,
51
- "resnet_skip_time_act": false,
52
- "resnet_time_scale_shift": "default",
53
- "reverse_transformer_layers_per_block": null,
54
- "sample_size": 128,
55
- "time_cond_proj_dim": null,
56
- "time_embedding_act_fn": null,
57
- "time_embedding_dim": null,
58
- "time_embedding_type": "positional",
59
- "timestep_post_act": null,
60
- "transformer_layers_per_block": [
61
- 1,
62
- 1,
63
- 2
64
- ],
65
- "up_block_types": [
66
- "CrossAttnUpBlock2D",
67
- "CrossAttnUpBlock2D",
68
- "UpBlock2D"
69
- ],
70
- "upcast_attention": null,
71
- "use_linear_projection": true
72
- }
 
1
+ {
2
+ "_class_name": "UNet2DConditionModel",
3
+ "_diffusers_version": "0.24.0",
4
+ "act_fn": "silu",
5
+ "addition_embed_type": "text_time",
6
+ "addition_embed_type_num_heads": 64,
7
+ "addition_time_embed_dim": 256,
8
+ "attention_head_dim": [
9
+ 5,
10
+ 10,
11
+ 20
12
+ ],
13
+ "attention_type": "default",
14
+ "block_out_channels": [
15
+ 320,
16
+ 640,
17
+ 1280
18
+ ],
19
+ "center_input_sample": false,
20
+ "class_embed_type": null,
21
+ "class_embeddings_concat": false,
22
+ "conv_in_kernel": 3,
23
+ "conv_out_kernel": 3,
24
+ "cross_attention_dim": 2048,
25
+ "cross_attention_norm": null,
26
+ "down_block_types": [
27
+ "DownBlock2D",
28
+ "CrossAttnDownBlock2D",
29
+ "CrossAttnDownBlock2D"
30
+ ],
31
+ "downsample_padding": 1,
32
+ "dropout": 0.0,
33
+ "dual_cross_attention": false,
34
+ "encoder_hid_dim": null,
35
+ "encoder_hid_dim_type": null,
36
+ "flip_sin_to_cos": true,
37
+ "freq_shift": 0,
38
+ "in_channels": 4,
39
+ "layers_per_block": 2,
40
+ "mid_block_only_cross_attention": null,
41
+ "mid_block_scale_factor": 1,
42
+ "mid_block_type": "UNetMidBlock2D",
43
+ "norm_eps": 1e-05,
44
+ "norm_num_groups": 32,
45
+ "num_attention_heads": null,
46
+ "num_class_embeds": null,
47
+ "only_cross_attention": false,
48
+ "out_channels": 4,
49
+ "projection_class_embeddings_input_dim": 2816,
50
+ "resnet_out_scale_factor": 1.0,
51
+ "resnet_skip_time_act": false,
52
+ "resnet_time_scale_shift": "default",
53
+ "reverse_transformer_layers_per_block": null,
54
+ "sample_size": 128,
55
+ "time_cond_proj_dim": null,
56
+ "time_embedding_act_fn": null,
57
+ "time_embedding_dim": null,
58
+ "time_embedding_type": "positional",
59
+ "timestep_post_act": null,
60
+ "transformer_layers_per_block": [
61
+ 1,
62
+ 1,
63
+ 2
64
+ ],
65
+ "up_block_types": [
66
+ "CrossAttnUpBlock2D",
67
+ "CrossAttnUpBlock2D",
68
+ "UpBlock2D"
69
+ ],
70
+ "upcast_attention": null,
71
+ "use_linear_projection": true
72
+ }
unet/dd/cache/NhwcConv_0-unetconv_inConv_meta.json CHANGED
The diff for this file is too large to render. See raw diff
 
unet/dd/dd_metastate_SD15_Unet_NhwcConv_0-unetconv_inConv.ctrlpkt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:defdd9d30fb97bec3ec22a68b6e615cb5a94963f257ec9dfc7bba8b733fbcbe7
3
- size 57028248
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a89a54f1e044a2058ff2cea15e8dc127d89f29327c12da6b8d0116729d59d82
3
+ size 64468764
unet/dd/dd_metastate_SD15_Unet_NhwcConv_0-unetconv_inConv.state CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b795c4f96011509da333bd05557f2c5a41bb993dd8820efcd12020288c0863a8
3
- size 15840065
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12468b4d14df11a58ccaee3f9a603aa4015a116f467cac82befaac691e9407f0
3
+ size 10841842
unet/dd/dd_metastate_SD15_Unet_NhwcConv_0-unetconv_inConv.super CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1248c187b5b209a54a2555d999a0a774ce336d9a22fb136550232f079df36dc9
3
- size 1046920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8790f62735e5711f8bf8bb786e13c4d804890de070e5263ec7d9d9421795aa9
3
+ size 1242152
unet/dd/onnx_report.txt CHANGED
@@ -52,22 +52,22 @@
52
  +-------------------+-----------------+-------------------+-------------------+
53
  | Offloaded sum | 1 | | |
54
  +-------------------+-----------------+-------------------+-------------------+
55
- | Offloaded Op | SDConv_bfp | | |
56
- | Types | SDAdd_bfp | | |
57
- | | SDGemm_bfp | | |
58
- | | SDCastBf2Bfp | | |
 
59
  | | SDLayerNorm_bfp | | |
 
 
 
 
60
  | | SDConcat_bfp | | |
61
  | | SDCastBfp2Bf | | |
62
- | | SDFlatMHA | | |
63
  | | SDSilu | | |
64
- | | SDMHA_bfp | | |
65
- | | SDConv | | |
66
- | | SDGemm | | |
67
- | | SDMul_bfp | | |
68
- | | SDAdd | | |
69
  | | SDGroupNorm_bfp | | |
70
  | | SDResize_bfp | | |
 
71
  +-------------------+-----------------+-------------------+-------------------+
72
  | Offloaded sum (dd | 521 | | |
73
  | fusion) | | | |
 
52
  +-------------------+-----------------+-------------------+-------------------+
53
  | Offloaded sum | 1 | | |
54
  +-------------------+-----------------+-------------------+-------------------+
55
+ | Offloaded Op | SDGemm_bfp | | |
56
+ | Types | SDCastBf2Bfp | | |
57
+ | | SDAdd_bfp | | |
58
+ | | SDConv | | |
59
+ | | SDFlatMHA | | |
60
  | | SDLayerNorm_bfp | | |
61
+ | | SDConv_bfp | | |
62
+ | | SDMul_bfp | | |
63
+ | | SDMHA_bfp | | |
64
+ | | SDAdd | | |
65
  | | SDConcat_bfp | | |
66
  | | SDCastBfp2Bf | | |
 
67
  | | SDSilu | | |
 
 
 
 
 
68
  | | SDGroupNorm_bfp | | |
69
  | | SDResize_bfp | | |
70
+ | | SDGemm | | |
71
  +-------------------+-----------------+-------------------+-------------------+
72
  | Offloaded sum (dd | 521 | | |
73
  | fusion) | | | |
unet/dd/replaced.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d41ef0893404115729f086891bcc236a3ad6310e51ae4ad15054e7ad9fbb5251
3
- size 536412
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8328611e5a7c7fed2370616ff2e530c1b0c2a7fc52d3026171412c2d26bf898
3
+ size 533385
vae_decoder/dd/cache/NhwcConv_0-post_quant_convConv_meta.json CHANGED
The diff for this file is too large to render. See raw diff
 
vae_decoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-post_quant_convConv.ctrlpkt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4650279f5948218b061bac546f1fea0a9353f2eb1dbf3cd14e3735c005266b2a
3
- size 77767176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b4d0b28e77cf288a764895a37600e19ceb034b48e8016e36465b34bbc87b995
3
+ size 58489488
vae_decoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-post_quant_convConv.state CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:055e9a0cfb9a62a94cb637b10f1f1c32bb82318de0d50b73ef5ed4ef5092104d
3
- size 22813448
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ef6347815ce5d44e3f7de34054dbd40a0c9c77675bcbbf476e30f9dc3839d56
3
+ size 13659638
vae_decoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-post_quant_convConv.super CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:10334e04fe3040fe12d4b37e1f6d0c08f7ebf5d0ab4e7e5acc8589bc82c0d57a
3
- size 785568
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:230fe28efa807448cf48c4d03c05becc580249daabc6b2a7120f35cdbcca2414
3
+ size 772640
vae_decoder/dd/onnx_report.txt CHANGED
@@ -21,11 +21,11 @@
21
  +--------------------+-------------+--------------------+---------------------+
22
  | Offloaded sum | 1 | | |
23
  +--------------------+-------------+--------------------+---------------------+
24
- | Offloaded Op Types | SDConv | | |
 
25
  | | SDMHA_VAE | | |
 
26
  | | SDGroupNorm | | |
27
- | | SDGemm | | |
28
- | | SDAdd | | |
29
  | | SDResize | | |
30
  +--------------------+-------------+--------------------+---------------------+
31
  | Offloaded sum (dd | 89 | | |
 
21
  +--------------------+-------------+--------------------+---------------------+
22
  | Offloaded sum | 1 | | |
23
  +--------------------+-------------+--------------------+---------------------+
24
+ | Offloaded Op Types | SDAdd | | |
25
+ | | SDGemm | | |
26
  | | SDMHA_VAE | | |
27
+ | | SDConv | | |
28
  | | SDGroupNorm | | |
 
 
29
  | | SDResize | | |
30
  +--------------------+-------------+--------------------+---------------------+
31
  | Offloaded sum (dd | 89 | | |
vae_decoder/dd/replaced.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1cb7ac8e40339c0fcb1db9c07a96ad4e8a38258f92b90f24e0cf087773ecabf0
3
- size 46098
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7fc5cb253512e74931adbf6a77fe277a44065e61acf7f49aed975b0c15acc2c
3
+ size 45974
vae_encoder/config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "AutoencoderKL",
3
+ "_diffusers_version": "0.24.0.dev0",
4
+ "act_fn": "silu",
5
+ "block_out_channels": [
6
+ 128,
7
+ 256,
8
+ 512,
9
+ 512
10
+ ],
11
+ "down_block_types": [
12
+ "DownEncoderBlock2D",
13
+ "DownEncoderBlock2D",
14
+ "DownEncoderBlock2D",
15
+ "DownEncoderBlock2D"
16
+ ],
17
+ "force_upcast": true,
18
+ "in_channels": 3,
19
+ "latent_channels": 4,
20
+ "layers_per_block": 2,
21
+ "norm_num_groups": 32,
22
+ "out_channels": 3,
23
+ "sample_size": 1024,
24
+ "scaling_factor": 0.13025,
25
+ "up_block_types": [
26
+ "UpDecoderBlock2D",
27
+ "UpDecoderBlock2D",
28
+ "UpDecoderBlock2D",
29
+ "UpDecoderBlock2D"
30
+ ]
31
+ }
vae_encoder/dd/cache/NhwcConv_0-encoderconv_inConv_meta.json ADDED
The diff for this file is too large to render. See raw diff
 
vae_encoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-encoderconv_inConv.ctrlpkt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e1a5c24f90e1502dbfc5f79348dcb2f618bb1cb0bf9b6b88ceec2bcbd8d0241
3
+ size 29858688
vae_encoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-encoderconv_inConv.fconst ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39f4c3ac20324cc894cc5333ee3b21209bc92cfbb7cfd26ec7964e5f94330767
3
+ size 42147856
vae_encoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-encoderconv_inConv.state ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbb30ef89acf22555554aaee0a8a8b1fd7c08fc8618b3f64c11b791bfa172207
3
+ size 6466405
vae_encoder/dd/dd_metastate_Sd15_Decoder_NhwcConv_0-encoderconv_inConv.super ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:230fe28efa807448cf48c4d03c05becc580249daabc6b2a7120f35cdbcca2414
3
+ size 772640
vae_encoder/dd/onnx_report.txt ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ DynamicDispatch Offload - not offloaded
2
+ +-------------------+-------+------------------------+------------------------+
3
+ | Op Type | Count | Inputs | Outputs |
4
+ +===================+=======+========================+========================+
5
+ | CastAvx | 1 | [1,1024,1024,4] - | [1,1024,1024,4] - |
6
+ | | | FLOAT | BFLOAT16 |
7
+ | CastAvx | 1 | [1,128,128,8] - | [1,128,128,8] - FLOAT |
8
+ | | | BFLOAT16 | |
9
+ | Pad | 1 | [1,3,1024,1024] - | [1,4,1024,1024] - |
10
+ | | | FLOAT | FLOAT |
11
+ | | | [8] - INT64 | |
12
+ | | | [1] - FLOAT | |
13
+ | Slice | 1 | [1,8,128,128] - FLOAT | [1,4,128,128] - FLOAT |
14
+ | | | [1] - INT64 | |
15
+ | | | [1] - INT64 | |
16
+ | | | [1] - INT64 | |
17
+ | Transpose | 1 | [1,4,1024,1024] - | [1,1024,1024,4] - |
18
+ | | | FLOAT | FLOAT |
19
+ | Transpose | 1 | [1,128,128,8] - FLOAT | [1,8,128,128] - FLOAT |
20
+ +-------------------+-------+------------------------+------------------------+
21
+ | Not offloaded sum | 6 | | |
22
+ +-------------------+-------+------------------------+------------------------+
23
+ DynamicDispatch Offload - offloaded
24
+ +--------------------+-------------+--------------------+---------------------+
25
+ | Op Type | Count | Inputs | Outputs |
26
+ +====================+=============+====================+=====================+
27
+ | DynamicDispatch | 1 | [1,1024,1024,4] - | [1,128,128,8] - |
28
+ | | | BFLOAT16 | BFLOAT16 |
29
+ +--------------------+-------------+--------------------+---------------------+
30
+ | Offloaded sum | 1 | | |
31
+ +--------------------+-------------+--------------------+---------------------+
32
+ | Offloaded Op Types | SDAdd | | |
33
+ | | SDMHA_VAE | | |
34
+ | | SDConv | | |
35
+ | | SDGroupNorm | | |
36
+ | | SDGemm | | |
37
+ +--------------------+-------------+--------------------+---------------------+
38
+ | Offloaded sum (dd | 66 | | |
39
+ | fusion) | | | |
40
+ | Offload Ratio (dd | 91.67% | | |
41
+ | fusion) | | | |
42
+ +--------------------+-------------+--------------------+---------------------+
vae_encoder/dd/replaced.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ec267beaa5e8681a2494a4d64adb0ad15a9ed8274926ff171124e407ca32acc
3
+ size 40934