jonathanbenavides committed on
Commit
a913451
·
verified ·
1 Parent(s): 7d739ad

Adding files

Browse files
TextEncoder.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc42c2465771ddb06778190f611cc29696fb0a5f64b327ba01fefa0db1b0e94b
3
+ size 243
TextEncoder.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a4f8bbf1a17a22e5912d0bd547d84d8c7b0c94822c4ac59fa1ff043c2e16b33
3
+ size 961
TextEncoder.mlmodelc/metadata.json ADDED
@@ -0,0 +1,84 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
4
+ "metadataOutputVersion" : "3.0",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float32",
10
+ "formattedType" : "MultiArray (Float32 1 × 77 × 768)",
11
+ "shortDescription" : "Hidden states after the encoder layers",
12
+ "shape" : "[1, 77, 768]",
13
+ "name" : "hidden_embeds",
14
+ "type" : "MultiArray"
15
+ },
16
+ {
17
+ "hasShapeFlexibility" : "0",
18
+ "isOptional" : "0",
19
+ "dataType" : "Float32",
20
+ "formattedType" : "MultiArray (Float32 1 × 768)",
21
+ "shortDescription" : "The version of the `last_hidden_state` output after pooling",
22
+ "shape" : "[1, 768]",
23
+ "name" : "pooled_outputs",
24
+ "type" : "MultiArray"
25
+ }
26
+ ],
27
+ "version" : "turbovisionxlSuperFastXLBasedOnNew_tvxlV431Bakedvae_diffusers",
28
+ "modelParameters" : [
29
+
30
+ ],
31
+ "author" : "Please refer to the Model Card available at huggingface.co\/turbovisionxlSuperFastXLBasedOnNew_tvxlV431Bakedvae_diffusers",
32
+ "specificationVersion" : 7,
33
+ "storagePrecision" : "Float16",
34
+ "license" : "OpenRAIL++-M (https:\/\/huggingface.co\/stabilityai\/stable-diffusion-xl-base-1.0\/blob\/main\/LICENSE.md)",
35
+ "mlProgramOperationTypeHistogram" : {
36
+ "Ios16.cast" : 3,
37
+ "Ios16.mul" : 36,
38
+ "Ios16.layerNorm" : 25,
39
+ "Stack" : 1,
40
+ "Transpose" : 60,
41
+ "Ios16.sigmoid" : 12,
42
+ "Ios16.linear" : 72,
43
+ "Ios16.add" : 37,
44
+ "Ios16.matmul" : 24,
45
+ "Ios16.softmax" : 12,
46
+ "Ios16.gatherNd" : 1,
47
+ "Ios16.gather" : 1,
48
+ "Ios16.reshape" : 120,
49
+ "Ios16.reduceArgmax" : 1
50
+ },
51
+ "computePrecision" : "Mixed (Float16, Float32, Int32)",
52
+ "isUpdatable" : "0",
53
+ "availability" : {
54
+ "macOS" : "13.0",
55
+ "tvOS" : "16.0",
56
+ "visionOS" : "1.0",
57
+ "watchOS" : "9.0",
58
+ "iOS" : "16.0",
59
+ "macCatalyst" : "16.0"
60
+ },
61
+ "modelType" : {
62
+ "name" : "MLModelType_mlProgram"
63
+ },
64
+ "inputSchema" : [
65
+ {
66
+ "hasShapeFlexibility" : "0",
67
+ "isOptional" : "0",
68
+ "dataType" : "Float32",
69
+ "formattedType" : "MultiArray (Float32 1 × 77)",
70
+ "shortDescription" : "The token ids that represent the input text",
71
+ "shape" : "[1, 77]",
72
+ "name" : "input_ids",
73
+ "type" : "MultiArray"
74
+ }
75
+ ],
76
+ "userDefinedMetadata" : {
77
+ "com.github.apple.coremltools.source_dialect" : "TorchScript",
78
+ "com.github.apple.coremltools.source" : "torch==2.1.2",
79
+ "com.github.apple.coremltools.version" : "7.1"
80
+ },
81
+ "generatedClassName" : "Stable_Diffusion_version_turbovisionxlSuperFastXLBasedOnNew_tvxlV431Bakedvae_diffusers_text_encoder",
82
+ "method" : "predict"
83
+ }
84
+ ]
TextEncoder.mlmodelc/model.mil ADDED
The diff for this file is too large to render. See raw diff
 
TextEncoder.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b8fb36808ab8d86254cae8c934591223124ffff0c8c6b213c52d9e3986d4ae0
3
+ size 246145536
TextEncoder2.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:939e4df0cbed526bc2ace0f21bff7b4345562068bc2bbbfb49ff5f3d04b217b8
3
+ size 243
TextEncoder2.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccab3111a97ae96a289f1e1809711f79d52fe4598fa7e56ed070a30b949131cc
3
+ size 961
TextEncoder2.mlmodelc/metadata.json ADDED
@@ -0,0 +1,84 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
4
+ "metadataOutputVersion" : "3.0",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float32",
10
+ "formattedType" : "MultiArray (Float32 1 × 77 × 1280)",
11
+ "shortDescription" : "Hidden states after the encoder layers",
12
+ "shape" : "[1, 77, 1280]",
13
+ "name" : "hidden_embeds",
14
+ "type" : "MultiArray"
15
+ },
16
+ {
17
+ "hasShapeFlexibility" : "0",
18
+ "isOptional" : "0",
19
+ "dataType" : "Float32",
20
+ "formattedType" : "MultiArray (Float32 1 × 1280)",
21
+ "shortDescription" : "The version of the `last_hidden_state` output after pooling",
22
+ "shape" : "[1, 1280]",
23
+ "name" : "pooled_outputs",
24
+ "type" : "MultiArray"
25
+ }
26
+ ],
27
+ "version" : "turbovisionxlSuperFastXLBasedOnNew_tvxlV431Bakedvae_diffusers",
28
+ "modelParameters" : [
29
+
30
+ ],
31
+ "author" : "Please refer to the Model Card available at huggingface.co\/turbovisionxlSuperFastXLBasedOnNew_tvxlV431Bakedvae_diffusers",
32
+ "specificationVersion" : 7,
33
+ "storagePrecision" : "Float16",
34
+ "license" : "OpenRAIL++-M (https:\/\/huggingface.co\/stabilityai\/stable-diffusion-xl-base-1.0\/blob\/main\/LICENSE.md)",
35
+ "mlProgramOperationTypeHistogram" : {
36
+ "Ios16.cast" : 3,
37
+ "Ios16.mul" : 32,
38
+ "Ios16.layerNorm" : 65,
39
+ "Stack" : 1,
40
+ "Transpose" : 160,
41
+ "Ios16.linear" : 193,
42
+ "Ios16.add" : 97,
43
+ "Ios16.matmul" : 64,
44
+ "Ios16.gelu" : 32,
45
+ "Ios16.softmax" : 32,
46
+ "Ios16.gatherNd" : 1,
47
+ "Ios16.gather" : 1,
48
+ "Ios16.reshape" : 320,
49
+ "Ios16.reduceArgmax" : 1
50
+ },
51
+ "computePrecision" : "Mixed (Float16, Float32, Int32)",
52
+ "isUpdatable" : "0",
53
+ "availability" : {
54
+ "macOS" : "13.0",
55
+ "tvOS" : "16.0",
56
+ "visionOS" : "1.0",
57
+ "watchOS" : "9.0",
58
+ "iOS" : "16.0",
59
+ "macCatalyst" : "16.0"
60
+ },
61
+ "modelType" : {
62
+ "name" : "MLModelType_mlProgram"
63
+ },
64
+ "inputSchema" : [
65
+ {
66
+ "hasShapeFlexibility" : "0",
67
+ "isOptional" : "0",
68
+ "dataType" : "Float32",
69
+ "formattedType" : "MultiArray (Float32 1 × 77)",
70
+ "shortDescription" : "The token ids that represent the input text",
71
+ "shape" : "[1, 77]",
72
+ "name" : "input_ids",
73
+ "type" : "MultiArray"
74
+ }
75
+ ],
76
+ "userDefinedMetadata" : {
77
+ "com.github.apple.coremltools.source_dialect" : "TorchScript",
78
+ "com.github.apple.coremltools.source" : "torch==2.1.2",
79
+ "com.github.apple.coremltools.version" : "7.1"
80
+ },
81
+ "generatedClassName" : "Stable_Diffusion_version_turbovisionxlSuperFastXLBasedOnNew_tvxlV431Bakedvae_diffusers_text_encoder_2",
82
+ "method" : "predict"
83
+ }
84
+ ]
TextEncoder2.mlmodelc/model.mil ADDED
The diff for this file is too large to render. See raw diff
 
TextEncoder2.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09358857334c71c8993aa4565766dd5dbc3c56cfe0ebca5b188369026ed0a900
3
+ size 1389367424
Unet.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc04a07715e0400945008ef2fb3360f59a61069b9c2d5793afb253318688df13
3
+ size 243
Unet.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:149a68be62f848a315718547537f6d154b4b98a333819cfb7b0c25be5cbbb515
3
+ size 1713
Unet.mlmodelc/metadata.json ADDED
@@ -0,0 +1,124 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "shortDescription" : "Stable Diffusion generates images conditioned on text or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
4
+ "metadataOutputVersion" : "3.0",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float32",
10
+ "formattedType" : "MultiArray (Float32 2 × 4 × 96 × 96)",
11
+ "shortDescription" : "Same shape and dtype as the `sample` input. The predicted noise to facilitate the reverse diffusion (denoising) process",
12
+ "shape" : "[2, 4, 96, 96]",
13
+ "name" : "noise_pred",
14
+ "type" : "MultiArray"
15
+ }
16
+ ],
17
+ "version" : "turbovisionxlSuperFastXLBasedOnNew_tvxlV431Bakedvae_diffusers",
18
+ "modelParameters" : [
19
+
20
+ ],
21
+ "author" : "Please refer to the Model Card available at huggingface.co\/turbovisionxlSuperFastXLBasedOnNew_tvxlV431Bakedvae_diffusers",
22
+ "specificationVersion" : 7,
23
+ "storagePrecision" : "Float16",
24
+ "license" : "OpenRAIL++-M (https:\/\/huggingface.co\/stabilityai\/stable-diffusion-xl-base-1.0\/blob\/main\/LICENSE.md)",
25
+ "mlProgramOperationTypeHistogram" : {
26
+ "UpsampleNearestNeighbor" : 2,
27
+ "Ios16.reduceMean" : 512,
28
+ "Ios16.sin" : 2,
29
+ "Ios16.softmax" : 140,
30
+ "Split" : 70,
31
+ "Ios16.add" : 722,
32
+ "Concat" : 14,
33
+ "Ios16.realDiv" : 46,
34
+ "Ios16.square" : 46,
35
+ "ExpandDims" : 6,
36
+ "Ios16.sub" : 256,
37
+ "Ios16.cast" : 1,
38
+ "Ios16.conv" : 794,
39
+ "Ios16.gelu" : 70,
40
+ "Ios16.matmul" : 280,
41
+ "Ios16.reshape" : 676,
42
+ "Ios16.batchNorm" : 46,
43
+ "Ios16.rsqrt" : 210,
44
+ "Ios16.silu" : 38,
45
+ "Ios16.sqrt" : 46,
46
+ "SliceByIndex" : 4,
47
+ "Ios16.mul" : 842,
48
+ "Ios16.cos" : 2
49
+ },
50
+ "computePrecision" : "Mixed (Float16, Float32, Int32)",
51
+ "isUpdatable" : "0",
52
+ "availability" : {
53
+ "macOS" : "13.0",
54
+ "tvOS" : "16.0",
55
+ "visionOS" : "1.0",
56
+ "watchOS" : "9.0",
57
+ "iOS" : "16.0",
58
+ "macCatalyst" : "16.0"
59
+ },
60
+ "modelType" : {
61
+ "name" : "MLModelType_mlProgram"
62
+ },
63
+ "inputSchema" : [
64
+ {
65
+ "hasShapeFlexibility" : "0",
66
+ "isOptional" : "0",
67
+ "dataType" : "Float16",
68
+ "formattedType" : "MultiArray (Float16 2 × 4 × 96 × 96)",
69
+ "shortDescription" : "The low resolution latent feature maps being denoised through reverse diffusion",
70
+ "shape" : "[2, 4, 96, 96]",
71
+ "name" : "sample",
72
+ "type" : "MultiArray"
73
+ },
74
+ {
75
+ "hasShapeFlexibility" : "0",
76
+ "isOptional" : "0",
77
+ "dataType" : "Float16",
78
+ "formattedType" : "MultiArray (Float16 2)",
79
+ "shortDescription" : "A value emitted by the associated scheduler object to condition the model on a given noise schedule",
80
+ "shape" : "[2]",
81
+ "name" : "timestep",
82
+ "type" : "MultiArray"
83
+ },
84
+ {
85
+ "hasShapeFlexibility" : "0",
86
+ "isOptional" : "0",
87
+ "dataType" : "Float16",
88
+ "formattedType" : "MultiArray (Float16 2 × 2048 × 1 × 77)",
89
+ "shortDescription" : "Output embeddings from the associated text_encoder model to condition to generated image on text. A maximum of 77 tokens (~40 words) are allowed. Longer text is truncated. Shorter text does not reduce computation.",
90
+ "shape" : "[2, 2048, 1, 77]",
91
+ "name" : "encoder_hidden_states",
92
+ "type" : "MultiArray"
93
+ },
94
+ {
95
+ "hasShapeFlexibility" : "0",
96
+ "isOptional" : "0",
97
+ "dataType" : "Float16",
98
+ "formattedType" : "MultiArray (Float16 2 × 6)",
99
+ "shortDescription" : "Additional embeddings that if specified are added to the embeddings that are passed along to the UNet blocks.",
100
+ "shape" : "[2, 6]",
101
+ "name" : "time_ids",
102
+ "type" : "MultiArray"
103
+ },
104
+ {
105
+ "hasShapeFlexibility" : "0",
106
+ "isOptional" : "0",
107
+ "dataType" : "Float16",
108
+ "formattedType" : "MultiArray (Float16 2 × 1280)",
109
+ "shortDescription" : "Additional embeddings from text_encoder_2 that if specified are added to the embeddings that are passed along to the UNet blocks.",
110
+ "shape" : "[2, 1280]",
111
+ "name" : "text_embeds",
112
+ "type" : "MultiArray"
113
+ }
114
+ ],
115
+ "userDefinedMetadata" : {
116
+ "com.github.apple.ml-stable-diffusion.version" : "1.1.0",
117
+ "com.github.apple.coremltools.source" : "torch==2.1.2",
118
+ "com.github.apple.coremltools.version" : "7.1",
119
+ "com.github.apple.coremltools.source_dialect" : "TorchScript"
120
+ },
121
+ "generatedClassName" : "Stable_Diffusion_version_turbovisionxlSuperFastXLBasedOnNew_tvxlV431Bakedvae_diffusers_unet",
122
+ "method" : "predict"
123
+ }
124
+ ]
Unet.mlmodelc/model.mil ADDED
The diff for this file is too large to render. See raw diff
 
Unet.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca61a9e9d3ae653611841f73322138edc73ce5b0067dd3013c6424454b6f401c
3
+ size 5135067072
VAEDecoder.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18191a2b07696a539adfb10f33899c47b8bf1640b95d77a7da0b8872e2f02289
3
+ size 243
VAEDecoder.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23ff78fb3be7dba159a45ef2fb91a6d9adf150ebeea2d978ed2e0de46d8103fe
3
+ size 910
VAEDecoder.mlmodelc/metadata.json ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
4
+ "metadataOutputVersion" : "3.0",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float32",
10
+ "formattedType" : "MultiArray (Float32 1 × 3 × 768 × 768)",
11
+ "shortDescription" : "Generated image normalized to range [-1, 1]",
12
+ "shape" : "[1, 3, 768, 768]",
13
+ "name" : "image",
14
+ "type" : "MultiArray"
15
+ }
16
+ ],
17
+ "version" : "turbovisionxlSuperFastXLBasedOnNew_tvxlV431Bakedvae_diffusers",
18
+ "modelParameters" : [
19
+
20
+ ],
21
+ "author" : "Please refer to the Model Card available at huggingface.co\/turbovisionxlSuperFastXLBasedOnNew_tvxlV431Bakedvae_diffusers",
22
+ "specificationVersion" : 7,
23
+ "storagePrecision" : "Float32",
24
+ "license" : "OpenRAIL++-M (https:\/\/huggingface.co\/stabilityai\/stable-diffusion-xl-base-1.0\/blob\/main\/LICENSE.md)",
25
+ "mlProgramOperationTypeHistogram" : {
26
+ "Ios16.mul" : 2,
27
+ "Ios16.sqrt" : 30,
28
+ "Ios16.sub" : 30,
29
+ "Transpose" : 6,
30
+ "UpsampleNearestNeighbor" : 3,
31
+ "Ios16.conv" : 36,
32
+ "Ios16.add" : 46,
33
+ "Ios16.linear" : 4,
34
+ "Ios16.matmul" : 2,
35
+ "Ios16.realDiv" : 30,
36
+ "Ios16.reduceMean" : 60,
37
+ "Ios16.softmax" : 1,
38
+ "Ios16.batchNorm" : 29,
39
+ "Ios16.square" : 30,
40
+ "Ios16.reshape" : 65,
41
+ "Ios16.silu" : 29
42
+ },
43
+ "computePrecision" : "Mixed (Float32, Int32)",
44
+ "isUpdatable" : "0",
45
+ "availability" : {
46
+ "macOS" : "13.0",
47
+ "tvOS" : "16.0",
48
+ "visionOS" : "1.0",
49
+ "watchOS" : "9.0",
50
+ "iOS" : "16.0",
51
+ "macCatalyst" : "16.0"
52
+ },
53
+ "modelType" : {
54
+ "name" : "MLModelType_mlProgram"
55
+ },
56
+ "inputSchema" : [
57
+ {
58
+ "hasShapeFlexibility" : "0",
59
+ "isOptional" : "0",
60
+ "dataType" : "Float32",
61
+ "formattedType" : "MultiArray (Float32 1 × 4 × 96 × 96)",
62
+ "shortDescription" : "The denoised latent embeddings from the unet model after the last step of reverse diffusion",
63
+ "shape" : "[1, 4, 96, 96]",
64
+ "name" : "z",
65
+ "type" : "MultiArray"
66
+ }
67
+ ],
68
+ "userDefinedMetadata" : {
69
+ "com.github.apple.coremltools.source_dialect" : "TorchScript",
70
+ "com.github.apple.coremltools.source" : "torch==2.1.2",
71
+ "com.github.apple.coremltools.version" : "7.1"
72
+ },
73
+ "generatedClassName" : "Stable_Diffusion_version_turbovisionxlSuperFastXLBasedOnNew_tvxlV431Bakedvae_diffusers_vae_decoder",
74
+ "method" : "predict"
75
+ }
76
+ ]
VAEDecoder.mlmodelc/model.mil ADDED
The diff for this file is too large to render. See raw diff
 
VAEDecoder.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c07e9d7970c403188483df17fa736254aa9e1201f395a7fb05a8ccacf9e9a807
3
+ size 197977216
VAEEncoder.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd09da9da725147cd68f67d424955f7f7c95bfd4fa8392d387c0f7b47884ac98
3
+ size 243
VAEEncoder.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c641e2ef913abeaa33d28050f3acf074c56a4d07f56cc4a843d169285156541b
3
+ size 914
VAEEncoder.mlmodelc/metadata.json ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
4
+ "metadataOutputVersion" : "3.0",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float32",
10
+ "formattedType" : "MultiArray (Float32 1 × 8 × 96 × 96)",
11
+ "shortDescription" : "The latent embeddings from the unet model from the input image.",
12
+ "shape" : "[1, 8, 96, 96]",
13
+ "name" : "latent",
14
+ "type" : "MultiArray"
15
+ }
16
+ ],
17
+ "version" : "turbovisionxlSuperFastXLBasedOnNew_tvxlV431Bakedvae_diffusers",
18
+ "modelParameters" : [
19
+
20
+ ],
21
+ "author" : "Please refer to the Model Card available at huggingface.co\/turbovisionxlSuperFastXLBasedOnNew_tvxlV431Bakedvae_diffusers",
22
+ "specificationVersion" : 7,
23
+ "storagePrecision" : "Float32",
24
+ "license" : "OpenRAIL++-M (https:\/\/huggingface.co\/stabilityai\/stable-diffusion-xl-base-1.0\/blob\/main\/LICENSE.md)",
25
+ "mlProgramOperationTypeHistogram" : {
26
+ "Pad" : 3,
27
+ "Ios16.mul" : 2,
28
+ "Ios16.sqrt" : 22,
29
+ "Ios16.sub" : 22,
30
+ "Transpose" : 6,
31
+ "Ios16.conv" : 28,
32
+ "Ios16.add" : 34,
33
+ "Ios16.linear" : 4,
34
+ "Ios16.matmul" : 2,
35
+ "Ios16.realDiv" : 22,
36
+ "Ios16.reduceMean" : 44,
37
+ "Ios16.softmax" : 1,
38
+ "Ios16.batchNorm" : 21,
39
+ "Ios16.square" : 22,
40
+ "Ios16.reshape" : 49,
41
+ "Ios16.silu" : 21
42
+ },
43
+ "computePrecision" : "Mixed (Float32, Int32)",
44
+ "isUpdatable" : "0",
45
+ "availability" : {
46
+ "macOS" : "13.0",
47
+ "tvOS" : "16.0",
48
+ "visionOS" : "1.0",
49
+ "watchOS" : "9.0",
50
+ "iOS" : "16.0",
51
+ "macCatalyst" : "16.0"
52
+ },
53
+ "modelType" : {
54
+ "name" : "MLModelType_mlProgram"
55
+ },
56
+ "inputSchema" : [
57
+ {
58
+ "hasShapeFlexibility" : "0",
59
+ "isOptional" : "0",
60
+ "dataType" : "Float32",
61
+ "formattedType" : "MultiArray (Float32 1 × 3 × 768 × 768)",
62
+ "shortDescription" : "The input image to base the initial latents on normalized to range [-1, 1]",
63
+ "shape" : "[1, 3, 768, 768]",
64
+ "name" : "x",
65
+ "type" : "MultiArray"
66
+ }
67
+ ],
68
+ "userDefinedMetadata" : {
69
+ "com.github.apple.coremltools.source_dialect" : "TorchScript",
70
+ "com.github.apple.coremltools.source" : "torch==2.1.2",
71
+ "com.github.apple.coremltools.version" : "7.1"
72
+ },
73
+ "generatedClassName" : "Stable_Diffusion_version_turbovisionxlSuperFastXLBasedOnNew_tvxlV431Bakedvae_diffusers_vae_encoder",
74
+ "method" : "predict"
75
+ }
76
+ ]
VAEEncoder.mlmodelc/model.mil ADDED
The diff for this file is too large to render. See raw diff
 
VAEEncoder.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b07c246e38dc348797d1c723bf6eaa325fbd4d5cc38430d76eac757128b164a
3
+ size 136668992
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
vocab.json ADDED
The diff for this file is too large to render. See raw diff