pcuenq HF staff committed on
Commit
f91130a
1 Parent(s): 96a2c3d

VAE Encoder (#3)

Browse files
original/compiled/VAEEncoder.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e27fb7ebcffa0ff79c7212e1e914dbc14fddb8265b8c73d0d322a7eea4ef01e8
3
+ size 207
original/compiled/VAEEncoder.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b8cb326a2c2071e8ba0b1ef1084609061d0e86a603f55d066d25c60e04acd4a
3
+ size 1272
original/compiled/VAEEncoder.mlmodelc/metadata.json ADDED
@@ -0,0 +1,118 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
4
+ "metadataOutputVersion" : "3.0",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float32",
10
+ "formattedType" : "MultiArray (Float32)",
11
+ "shortDescription" : "The latent embeddings from the unet model from the input image.",
12
+ "shape" : "[]",
13
+ "name" : "latent_dist",
14
+ "type" : "MultiArray"
15
+ }
16
+ ],
17
+ "version" : "CompVis\/stable-diffusion-v1-4",
18
+ "modelParameters" : [
19
+
20
+ ],
21
+ "author" : "Please refer to the Model Card available at huggingface.co\/CompVis\/stable-diffusion-v1-4",
22
+ "specificationVersion" : 7,
23
+ "storagePrecision" : "Float16",
24
+ "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
25
+ "mlProgramOperationTypeHistogram" : {
26
+ "Transpose" : 7,
27
+ "Ios16.exp" : 1,
28
+ "Ios16.reduceMean" : 44,
29
+ "Ios16.softmax" : 1,
30
+ "Split" : 1,
31
+ "Ios16.linear" : 4,
32
+ "Ios16.add" : 35,
33
+ "Ios16.realDiv" : 22,
34
+ "Ios16.square" : 22,
35
+ "Pad" : 3,
36
+ "Ios16.sub" : 22,
37
+ "Ios16.cast" : 1,
38
+ "Ios16.clip" : 1,
39
+ "Ios16.conv" : 28,
40
+ "Ios16.matmul" : 2,
41
+ "Ios16.reshape" : 54,
42
+ "Ios16.batchNorm" : 22,
43
+ "Ios16.silu" : 21,
44
+ "Ios16.sqrt" : 22,
45
+ "Ios16.mul" : 6
46
+ },
47
+ "computePrecision" : "Mixed (Float32, Float16, Int32)",
48
+ "isUpdatable" : "0",
49
+ "availability" : {
50
+ "macOS" : "13.0",
51
+ "tvOS" : "16.0",
52
+ "watchOS" : "9.0",
53
+ "iOS" : "16.0",
54
+ "macCatalyst" : "16.0"
55
+ },
56
+ "modelType" : {
57
+ "name" : "MLModelType_mlProgram"
58
+ },
59
+ "inputSchema" : [
60
+ {
61
+ "hasShapeFlexibility" : "0",
62
+ "isOptional" : "0",
63
+ "dataType" : "Float16",
64
+ "formattedType" : "MultiArray (Float16 1 × 3 × 512 × 512)",
65
+ "shortDescription" : "An image of the correct size to create the latent space with, image2image and in-painting.",
66
+ "shape" : "[1, 3, 512, 512]",
67
+ "name" : "sample",
68
+ "type" : "MultiArray"
69
+ },
70
+ {
71
+ "hasShapeFlexibility" : "0",
72
+ "isOptional" : "0",
73
+ "dataType" : "Float16",
74
+ "formattedType" : "MultiArray (Float16 1 × 4 × 64 × 64)",
75
+ "shortDescription" : "Latent noise for `DiagonalGaussianDistribution` operation.",
76
+ "shape" : "[1, 4, 64, 64]",
77
+ "name" : "diagonal_noise",
78
+ "type" : "MultiArray"
79
+ },
80
+ {
81
+ "hasShapeFlexibility" : "0",
82
+ "isOptional" : "0",
83
+ "dataType" : "Float16",
84
+ "formattedType" : "MultiArray (Float16 1 × 4 × 64 × 64)",
85
+ "shortDescription" : "Latent noise for use with strength parameter of image2image",
86
+ "shape" : "[1, 4, 64, 64]",
87
+ "name" : "noise",
88
+ "type" : "MultiArray"
89
+ },
90
+ {
91
+ "hasShapeFlexibility" : "0",
92
+ "isOptional" : "0",
93
+ "dataType" : "Float16",
94
+ "formattedType" : "MultiArray (Float16 1 × 1)",
95
+ "shortDescription" : "Precalculated `sqrt_alphas_cumprod` value based on strength and the current scheduler's alphasCumprod values",
96
+ "shape" : "[1, 1]",
97
+ "name" : "sqrt_alphas_cumprod",
98
+ "type" : "MultiArray"
99
+ },
100
+ {
101
+ "hasShapeFlexibility" : "0",
102
+ "isOptional" : "0",
103
+ "dataType" : "Float16",
104
+ "formattedType" : "MultiArray (Float16 1 × 1)",
105
+ "shortDescription" : "Precalculated `sqrt_one_minus_alphas_cumprod` value based on strength and the current scheduler's alphasCumprod values",
106
+ "shape" : "[1, 1]",
107
+ "name" : "sqrt_one_minus_alphas_cumprod",
108
+ "type" : "MultiArray"
109
+ }
110
+ ],
111
+ "userDefinedMetadata" : {
112
+ "com.github.apple.coremltools.version" : "6.1",
113
+ "com.github.apple.coremltools.source" : "torch==1.13.0"
114
+ },
115
+ "generatedClassName" : "Stable_Diffusion_version_CompVis_stable_diffusion_v1_4_vae_encoder",
116
+ "method" : "predict"
117
+ }
118
+ ]
original/compiled/VAEEncoder.mlmodelc/model.mil ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:823a50e22d4989acd5247f33e8cc52e0caf5dbceec978fe76f6a5dd9759c2c7f
3
+ size 137752
original/compiled/VAEEncoder.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edc9a37ae7f0c7b1696798514fa2224d183e5154356a356c0975acb6e9e7bba6
3
+ size 68370240
original/packages/Stable_Diffusion_version_CompVis_stable-diffusion-v1-4_vae_encoder.mlpackage/Data/com.apple.CoreML/model.mlmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6269f295fe1eef3d3194186afbf56d932b399d528663ff95fc56cfdf1885d015
3
+ size 117448
original/packages/Stable_Diffusion_version_CompVis_stable-diffusion-v1-4_vae_encoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edc9a37ae7f0c7b1696798514fa2224d183e5154356a356c0975acb6e9e7bba6
3
+ size 68370240
original/packages/Stable_Diffusion_version_CompVis_stable-diffusion-v1-4_vae_encoder.mlpackage/Manifest.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fileFormatVersion": "1.0.0",
3
+ "itemInfoEntries": {
4
+ "572B88FB-BD8C-4BB2-94A9-59BBAA98B7E6": {
5
+ "author": "com.apple.CoreML",
6
+ "description": "CoreML Model Weights",
7
+ "name": "weights",
8
+ "path": "com.apple.CoreML/weights"
9
+ },
10
+ "908BDF53-CD61-4E50-821B-0721632446FB": {
11
+ "author": "com.apple.CoreML",
12
+ "description": "CoreML Model Specification",
13
+ "name": "model.mlmodel",
14
+ "path": "com.apple.CoreML/model.mlmodel"
15
+ }
16
+ },
17
+ "rootModelIdentifier": "908BDF53-CD61-4E50-821B-0721632446FB"
18
+ }
split_einsum/compiled/VAEEncoder.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e27fb7ebcffa0ff79c7212e1e914dbc14fddb8265b8c73d0d322a7eea4ef01e8
3
+ size 207
split_einsum/compiled/VAEEncoder.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a8053f3c4f3cebb592d42dd6e2dad8758c4c40417c8552424faf74c9986fe3f
3
+ size 1272
split_einsum/compiled/VAEEncoder.mlmodelc/metadata.json ADDED
@@ -0,0 +1,118 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
4
+ "metadataOutputVersion" : "3.0",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float32",
10
+ "formattedType" : "MultiArray (Float32)",
11
+ "shortDescription" : "The latent embeddings from the unet model from the input image.",
12
+ "shape" : "[]",
13
+ "name" : "latent_dist",
14
+ "type" : "MultiArray"
15
+ }
16
+ ],
17
+ "version" : "CompVis\/stable-diffusion-v1-4",
18
+ "modelParameters" : [
19
+
20
+ ],
21
+ "author" : "Please refer to the Model Card available at huggingface.co\/CompVis\/stable-diffusion-v1-4",
22
+ "specificationVersion" : 7,
23
+ "storagePrecision" : "Float16",
24
+ "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
25
+ "mlProgramOperationTypeHistogram" : {
26
+ "Transpose" : 7,
27
+ "Ios16.exp" : 1,
28
+ "Ios16.reduceMean" : 44,
29
+ "Ios16.softmax" : 1,
30
+ "Split" : 1,
31
+ "Ios16.linear" : 4,
32
+ "Ios16.add" : 35,
33
+ "Ios16.realDiv" : 22,
34
+ "Ios16.square" : 22,
35
+ "Pad" : 3,
36
+ "Ios16.sub" : 22,
37
+ "Ios16.cast" : 1,
38
+ "Ios16.clip" : 1,
39
+ "Ios16.conv" : 28,
40
+ "Ios16.matmul" : 2,
41
+ "Ios16.reshape" : 54,
42
+ "Ios16.batchNorm" : 22,
43
+ "Ios16.silu" : 21,
44
+ "Ios16.sqrt" : 22,
45
+ "Ios16.mul" : 6
46
+ },
47
+ "computePrecision" : "Mixed (Float32, Float16, Int32)",
48
+ "isUpdatable" : "0",
49
+ "availability" : {
50
+ "macOS" : "13.0",
51
+ "tvOS" : "16.0",
52
+ "watchOS" : "9.0",
53
+ "iOS" : "16.0",
54
+ "macCatalyst" : "16.0"
55
+ },
56
+ "modelType" : {
57
+ "name" : "MLModelType_mlProgram"
58
+ },
59
+ "inputSchema" : [
60
+ {
61
+ "hasShapeFlexibility" : "0",
62
+ "isOptional" : "0",
63
+ "dataType" : "Float16",
64
+ "formattedType" : "MultiArray (Float16 1 × 3 × 512 × 512)",
65
+ "shortDescription" : "An image of the correct size to create the latent space with, image2image and in-painting.",
66
+ "shape" : "[1, 3, 512, 512]",
67
+ "name" : "sample",
68
+ "type" : "MultiArray"
69
+ },
70
+ {
71
+ "hasShapeFlexibility" : "0",
72
+ "isOptional" : "0",
73
+ "dataType" : "Float16",
74
+ "formattedType" : "MultiArray (Float16 1 × 4 × 64 × 64)",
75
+ "shortDescription" : "Latent noise for `DiagonalGaussianDistribution` operation.",
76
+ "shape" : "[1, 4, 64, 64]",
77
+ "name" : "diagonal_noise",
78
+ "type" : "MultiArray"
79
+ },
80
+ {
81
+ "hasShapeFlexibility" : "0",
82
+ "isOptional" : "0",
83
+ "dataType" : "Float16",
84
+ "formattedType" : "MultiArray (Float16 1 × 4 × 64 × 64)",
85
+ "shortDescription" : "Latent noise for use with strength parameter of image2image",
86
+ "shape" : "[1, 4, 64, 64]",
87
+ "name" : "noise",
88
+ "type" : "MultiArray"
89
+ },
90
+ {
91
+ "hasShapeFlexibility" : "0",
92
+ "isOptional" : "0",
93
+ "dataType" : "Float16",
94
+ "formattedType" : "MultiArray (Float16 1 × 1)",
95
+ "shortDescription" : "Precalculated `sqrt_alphas_cumprod` value based on strength and the current scheduler's alphasCumprod values",
96
+ "shape" : "[1, 1]",
97
+ "name" : "sqrt_alphas_cumprod",
98
+ "type" : "MultiArray"
99
+ },
100
+ {
101
+ "hasShapeFlexibility" : "0",
102
+ "isOptional" : "0",
103
+ "dataType" : "Float16",
104
+ "formattedType" : "MultiArray (Float16 1 × 1)",
105
+ "shortDescription" : "Precalculated `sqrt_one_minus_alphas_cumprod` value based on strength and the current scheduler's alphasCumprod values",
106
+ "shape" : "[1, 1]",
107
+ "name" : "sqrt_one_minus_alphas_cumprod",
108
+ "type" : "MultiArray"
109
+ }
110
+ ],
111
+ "userDefinedMetadata" : {
112
+ "com.github.apple.coremltools.version" : "6.1",
113
+ "com.github.apple.coremltools.source" : "torch==1.13.0"
114
+ },
115
+ "generatedClassName" : "Stable_Diffusion_version_CompVis_stable_diffusion_v1_4_vae_encoder",
116
+ "method" : "predict"
117
+ }
118
+ ]
split_einsum/compiled/VAEEncoder.mlmodelc/model.mil ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:823a50e22d4989acd5247f33e8cc52e0caf5dbceec978fe76f6a5dd9759c2c7f
3
+ size 137752
split_einsum/compiled/VAEEncoder.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2604aac03e12dde2d56b35a7d2f6c3275860b049ea2dedd75426c2a5c3a6c667
3
+ size 68370240
split_einsum/packages/Stable_Diffusion_version_CompVis_stable-diffusion-v1-4_vae_encoder.mlpackage/Data/com.apple.CoreML/model.mlmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6269f295fe1eef3d3194186afbf56d932b399d528663ff95fc56cfdf1885d015
3
+ size 117448
split_einsum/packages/Stable_Diffusion_version_CompVis_stable-diffusion-v1-4_vae_encoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2604aac03e12dde2d56b35a7d2f6c3275860b049ea2dedd75426c2a5c3a6c667
3
+ size 68370240
split_einsum/packages/Stable_Diffusion_version_CompVis_stable-diffusion-v1-4_vae_encoder.mlpackage/Manifest.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fileFormatVersion": "1.0.0",
3
+ "itemInfoEntries": {
4
+ "73F723E9-BBE9-40B7-8113-8FCA8733A20D": {
5
+ "author": "com.apple.CoreML",
6
+ "description": "CoreML Model Specification",
7
+ "name": "model.mlmodel",
8
+ "path": "com.apple.CoreML/model.mlmodel"
9
+ },
10
+ "DEB5F935-76BB-4FD1-BBD6-968993E96111": {
11
+ "author": "com.apple.CoreML",
12
+ "description": "CoreML Model Weights",
13
+ "name": "weights",
14
+ "path": "com.apple.CoreML/weights"
15
+ }
16
+ },
17
+ "rootModelIdentifier": "73F723E9-BBE9-40B7-8113-8FCA8733A20D"
18
+ }