pcuenq HF staff committed on
Commit
6b78662
1 Parent(s): ddab115

VAE Encoder (#4)

Browse files
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ .DS_Store
original/compiled/VAEEncoder.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:925a46e40af84f2a065c43d3d4bbe0d5b49766a08c75df4c46a870f2a191868c
3
+ size 207
original/compiled/VAEEncoder.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69c400c21fa4f0a15b9645d0f03ba36de9d758e0ca7ee076c079f449c3007ff1
3
+ size 1274
original/compiled/VAEEncoder.mlmodelc/metadata.json ADDED
@@ -0,0 +1,118 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
4
+ "metadataOutputVersion" : "3.0",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float32",
10
+ "formattedType" : "MultiArray (Float32)",
11
+ "shortDescription" : "The latent embeddings from the unet model from the input image.",
12
+ "shape" : "[]",
13
+ "name" : "latent_dist",
14
+ "type" : "MultiArray"
15
+ }
16
+ ],
17
+ "version" : "runwayml\/stable-diffusion-v1-5",
18
+ "modelParameters" : [
19
+
20
+ ],
21
+ "author" : "Please refer to the Model Card available at huggingface.co\/runwayml\/stable-diffusion-v1-5",
22
+ "specificationVersion" : 7,
23
+ "storagePrecision" : "Float16",
24
+ "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
25
+ "mlProgramOperationTypeHistogram" : {
26
+ "Transpose" : 7,
27
+ "Ios16.exp" : 1,
28
+ "Ios16.reduceMean" : 44,
29
+ "Ios16.softmax" : 1,
30
+ "Split" : 1,
31
+ "Ios16.linear" : 4,
32
+ "Ios16.add" : 35,
33
+ "Ios16.realDiv" : 22,
34
+ "Ios16.square" : 22,
35
+ "Pad" : 3,
36
+ "Ios16.sub" : 22,
37
+ "Ios16.cast" : 1,
38
+ "Ios16.clip" : 1,
39
+ "Ios16.conv" : 28,
40
+ "Ios16.matmul" : 2,
41
+ "Ios16.reshape" : 54,
42
+ "Ios16.batchNorm" : 22,
43
+ "Ios16.silu" : 21,
44
+ "Ios16.sqrt" : 22,
45
+ "Ios16.mul" : 6
46
+ },
47
+ "computePrecision" : "Mixed (Float32, Float16, Int32)",
48
+ "isUpdatable" : "0",
49
+ "availability" : {
50
+ "macOS" : "13.0",
51
+ "tvOS" : "16.0",
52
+ "watchOS" : "9.0",
53
+ "iOS" : "16.0",
54
+ "macCatalyst" : "16.0"
55
+ },
56
+ "modelType" : {
57
+ "name" : "MLModelType_mlProgram"
58
+ },
59
+ "inputSchema" : [
60
+ {
61
+ "hasShapeFlexibility" : "0",
62
+ "isOptional" : "0",
63
+ "dataType" : "Float16",
64
+ "formattedType" : "MultiArray (Float16 1 × 3 × 512 × 512)",
65
+ "shortDescription" : "An image of the correct size to create the latent space with, image2image and in-painting.",
66
+ "shape" : "[1, 3, 512, 512]",
67
+ "name" : "sample",
68
+ "type" : "MultiArray"
69
+ },
70
+ {
71
+ "hasShapeFlexibility" : "0",
72
+ "isOptional" : "0",
73
+ "dataType" : "Float16",
74
+ "formattedType" : "MultiArray (Float16 1 × 4 × 64 × 64)",
75
+ "shortDescription" : "Latent noise for `DiagonalGaussianDistribution` operation.",
76
+ "shape" : "[1, 4, 64, 64]",
77
+ "name" : "diagonal_noise",
78
+ "type" : "MultiArray"
79
+ },
80
+ {
81
+ "hasShapeFlexibility" : "0",
82
+ "isOptional" : "0",
83
+ "dataType" : "Float16",
84
+ "formattedType" : "MultiArray (Float16 1 × 4 × 64 × 64)",
85
+ "shortDescription" : "Latent noise for use with strength parameter of image2image",
86
+ "shape" : "[1, 4, 64, 64]",
87
+ "name" : "noise",
88
+ "type" : "MultiArray"
89
+ },
90
+ {
91
+ "hasShapeFlexibility" : "0",
92
+ "isOptional" : "0",
93
+ "dataType" : "Float16",
94
+ "formattedType" : "MultiArray (Float16 1 × 1)",
95
+ "shortDescription" : "Precalculated `sqrt_alphas_cumprod` value based on strength and the current scheduler's alphasCumprod values",
96
+ "shape" : "[1, 1]",
97
+ "name" : "sqrt_alphas_cumprod",
98
+ "type" : "MultiArray"
99
+ },
100
+ {
101
+ "hasShapeFlexibility" : "0",
102
+ "isOptional" : "0",
103
+ "dataType" : "Float16",
104
+ "formattedType" : "MultiArray (Float16 1 × 1)",
105
+ "shortDescription" : "Precalculated `sqrt_one_minus_alphas_cumprod` value based on strength and the current scheduler's alphasCumprod values",
106
+ "shape" : "[1, 1]",
107
+ "name" : "sqrt_one_minus_alphas_cumprod",
108
+ "type" : "MultiArray"
109
+ }
110
+ ],
111
+ "userDefinedMetadata" : {
112
+ "com.github.apple.coremltools.version" : "6.1",
113
+ "com.github.apple.coremltools.source" : "torch==1.13.1"
114
+ },
115
+ "generatedClassName" : "Stable_Diffusion_version_runwayml_stable_diffusion_v1_5_vae_encoder",
116
+ "method" : "predict"
117
+ }
118
+ ]
original/compiled/VAEEncoder.mlmodelc/model.mil ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3cd529b933adc7e28b4057051eb816d753241246416bceacf25eb844e2b64d4a
3
+ size 137752
original/compiled/VAEEncoder.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57d5438c221fc6c65bd4249f621cfd15deab77ee03495f5fb99662426ef74d51
3
+ size 68370240
original/packages/Stable_Diffusion_version_runwayml_stable-diffusion-v1-5_vae_encoder.mlpackage/Data/com.apple.CoreML/model.mlmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:573fa4f8e8eb1601aa2ba87a789bfba6c9ee3a0d6c09db67a5c7c22c96a9194f
3
+ size 117450
original/packages/Stable_Diffusion_version_runwayml_stable-diffusion-v1-5_vae_encoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57d5438c221fc6c65bd4249f621cfd15deab77ee03495f5fb99662426ef74d51
3
+ size 68370240
original/packages/Stable_Diffusion_version_runwayml_stable-diffusion-v1-5_vae_encoder.mlpackage/Manifest.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fileFormatVersion": "1.0.0",
3
+ "itemInfoEntries": {
4
+ "3D939470-6F09-4758-9FFC-5CDD63158DC7": {
5
+ "author": "com.apple.CoreML",
6
+ "description": "CoreML Model Specification",
7
+ "name": "model.mlmodel",
8
+ "path": "com.apple.CoreML/model.mlmodel"
9
+ },
10
+ "E607BD7B-4F90-4362-B733-CE538A162148": {
11
+ "author": "com.apple.CoreML",
12
+ "description": "CoreML Model Weights",
13
+ "name": "weights",
14
+ "path": "com.apple.CoreML/weights"
15
+ }
16
+ },
17
+ "rootModelIdentifier": "3D939470-6F09-4758-9FFC-5CDD63158DC7"
18
+ }
split_einsum/compiled/VAEEncoder.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:925a46e40af84f2a065c43d3d4bbe0d5b49766a08c75df4c46a870f2a191868c
3
+ size 207
split_einsum/compiled/VAEEncoder.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69c400c21fa4f0a15b9645d0f03ba36de9d758e0ca7ee076c079f449c3007ff1
3
+ size 1274
split_einsum/compiled/VAEEncoder.mlmodelc/metadata.json ADDED
@@ -0,0 +1,118 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
4
+ "metadataOutputVersion" : "3.0",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float32",
10
+ "formattedType" : "MultiArray (Float32)",
11
+ "shortDescription" : "The latent embeddings from the unet model from the input image.",
12
+ "shape" : "[]",
13
+ "name" : "latent_dist",
14
+ "type" : "MultiArray"
15
+ }
16
+ ],
17
+ "version" : "runwayml\/stable-diffusion-v1-5",
18
+ "modelParameters" : [
19
+
20
+ ],
21
+ "author" : "Please refer to the Model Card available at huggingface.co\/runwayml\/stable-diffusion-v1-5",
22
+ "specificationVersion" : 7,
23
+ "storagePrecision" : "Float16",
24
+ "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
25
+ "mlProgramOperationTypeHistogram" : {
26
+ "Transpose" : 7,
27
+ "Ios16.exp" : 1,
28
+ "Ios16.reduceMean" : 44,
29
+ "Ios16.softmax" : 1,
30
+ "Split" : 1,
31
+ "Ios16.linear" : 4,
32
+ "Ios16.add" : 35,
33
+ "Ios16.realDiv" : 22,
34
+ "Ios16.square" : 22,
35
+ "Pad" : 3,
36
+ "Ios16.sub" : 22,
37
+ "Ios16.cast" : 1,
38
+ "Ios16.clip" : 1,
39
+ "Ios16.conv" : 28,
40
+ "Ios16.matmul" : 2,
41
+ "Ios16.reshape" : 54,
42
+ "Ios16.batchNorm" : 22,
43
+ "Ios16.silu" : 21,
44
+ "Ios16.sqrt" : 22,
45
+ "Ios16.mul" : 6
46
+ },
47
+ "computePrecision" : "Mixed (Float32, Float16, Int32)",
48
+ "isUpdatable" : "0",
49
+ "availability" : {
50
+ "macOS" : "13.0",
51
+ "tvOS" : "16.0",
52
+ "watchOS" : "9.0",
53
+ "iOS" : "16.0",
54
+ "macCatalyst" : "16.0"
55
+ },
56
+ "modelType" : {
57
+ "name" : "MLModelType_mlProgram"
58
+ },
59
+ "inputSchema" : [
60
+ {
61
+ "hasShapeFlexibility" : "0",
62
+ "isOptional" : "0",
63
+ "dataType" : "Float16",
64
+ "formattedType" : "MultiArray (Float16 1 × 3 × 512 × 512)",
65
+ "shortDescription" : "An image of the correct size to create the latent space with, image2image and in-painting.",
66
+ "shape" : "[1, 3, 512, 512]",
67
+ "name" : "sample",
68
+ "type" : "MultiArray"
69
+ },
70
+ {
71
+ "hasShapeFlexibility" : "0",
72
+ "isOptional" : "0",
73
+ "dataType" : "Float16",
74
+ "formattedType" : "MultiArray (Float16 1 × 4 × 64 × 64)",
75
+ "shortDescription" : "Latent noise for `DiagonalGaussianDistribution` operation.",
76
+ "shape" : "[1, 4, 64, 64]",
77
+ "name" : "diagonal_noise",
78
+ "type" : "MultiArray"
79
+ },
80
+ {
81
+ "hasShapeFlexibility" : "0",
82
+ "isOptional" : "0",
83
+ "dataType" : "Float16",
84
+ "formattedType" : "MultiArray (Float16 1 × 4 × 64 × 64)",
85
+ "shortDescription" : "Latent noise for use with strength parameter of image2image",
86
+ "shape" : "[1, 4, 64, 64]",
87
+ "name" : "noise",
88
+ "type" : "MultiArray"
89
+ },
90
+ {
91
+ "hasShapeFlexibility" : "0",
92
+ "isOptional" : "0",
93
+ "dataType" : "Float16",
94
+ "formattedType" : "MultiArray (Float16 1 × 1)",
95
+ "shortDescription" : "Precalculated `sqrt_alphas_cumprod` value based on strength and the current scheduler's alphasCumprod values",
96
+ "shape" : "[1, 1]",
97
+ "name" : "sqrt_alphas_cumprod",
98
+ "type" : "MultiArray"
99
+ },
100
+ {
101
+ "hasShapeFlexibility" : "0",
102
+ "isOptional" : "0",
103
+ "dataType" : "Float16",
104
+ "formattedType" : "MultiArray (Float16 1 × 1)",
105
+ "shortDescription" : "Precalculated `sqrt_one_minus_alphas_cumprod` value based on strength and the current scheduler's alphasCumprod values",
106
+ "shape" : "[1, 1]",
107
+ "name" : "sqrt_one_minus_alphas_cumprod",
108
+ "type" : "MultiArray"
109
+ }
110
+ ],
111
+ "userDefinedMetadata" : {
112
+ "com.github.apple.coremltools.version" : "6.1",
113
+ "com.github.apple.coremltools.source" : "torch==1.13.1"
114
+ },
115
+ "generatedClassName" : "Stable_Diffusion_version_runwayml_stable_diffusion_v1_5_vae_encoder",
116
+ "method" : "predict"
117
+ }
118
+ ]
split_einsum/compiled/VAEEncoder.mlmodelc/model.mil ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3cd529b933adc7e28b4057051eb816d753241246416bceacf25eb844e2b64d4a
3
+ size 137752
split_einsum/compiled/VAEEncoder.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d34df7191f1b851ccbfc509c49afd294d2e7fc7bfc5103e79516388e16b3b726
3
+ size 68370240
split_einsum/packages/Stable_Diffusion_version_runwayml_stable-diffusion-v1-5_vae_encoder.mlpackage/Data/com.apple.CoreML/model.mlmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:573fa4f8e8eb1601aa2ba87a789bfba6c9ee3a0d6c09db67a5c7c22c96a9194f
3
+ size 117450
split_einsum/packages/Stable_Diffusion_version_runwayml_stable-diffusion-v1-5_vae_encoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d34df7191f1b851ccbfc509c49afd294d2e7fc7bfc5103e79516388e16b3b726
3
+ size 68370240
split_einsum/packages/Stable_Diffusion_version_runwayml_stable-diffusion-v1-5_vae_encoder.mlpackage/Manifest.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fileFormatVersion": "1.0.0",
3
+ "itemInfoEntries": {
4
+ "7EACD8CB-E3C8-49A1-B9FF-04B1EDACDC47": {
5
+ "author": "com.apple.CoreML",
6
+ "description": "CoreML Model Specification",
7
+ "name": "model.mlmodel",
8
+ "path": "com.apple.CoreML/model.mlmodel"
9
+ },
10
+ "86199C84-B673-4184-A06D-15D834AAA033": {
11
+ "author": "com.apple.CoreML",
12
+ "description": "CoreML Model Weights",
13
+ "name": "weights",
14
+ "path": "com.apple.CoreML/weights"
15
+ }
16
+ },
17
+ "rootModelIdentifier": "7EACD8CB-E3C8-49A1-B9FF-04B1EDACDC47"
18
+ }