Text-to-Image
Core ML
stable-diffusion
core-ml
pcuenq HF staff committed on
Commit
abea076
1 Parent(s): a8bfcd1

Update VAE Encoder.

Browse files

See https://github.com/apple/ml-stable-diffusion/issues/176

original/compiled/VAEEncoder.mlmodelc/analytics/coremldata.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eee76fbae1fa08a0d7bd18b2eb1f0324f9fdba01656f441a3e8357f08bb6345a
3
  size 207
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:132c6d52eacfe75bf06faebc63ba323965841e05c77b1c5e6158491100d96bd9
3
  size 207
original/compiled/VAEEncoder.mlmodelc/coremldata.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:854e552c6e9273ef52b93a0fd2013399421450f497fcd327eb8aa371a2e5f46d
3
- size 1284
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ac1e4a8ea5cfe3a02d26fff80894c8eee09248a0776be6dd55aab7d44d97d1b
3
+ size 771
original/compiled/VAEEncoder.mlmodelc/metadata.json CHANGED
@@ -10,7 +10,7 @@
10
  "formattedType" : "MultiArray (Float32)",
11
  "shortDescription" : "The latent embeddings from the unet model from the input image.",
12
  "shape" : "[]",
13
- "name" : "latent_dist",
14
  "type" : "MultiArray"
15
  }
16
  ],
@@ -23,26 +23,23 @@
23
  "storagePrecision" : "Float16",
24
  "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
25
  "mlProgramOperationTypeHistogram" : {
26
- "Transpose" : 7,
27
- "Ios16.exp" : 1,
28
- "Ios16.reduceMean" : 44,
29
- "Ios16.softmax" : 1,
30
- "Split" : 1,
31
- "Ios16.linear" : 4,
32
- "Ios16.add" : 35,
33
- "Ios16.realDiv" : 22,
34
- "Ios16.square" : 22,
35
  "Pad" : 3,
36
- "Ios16.sub" : 22,
37
  "Ios16.cast" : 1,
38
- "Ios16.clip" : 1,
 
 
 
39
  "Ios16.conv" : 28,
 
 
40
  "Ios16.matmul" : 2,
41
- "Ios16.reshape" : 54,
 
 
42
  "Ios16.batchNorm" : 22,
43
- "Ios16.silu" : 21,
44
- "Ios16.sqrt" : 22,
45
- "Ios16.mul" : 6
46
  },
47
  "computePrecision" : "Mixed (Float32, Float16, Int32)",
48
  "isUpdatable" : "0",
@@ -62,55 +59,15 @@
62
  "isOptional" : "0",
63
  "dataType" : "Float16",
64
  "formattedType" : "MultiArray (Float16 1 × 3 × 512 × 512)",
65
- "shortDescription" : "An image of the correct size to create the latent space with, image2image and in-painting.",
66
  "shape" : "[1, 3, 512, 512]",
67
- "name" : "sample",
68
- "type" : "MultiArray"
69
- },
70
- {
71
- "hasShapeFlexibility" : "0",
72
- "isOptional" : "0",
73
- "dataType" : "Float16",
74
- "formattedType" : "MultiArray (Float16 1 × 4 × 64 × 64)",
75
- "shortDescription" : "Latent noise for `DiagonalGaussianDistribution` operation.",
76
- "shape" : "[1, 4, 64, 64]",
77
- "name" : "diagonal_noise",
78
- "type" : "MultiArray"
79
- },
80
- {
81
- "hasShapeFlexibility" : "0",
82
- "isOptional" : "0",
83
- "dataType" : "Float16",
84
- "formattedType" : "MultiArray (Float16 1 × 4 × 64 × 64)",
85
- "shortDescription" : "Latent noise for use with strength parameter of image2image",
86
- "shape" : "[1, 4, 64, 64]",
87
- "name" : "noise",
88
- "type" : "MultiArray"
89
- },
90
- {
91
- "hasShapeFlexibility" : "0",
92
- "isOptional" : "0",
93
- "dataType" : "Float16",
94
- "formattedType" : "MultiArray (Float16 1 × 1)",
95
- "shortDescription" : "Precalculated `sqrt_alphas_cumprod` value based on strength and the current schedular's alphasCumprod values",
96
- "shape" : "[1, 1]",
97
- "name" : "sqrt_alphas_cumprod",
98
- "type" : "MultiArray"
99
- },
100
- {
101
- "hasShapeFlexibility" : "0",
102
- "isOptional" : "0",
103
- "dataType" : "Float16",
104
- "formattedType" : "MultiArray (Float16 1 × 1)",
105
- "shortDescription" : "Precalculated `sqrt_one_minus_alphas_cumprod` value based on strength and the current schedular's alphasCumprod values",
106
- "shape" : "[1, 1]",
107
- "name" : "sqrt_one_minus_alphas_cumprod",
108
  "type" : "MultiArray"
109
  }
110
  ],
111
  "userDefinedMetadata" : {
112
- "com.github.apple.coremltools.version" : "6.1",
113
- "com.github.apple.coremltools.source" : "torch==1.13.1"
114
  },
115
  "generatedClassName" : "Stable_Diffusion_version_stabilityai_stable_diffusion_2_base_vae_encoder",
116
  "method" : "predict"
 
10
  "formattedType" : "MultiArray (Float32)",
11
  "shortDescription" : "The latent embeddings from the unet model from the input image.",
12
  "shape" : "[]",
13
+ "name" : "latent",
14
  "type" : "MultiArray"
15
  }
16
  ],
 
23
  "storagePrecision" : "Float16",
24
  "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
25
  "mlProgramOperationTypeHistogram" : {
 
 
 
 
 
 
 
 
 
26
  "Pad" : 3,
 
27
  "Ios16.cast" : 1,
28
+ "Ios16.mul" : 1,
29
+ "Ios16.sqrt" : 22,
30
+ "Ios16.sub" : 22,
31
+ "Transpose" : 7,
32
  "Ios16.conv" : 28,
33
+ "Ios16.add" : 33,
34
+ "Ios16.linear" : 4,
35
  "Ios16.matmul" : 2,
36
+ "Ios16.realDiv" : 22,
37
+ "Ios16.reduceMean" : 44,
38
+ "Ios16.softmax" : 1,
39
  "Ios16.batchNorm" : 22,
40
+ "Ios16.square" : 22,
41
+ "Ios16.reshape" : 54,
42
+ "Ios16.silu" : 21
43
  },
44
  "computePrecision" : "Mixed (Float32, Float16, Int32)",
45
  "isUpdatable" : "0",
 
59
  "isOptional" : "0",
60
  "dataType" : "Float16",
61
  "formattedType" : "MultiArray (Float16 1 × 3 × 512 × 512)",
62
+ "shortDescription" : "The input image to base the initial latents on normalized to range [-1, 1]",
63
  "shape" : "[1, 3, 512, 512]",
64
+ "name" : "z",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
65
  "type" : "MultiArray"
66
  }
67
  ],
68
  "userDefinedMetadata" : {
69
+ "com.github.apple.coremltools.version" : "6.3.0",
70
+ "com.github.apple.coremltools.source" : "torch==2.0.0"
71
  },
72
  "generatedClassName" : "Stable_Diffusion_version_stabilityai_stable_diffusion_2_base_vae_encoder",
73
  "method" : "predict"
original/compiled/VAEEncoder.mlmodelc/model.mil CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3cd529b933adc7e28b4057051eb816d753241246416bceacf25eb844e2b64d4a
3
- size 137752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d33d5d475d2457cb48abae239a2ba0a6ff14a6fa344633e4866c74c6f7907724
3
+ size 135576
original/compiled/VAEEncoder.mlmodelc/weights/weight.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3b7ad3fbf4898564c46e08732ce223712961270064549b06bdc95ec22a6e88b1
3
  size 68370240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:069f194d78e0893a066afb3805726f4e28d13538f2168204008530e9d9774ee2
3
  size 68370240
original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-base_vae_encoder.mlpackage/Data/com.apple.CoreML/model.mlmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:69544ea13c1a7b3115c01eb2e775a10136832d6ff91a074faf11b75f241d726c
3
- size 117460
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d148321b3515119341c54be79906feeaeb15e04e90368fab9ab434ad8ac8017e
3
+ size 114914
original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-base_vae_encoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3b7ad3fbf4898564c46e08732ce223712961270064549b06bdc95ec22a6e88b1
3
  size 68370240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:069f194d78e0893a066afb3805726f4e28d13538f2168204008530e9d9774ee2
3
  size 68370240
original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-base_vae_encoder.mlpackage/Manifest.json CHANGED
@@ -1,18 +1,18 @@
1
  {
2
  "fileFormatVersion": "1.0.0",
3
  "itemInfoEntries": {
4
- "38BC24FA-2978-4B03-AF04-231A43CBF74C": {
5
  "author": "com.apple.CoreML",
6
  "description": "CoreML Model Weights",
7
  "name": "weights",
8
  "path": "com.apple.CoreML/weights"
9
  },
10
- "4627B776-3BCE-4766-960C-5877AC8F5A80": {
11
  "author": "com.apple.CoreML",
12
  "description": "CoreML Model Specification",
13
  "name": "model.mlmodel",
14
  "path": "com.apple.CoreML/model.mlmodel"
15
  }
16
  },
17
- "rootModelIdentifier": "4627B776-3BCE-4766-960C-5877AC8F5A80"
18
  }
 
1
  {
2
  "fileFormatVersion": "1.0.0",
3
  "itemInfoEntries": {
4
+ "08A44175-364B-4515-AA88-70B20EC944C2": {
5
  "author": "com.apple.CoreML",
6
  "description": "CoreML Model Weights",
7
  "name": "weights",
8
  "path": "com.apple.CoreML/weights"
9
  },
10
+ "9E280C88-8CAA-4EEA-986E-E04DA7E31BF6": {
11
  "author": "com.apple.CoreML",
12
  "description": "CoreML Model Specification",
13
  "name": "model.mlmodel",
14
  "path": "com.apple.CoreML/model.mlmodel"
15
  }
16
  },
17
+ "rootModelIdentifier": "9E280C88-8CAA-4EEA-986E-E04DA7E31BF6"
18
  }
split_einsum/compiled/VAEEncoder.mlmodelc/analytics/coremldata.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eee76fbae1fa08a0d7bd18b2eb1f0324f9fdba01656f441a3e8357f08bb6345a
3
  size 207
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:132c6d52eacfe75bf06faebc63ba323965841e05c77b1c5e6158491100d96bd9
3
  size 207
split_einsum/compiled/VAEEncoder.mlmodelc/coremldata.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:854e552c6e9273ef52b93a0fd2013399421450f497fcd327eb8aa371a2e5f46d
3
- size 1284
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ac1e4a8ea5cfe3a02d26fff80894c8eee09248a0776be6dd55aab7d44d97d1b
3
+ size 771
split_einsum/compiled/VAEEncoder.mlmodelc/metadata.json CHANGED
@@ -10,7 +10,7 @@
10
  "formattedType" : "MultiArray (Float32)",
11
  "shortDescription" : "The latent embeddings from the unet model from the input image.",
12
  "shape" : "[]",
13
- "name" : "latent_dist",
14
  "type" : "MultiArray"
15
  }
16
  ],
@@ -23,26 +23,23 @@
23
  "storagePrecision" : "Float16",
24
  "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
25
  "mlProgramOperationTypeHistogram" : {
26
- "Transpose" : 7,
27
- "Ios16.exp" : 1,
28
- "Ios16.reduceMean" : 44,
29
- "Ios16.softmax" : 1,
30
- "Split" : 1,
31
- "Ios16.linear" : 4,
32
- "Ios16.add" : 35,
33
- "Ios16.realDiv" : 22,
34
- "Ios16.square" : 22,
35
  "Pad" : 3,
36
- "Ios16.sub" : 22,
37
  "Ios16.cast" : 1,
38
- "Ios16.clip" : 1,
 
 
 
39
  "Ios16.conv" : 28,
 
 
40
  "Ios16.matmul" : 2,
41
- "Ios16.reshape" : 54,
 
 
42
  "Ios16.batchNorm" : 22,
43
- "Ios16.silu" : 21,
44
- "Ios16.sqrt" : 22,
45
- "Ios16.mul" : 6
46
  },
47
  "computePrecision" : "Mixed (Float32, Float16, Int32)",
48
  "isUpdatable" : "0",
@@ -62,55 +59,15 @@
62
  "isOptional" : "0",
63
  "dataType" : "Float16",
64
  "formattedType" : "MultiArray (Float16 1 × 3 × 512 × 512)",
65
- "shortDescription" : "An image of the correct size to create the latent space with, image2image and in-painting.",
66
  "shape" : "[1, 3, 512, 512]",
67
- "name" : "sample",
68
- "type" : "MultiArray"
69
- },
70
- {
71
- "hasShapeFlexibility" : "0",
72
- "isOptional" : "0",
73
- "dataType" : "Float16",
74
- "formattedType" : "MultiArray (Float16 1 × 4 × 64 × 64)",
75
- "shortDescription" : "Latent noise for `DiagonalGaussianDistribution` operation.",
76
- "shape" : "[1, 4, 64, 64]",
77
- "name" : "diagonal_noise",
78
- "type" : "MultiArray"
79
- },
80
- {
81
- "hasShapeFlexibility" : "0",
82
- "isOptional" : "0",
83
- "dataType" : "Float16",
84
- "formattedType" : "MultiArray (Float16 1 × 4 × 64 × 64)",
85
- "shortDescription" : "Latent noise for use with strength parameter of image2image",
86
- "shape" : "[1, 4, 64, 64]",
87
- "name" : "noise",
88
- "type" : "MultiArray"
89
- },
90
- {
91
- "hasShapeFlexibility" : "0",
92
- "isOptional" : "0",
93
- "dataType" : "Float16",
94
- "formattedType" : "MultiArray (Float16 1 × 1)",
95
- "shortDescription" : "Precalculated `sqrt_alphas_cumprod` value based on strength and the current schedular's alphasCumprod values",
96
- "shape" : "[1, 1]",
97
- "name" : "sqrt_alphas_cumprod",
98
- "type" : "MultiArray"
99
- },
100
- {
101
- "hasShapeFlexibility" : "0",
102
- "isOptional" : "0",
103
- "dataType" : "Float16",
104
- "formattedType" : "MultiArray (Float16 1 × 1)",
105
- "shortDescription" : "Precalculated `sqrt_one_minus_alphas_cumprod` value based on strength and the current schedular's alphasCumprod values",
106
- "shape" : "[1, 1]",
107
- "name" : "sqrt_one_minus_alphas_cumprod",
108
  "type" : "MultiArray"
109
  }
110
  ],
111
  "userDefinedMetadata" : {
112
- "com.github.apple.coremltools.version" : "6.1",
113
- "com.github.apple.coremltools.source" : "torch==1.13.1"
114
  },
115
  "generatedClassName" : "Stable_Diffusion_version_stabilityai_stable_diffusion_2_base_vae_encoder",
116
  "method" : "predict"
 
10
  "formattedType" : "MultiArray (Float32)",
11
  "shortDescription" : "The latent embeddings from the unet model from the input image.",
12
  "shape" : "[]",
13
+ "name" : "latent",
14
  "type" : "MultiArray"
15
  }
16
  ],
 
23
  "storagePrecision" : "Float16",
24
  "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
25
  "mlProgramOperationTypeHistogram" : {
 
 
 
 
 
 
 
 
 
26
  "Pad" : 3,
 
27
  "Ios16.cast" : 1,
28
+ "Ios16.mul" : 1,
29
+ "Ios16.sqrt" : 22,
30
+ "Ios16.sub" : 22,
31
+ "Transpose" : 7,
32
  "Ios16.conv" : 28,
33
+ "Ios16.add" : 33,
34
+ "Ios16.linear" : 4,
35
  "Ios16.matmul" : 2,
36
+ "Ios16.realDiv" : 22,
37
+ "Ios16.reduceMean" : 44,
38
+ "Ios16.softmax" : 1,
39
  "Ios16.batchNorm" : 22,
40
+ "Ios16.square" : 22,
41
+ "Ios16.reshape" : 54,
42
+ "Ios16.silu" : 21
43
  },
44
  "computePrecision" : "Mixed (Float32, Float16, Int32)",
45
  "isUpdatable" : "0",
 
59
  "isOptional" : "0",
60
  "dataType" : "Float16",
61
  "formattedType" : "MultiArray (Float16 1 × 3 × 512 × 512)",
62
+ "shortDescription" : "The input image to base the initial latents on normalized to range [-1, 1]",
63
  "shape" : "[1, 3, 512, 512]",
64
+ "name" : "z",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
65
  "type" : "MultiArray"
66
  }
67
  ],
68
  "userDefinedMetadata" : {
69
+ "com.github.apple.coremltools.version" : "6.3.0",
70
+ "com.github.apple.coremltools.source" : "torch==2.0.0"
71
  },
72
  "generatedClassName" : "Stable_Diffusion_version_stabilityai_stable_diffusion_2_base_vae_encoder",
73
  "method" : "predict"
split_einsum/compiled/VAEEncoder.mlmodelc/model.mil CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3cd529b933adc7e28b4057051eb816d753241246416bceacf25eb844e2b64d4a
3
- size 137752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d33d5d475d2457cb48abae239a2ba0a6ff14a6fa344633e4866c74c6f7907724
3
+ size 135576
split_einsum/compiled/VAEEncoder.mlmodelc/weights/weight.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5061f127d29e767db8e4703bdfaf6cf2e944d5d8a27e807c78828496de3ce267
3
  size 68370240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:069f194d78e0893a066afb3805726f4e28d13538f2168204008530e9d9774ee2
3
  size 68370240
split_einsum/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-base_vae_encoder.mlpackage/Data/com.apple.CoreML/model.mlmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:69544ea13c1a7b3115c01eb2e775a10136832d6ff91a074faf11b75f241d726c
3
- size 117460
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d148321b3515119341c54be79906feeaeb15e04e90368fab9ab434ad8ac8017e
3
+ size 114914
split_einsum/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-base_vae_encoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5061f127d29e767db8e4703bdfaf6cf2e944d5d8a27e807c78828496de3ce267
3
  size 68370240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:069f194d78e0893a066afb3805726f4e28d13538f2168204008530e9d9774ee2
3
  size 68370240
split_einsum/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-base_vae_encoder.mlpackage/Manifest.json CHANGED
@@ -1,18 +1,18 @@
1
  {
2
  "fileFormatVersion": "1.0.0",
3
  "itemInfoEntries": {
4
- "260E53C9-7E53-4C87-9FA8-161CC0D21FDF": {
5
- "author": "com.apple.CoreML",
6
- "description": "CoreML Model Specification",
7
- "name": "model.mlmodel",
8
- "path": "com.apple.CoreML/model.mlmodel"
9
- },
10
- "70A48119-9715-487C-9953-FCA2BCE32D24": {
11
  "author": "com.apple.CoreML",
12
  "description": "CoreML Model Weights",
13
  "name": "weights",
14
  "path": "com.apple.CoreML/weights"
 
 
 
 
 
 
15
  }
16
  },
17
- "rootModelIdentifier": "260E53C9-7E53-4C87-9FA8-161CC0D21FDF"
18
  }
 
1
  {
2
  "fileFormatVersion": "1.0.0",
3
  "itemInfoEntries": {
4
+ "08A44175-364B-4515-AA88-70B20EC944C2": {
 
 
 
 
 
 
5
  "author": "com.apple.CoreML",
6
  "description": "CoreML Model Weights",
7
  "name": "weights",
8
  "path": "com.apple.CoreML/weights"
9
+ },
10
+ "9E280C88-8CAA-4EEA-986E-E04DA7E31BF6": {
11
+ "author": "com.apple.CoreML",
12
+ "description": "CoreML Model Specification",
13
+ "name": "model.mlmodel",
14
+ "path": "com.apple.CoreML/model.mlmodel"
15
  }
16
  },
17
+ "rootModelIdentifier": "9E280C88-8CAA-4EEA-986E-E04DA7E31BF6"
18
  }