pcuenq HF staff committed on
Commit
12d7ed9
1 Parent(s): f91130a

update-vae-encoder (#4)

Browse files

- Update VAE Encoder. (55e3bfa1d1814451e5a419d3efec8d4a4f3a54f6)

original/compiled/VAEEncoder.mlmodelc/analytics/coremldata.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e27fb7ebcffa0ff79c7212e1e914dbc14fddb8265b8c73d0d322a7eea4ef01e8
3
  size 207
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e47b4f8e21d3662a8c0f77eb6c760543f6f08a83b4dc3fbc9d25aa1fa0f2ab66
3
  size 207
original/compiled/VAEEncoder.mlmodelc/coremldata.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6b8cb326a2c2071e8ba0b1ef1084609061d0e86a603f55d066d25c60e04acd4a
3
- size 1272
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0896e8b3111c8950e88fbdb47c39b7c3bcee5fa5da8d3de5be91b8e6d567fc74
3
+ size 759
original/compiled/VAEEncoder.mlmodelc/metadata.json CHANGED
@@ -10,7 +10,7 @@
10
  "formattedType" : "MultiArray (Float32)",
11
  "shortDescription" : "The latent embeddings from the unet model from the input image.",
12
  "shape" : "[]",
13
- "name" : "latent_dist",
14
  "type" : "MultiArray"
15
  }
16
  ],
@@ -23,26 +23,23 @@
23
  "storagePrecision" : "Float16",
24
  "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
25
  "mlProgramOperationTypeHistogram" : {
26
- "Transpose" : 7,
27
- "Ios16.exp" : 1,
28
- "Ios16.reduceMean" : 44,
29
- "Ios16.softmax" : 1,
30
- "Split" : 1,
31
- "Ios16.linear" : 4,
32
- "Ios16.add" : 35,
33
- "Ios16.realDiv" : 22,
34
- "Ios16.square" : 22,
35
  "Pad" : 3,
36
- "Ios16.sub" : 22,
37
  "Ios16.cast" : 1,
38
- "Ios16.clip" : 1,
 
 
 
39
  "Ios16.conv" : 28,
 
 
40
  "Ios16.matmul" : 2,
41
- "Ios16.reshape" : 54,
 
 
42
  "Ios16.batchNorm" : 22,
43
- "Ios16.silu" : 21,
44
- "Ios16.sqrt" : 22,
45
- "Ios16.mul" : 6
46
  },
47
  "computePrecision" : "Mixed (Float32, Float16, Int32)",
48
  "isUpdatable" : "0",
@@ -62,55 +59,15 @@
62
  "isOptional" : "0",
63
  "dataType" : "Float16",
64
  "formattedType" : "MultiArray (Float16 1 × 3 × 512 × 512)",
65
- "shortDescription" : "An image of the correct size to create the latent space with, image2image and in-painting.",
66
  "shape" : "[1, 3, 512, 512]",
67
- "name" : "sample",
68
- "type" : "MultiArray"
69
- },
70
- {
71
- "hasShapeFlexibility" : "0",
72
- "isOptional" : "0",
73
- "dataType" : "Float16",
74
- "formattedType" : "MultiArray (Float16 1 × 4 × 64 × 64)",
75
- "shortDescription" : "Latent noise for `DiagonalGaussianDistribution` operation.",
76
- "shape" : "[1, 4, 64, 64]",
77
- "name" : "diagonal_noise",
78
- "type" : "MultiArray"
79
- },
80
- {
81
- "hasShapeFlexibility" : "0",
82
- "isOptional" : "0",
83
- "dataType" : "Float16",
84
- "formattedType" : "MultiArray (Float16 1 × 4 × 64 × 64)",
85
- "shortDescription" : "Latent noise for use with strength parameter of image2image",
86
- "shape" : "[1, 4, 64, 64]",
87
- "name" : "noise",
88
- "type" : "MultiArray"
89
- },
90
- {
91
- "hasShapeFlexibility" : "0",
92
- "isOptional" : "0",
93
- "dataType" : "Float16",
94
- "formattedType" : "MultiArray (Float16 1 × 1)",
95
- "shortDescription" : "Precalculated `sqrt_alphas_cumprod` value based on strength and the current schedular's alphasCumprod values",
96
- "shape" : "[1, 1]",
97
- "name" : "sqrt_alphas_cumprod",
98
- "type" : "MultiArray"
99
- },
100
- {
101
- "hasShapeFlexibility" : "0",
102
- "isOptional" : "0",
103
- "dataType" : "Float16",
104
- "formattedType" : "MultiArray (Float16 1 × 1)",
105
- "shortDescription" : "Precalculated `sqrt_one_minus_alphas_cumprod` value based on strength and the current schedular's alphasCumprod values",
106
- "shape" : "[1, 1]",
107
- "name" : "sqrt_one_minus_alphas_cumprod",
108
  "type" : "MultiArray"
109
  }
110
  ],
111
  "userDefinedMetadata" : {
112
- "com.github.apple.coremltools.version" : "6.1",
113
- "com.github.apple.coremltools.source" : "torch==1.13.0"
114
  },
115
  "generatedClassName" : "Stable_Diffusion_version_CompVis_stable_diffusion_v1_4_vae_encoder",
116
  "method" : "predict"
 
10
  "formattedType" : "MultiArray (Float32)",
11
  "shortDescription" : "The latent embeddings from the unet model from the input image.",
12
  "shape" : "[]",
13
+ "name" : "latent",
14
  "type" : "MultiArray"
15
  }
16
  ],
 
23
  "storagePrecision" : "Float16",
24
  "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
25
  "mlProgramOperationTypeHistogram" : {
 
 
 
 
 
 
 
 
 
26
  "Pad" : 3,
 
27
  "Ios16.cast" : 1,
28
+ "Ios16.mul" : 1,
29
+ "Ios16.sqrt" : 22,
30
+ "Ios16.sub" : 22,
31
+ "Transpose" : 7,
32
  "Ios16.conv" : 28,
33
+ "Ios16.add" : 33,
34
+ "Ios16.linear" : 4,
35
  "Ios16.matmul" : 2,
36
+ "Ios16.realDiv" : 22,
37
+ "Ios16.reduceMean" : 44,
38
+ "Ios16.softmax" : 1,
39
  "Ios16.batchNorm" : 22,
40
+ "Ios16.square" : 22,
41
+ "Ios16.reshape" : 54,
42
+ "Ios16.silu" : 21
43
  },
44
  "computePrecision" : "Mixed (Float32, Float16, Int32)",
45
  "isUpdatable" : "0",
 
59
  "isOptional" : "0",
60
  "dataType" : "Float16",
61
  "formattedType" : "MultiArray (Float16 1 × 3 × 512 × 512)",
62
+ "shortDescription" : "The input image to base the initial latents on normalized to range [-1, 1]",
63
  "shape" : "[1, 3, 512, 512]",
64
+ "name" : "z",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
65
  "type" : "MultiArray"
66
  }
67
  ],
68
  "userDefinedMetadata" : {
69
+ "com.github.apple.coremltools.version" : "6.3.0",
70
+ "com.github.apple.coremltools.source" : "torch==2.0.0"
71
  },
72
  "generatedClassName" : "Stable_Diffusion_version_CompVis_stable_diffusion_v1_4_vae_encoder",
73
  "method" : "predict"
original/compiled/VAEEncoder.mlmodelc/model.mil CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:823a50e22d4989acd5247f33e8cc52e0caf5dbceec978fe76f6a5dd9759c2c7f
3
- size 137752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d33d5d475d2457cb48abae239a2ba0a6ff14a6fa344633e4866c74c6f7907724
3
+ size 135576
original/compiled/VAEEncoder.mlmodelc/weights/weight.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:edc9a37ae7f0c7b1696798514fa2224d183e5154356a356c0975acb6e9e7bba6
3
  size 68370240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:527539d44d78d725c785dff135c1fb1529908f67069e5ed71bafd56e74a60493
3
  size 68370240
original/packages/Stable_Diffusion_version_CompVis_stable-diffusion-v1-4_vae_encoder.mlpackage/Data/com.apple.CoreML/model.mlmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6269f295fe1eef3d3194186afbf56d932b399d528663ff95fc56cfdf1885d015
3
- size 117448
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2b68542ca85526d3d48e17f04ac406b9c2f5879dfa54fe39c7981bb41ab7cd9
3
+ size 114902
original/packages/Stable_Diffusion_version_CompVis_stable-diffusion-v1-4_vae_encoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:edc9a37ae7f0c7b1696798514fa2224d183e5154356a356c0975acb6e9e7bba6
3
  size 68370240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:527539d44d78d725c785dff135c1fb1529908f67069e5ed71bafd56e74a60493
3
  size 68370240
original/packages/Stable_Diffusion_version_CompVis_stable-diffusion-v1-4_vae_encoder.mlpackage/Manifest.json CHANGED
@@ -1,18 +1,18 @@
1
  {
2
  "fileFormatVersion": "1.0.0",
3
  "itemInfoEntries": {
4
- "572B88FB-BD8C-4BB2-94A9-59BBAA98B7E6": {
5
- "author": "com.apple.CoreML",
6
- "description": "CoreML Model Weights",
7
- "name": "weights",
8
- "path": "com.apple.CoreML/weights"
9
- },
10
- "908BDF53-CD61-4E50-821B-0721632446FB": {
11
  "author": "com.apple.CoreML",
12
  "description": "CoreML Model Specification",
13
  "name": "model.mlmodel",
14
  "path": "com.apple.CoreML/model.mlmodel"
 
 
 
 
 
 
15
  }
16
  },
17
- "rootModelIdentifier": "908BDF53-CD61-4E50-821B-0721632446FB"
18
  }
 
1
  {
2
  "fileFormatVersion": "1.0.0",
3
  "itemInfoEntries": {
4
+ "4AC76ED5-4FE2-4025-A4F9-190A8B2EFE35": {
 
 
 
 
 
 
5
  "author": "com.apple.CoreML",
6
  "description": "CoreML Model Specification",
7
  "name": "model.mlmodel",
8
  "path": "com.apple.CoreML/model.mlmodel"
9
+ },
10
+ "E3770AC4-12AE-42B0-8181-C0F84452E3D3": {
11
+ "author": "com.apple.CoreML",
12
+ "description": "CoreML Model Weights",
13
+ "name": "weights",
14
+ "path": "com.apple.CoreML/weights"
15
  }
16
  },
17
+ "rootModelIdentifier": "4AC76ED5-4FE2-4025-A4F9-190A8B2EFE35"
18
  }
split_einsum/compiled/VAEEncoder.mlmodelc/analytics/coremldata.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e27fb7ebcffa0ff79c7212e1e914dbc14fddb8265b8c73d0d322a7eea4ef01e8
3
  size 207
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e47b4f8e21d3662a8c0f77eb6c760543f6f08a83b4dc3fbc9d25aa1fa0f2ab66
3
  size 207
split_einsum/compiled/VAEEncoder.mlmodelc/coremldata.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6a8053f3c4f3cebb592d42dd6e2dad8758c4c40417c8552424faf74c9986fe3f
3
- size 1272
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0896e8b3111c8950e88fbdb47c39b7c3bcee5fa5da8d3de5be91b8e6d567fc74
3
+ size 759
split_einsum/compiled/VAEEncoder.mlmodelc/metadata.json CHANGED
@@ -10,7 +10,7 @@
10
  "formattedType" : "MultiArray (Float32)",
11
  "shortDescription" : "The latent embeddings from the unet model from the input image.",
12
  "shape" : "[]",
13
- "name" : "latent_dist",
14
  "type" : "MultiArray"
15
  }
16
  ],
@@ -23,26 +23,23 @@
23
  "storagePrecision" : "Float16",
24
  "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
25
  "mlProgramOperationTypeHistogram" : {
26
- "Transpose" : 7,
27
- "Ios16.exp" : 1,
28
- "Ios16.reduceMean" : 44,
29
- "Ios16.softmax" : 1,
30
- "Split" : 1,
31
- "Ios16.linear" : 4,
32
- "Ios16.add" : 35,
33
- "Ios16.realDiv" : 22,
34
- "Ios16.square" : 22,
35
  "Pad" : 3,
36
- "Ios16.sub" : 22,
37
  "Ios16.cast" : 1,
38
- "Ios16.clip" : 1,
 
 
 
39
  "Ios16.conv" : 28,
 
 
40
  "Ios16.matmul" : 2,
41
- "Ios16.reshape" : 54,
 
 
42
  "Ios16.batchNorm" : 22,
43
- "Ios16.silu" : 21,
44
- "Ios16.sqrt" : 22,
45
- "Ios16.mul" : 6
46
  },
47
  "computePrecision" : "Mixed (Float32, Float16, Int32)",
48
  "isUpdatable" : "0",
@@ -62,55 +59,15 @@
62
  "isOptional" : "0",
63
  "dataType" : "Float16",
64
  "formattedType" : "MultiArray (Float16 1 × 3 × 512 × 512)",
65
- "shortDescription" : "An image of the correct size to create the latent space with, image2image and in-painting.",
66
  "shape" : "[1, 3, 512, 512]",
67
- "name" : "sample",
68
- "type" : "MultiArray"
69
- },
70
- {
71
- "hasShapeFlexibility" : "0",
72
- "isOptional" : "0",
73
- "dataType" : "Float16",
74
- "formattedType" : "MultiArray (Float16 1 × 4 × 64 × 64)",
75
- "shortDescription" : "Latent noise for `DiagonalGaussianDistribution` operation.",
76
- "shape" : "[1, 4, 64, 64]",
77
- "name" : "diagonal_noise",
78
- "type" : "MultiArray"
79
- },
80
- {
81
- "hasShapeFlexibility" : "0",
82
- "isOptional" : "0",
83
- "dataType" : "Float16",
84
- "formattedType" : "MultiArray (Float16 1 × 4 × 64 × 64)",
85
- "shortDescription" : "Latent noise for use with strength parameter of image2image",
86
- "shape" : "[1, 4, 64, 64]",
87
- "name" : "noise",
88
- "type" : "MultiArray"
89
- },
90
- {
91
- "hasShapeFlexibility" : "0",
92
- "isOptional" : "0",
93
- "dataType" : "Float16",
94
- "formattedType" : "MultiArray (Float16 1 × 1)",
95
- "shortDescription" : "Precalculated `sqrt_alphas_cumprod` value based on strength and the current schedular's alphasCumprod values",
96
- "shape" : "[1, 1]",
97
- "name" : "sqrt_alphas_cumprod",
98
- "type" : "MultiArray"
99
- },
100
- {
101
- "hasShapeFlexibility" : "0",
102
- "isOptional" : "0",
103
- "dataType" : "Float16",
104
- "formattedType" : "MultiArray (Float16 1 × 1)",
105
- "shortDescription" : "Precalculated `sqrt_one_minus_alphas_cumprod` value based on strength and the current schedular's alphasCumprod values",
106
- "shape" : "[1, 1]",
107
- "name" : "sqrt_one_minus_alphas_cumprod",
108
  "type" : "MultiArray"
109
  }
110
  ],
111
  "userDefinedMetadata" : {
112
- "com.github.apple.coremltools.version" : "6.1",
113
- "com.github.apple.coremltools.source" : "torch==1.13.0"
114
  },
115
  "generatedClassName" : "Stable_Diffusion_version_CompVis_stable_diffusion_v1_4_vae_encoder",
116
  "method" : "predict"
 
10
  "formattedType" : "MultiArray (Float32)",
11
  "shortDescription" : "The latent embeddings from the unet model from the input image.",
12
  "shape" : "[]",
13
+ "name" : "latent",
14
  "type" : "MultiArray"
15
  }
16
  ],
 
23
  "storagePrecision" : "Float16",
24
  "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
25
  "mlProgramOperationTypeHistogram" : {
 
 
 
 
 
 
 
 
 
26
  "Pad" : 3,
 
27
  "Ios16.cast" : 1,
28
+ "Ios16.mul" : 1,
29
+ "Ios16.sqrt" : 22,
30
+ "Ios16.sub" : 22,
31
+ "Transpose" : 7,
32
  "Ios16.conv" : 28,
33
+ "Ios16.add" : 33,
34
+ "Ios16.linear" : 4,
35
  "Ios16.matmul" : 2,
36
+ "Ios16.realDiv" : 22,
37
+ "Ios16.reduceMean" : 44,
38
+ "Ios16.softmax" : 1,
39
  "Ios16.batchNorm" : 22,
40
+ "Ios16.square" : 22,
41
+ "Ios16.reshape" : 54,
42
+ "Ios16.silu" : 21
43
  },
44
  "computePrecision" : "Mixed (Float32, Float16, Int32)",
45
  "isUpdatable" : "0",
 
59
  "isOptional" : "0",
60
  "dataType" : "Float16",
61
  "formattedType" : "MultiArray (Float16 1 × 3 × 512 × 512)",
62
+ "shortDescription" : "The input image to base the initial latents on normalized to range [-1, 1]",
63
  "shape" : "[1, 3, 512, 512]",
64
+ "name" : "z",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
65
  "type" : "MultiArray"
66
  }
67
  ],
68
  "userDefinedMetadata" : {
69
+ "com.github.apple.coremltools.version" : "6.3.0",
70
+ "com.github.apple.coremltools.source" : "torch==2.0.0"
71
  },
72
  "generatedClassName" : "Stable_Diffusion_version_CompVis_stable_diffusion_v1_4_vae_encoder",
73
  "method" : "predict"
split_einsum/compiled/VAEEncoder.mlmodelc/model.mil CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:823a50e22d4989acd5247f33e8cc52e0caf5dbceec978fe76f6a5dd9759c2c7f
3
- size 137752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d33d5d475d2457cb48abae239a2ba0a6ff14a6fa344633e4866c74c6f7907724
3
+ size 135576
split_einsum/compiled/VAEEncoder.mlmodelc/weights/weight.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2604aac03e12dde2d56b35a7d2f6c3275860b049ea2dedd75426c2a5c3a6c667
3
  size 68370240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:527539d44d78d725c785dff135c1fb1529908f67069e5ed71bafd56e74a60493
3
  size 68370240
split_einsum/packages/Stable_Diffusion_version_CompVis_stable-diffusion-v1-4_vae_encoder.mlpackage/Data/com.apple.CoreML/model.mlmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6269f295fe1eef3d3194186afbf56d932b399d528663ff95fc56cfdf1885d015
3
- size 117448
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2b68542ca85526d3d48e17f04ac406b9c2f5879dfa54fe39c7981bb41ab7cd9
3
+ size 114902
split_einsum/packages/Stable_Diffusion_version_CompVis_stable-diffusion-v1-4_vae_encoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2604aac03e12dde2d56b35a7d2f6c3275860b049ea2dedd75426c2a5c3a6c667
3
  size 68370240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:527539d44d78d725c785dff135c1fb1529908f67069e5ed71bafd56e74a60493
3
  size 68370240
split_einsum/packages/Stable_Diffusion_version_CompVis_stable-diffusion-v1-4_vae_encoder.mlpackage/Manifest.json CHANGED
@@ -1,18 +1,18 @@
1
  {
2
  "fileFormatVersion": "1.0.0",
3
  "itemInfoEntries": {
4
- "73F723E9-BBE9-40B7-8113-8FCA8733A20D": {
5
  "author": "com.apple.CoreML",
6
  "description": "CoreML Model Specification",
7
  "name": "model.mlmodel",
8
  "path": "com.apple.CoreML/model.mlmodel"
9
  },
10
- "DEB5F935-76BB-4FD1-BBD6-968993E96111": {
11
  "author": "com.apple.CoreML",
12
  "description": "CoreML Model Weights",
13
  "name": "weights",
14
  "path": "com.apple.CoreML/weights"
15
  }
16
  },
17
- "rootModelIdentifier": "73F723E9-BBE9-40B7-8113-8FCA8733A20D"
18
  }
 
1
  {
2
  "fileFormatVersion": "1.0.0",
3
  "itemInfoEntries": {
4
+ "4AC76ED5-4FE2-4025-A4F9-190A8B2EFE35": {
5
  "author": "com.apple.CoreML",
6
  "description": "CoreML Model Specification",
7
  "name": "model.mlmodel",
8
  "path": "com.apple.CoreML/model.mlmodel"
9
  },
10
+ "E3770AC4-12AE-42B0-8181-C0F84452E3D3": {
11
  "author": "com.apple.CoreML",
12
  "description": "CoreML Model Weights",
13
  "name": "weights",
14
  "path": "com.apple.CoreML/weights"
15
  }
16
  },
17
+ "rootModelIdentifier": "4AC76ED5-4FE2-4025-A4F9-190A8B2EFE35"
18
  }