Vishnou committed on
Commit
5aaf3a3
1 Parent(s): 7a6624b

Upload folder using huggingface_hub

Browse files
.DS_Store ADDED
Binary file (6.15 kB). View file
 
TextEncoder.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8dac4ccc46f3c5e8ffa0a19511039b8ceadd239791fabb5623b822bce8063275
3
+ size 243
TextEncoder.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13e580e4ef472512859174485e27ab173759522d91e225a1db35ceee09acae66
3
+ size 848
TextEncoder.mlmodelc/metadata.json ADDED
@@ -0,0 +1,84 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
4
+ "metadataOutputVersion" : "3.0",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float32",
10
+ "formattedType" : "MultiArray (Float32 1 × 77 × 1024)",
11
+ "shortDescription" : "The token embeddings as encoded by the Transformer model",
12
+ "shape" : "[1, 77, 1024]",
13
+ "name" : "last_hidden_state",
14
+ "type" : "MultiArray"
15
+ },
16
+ {
17
+ "hasShapeFlexibility" : "0",
18
+ "isOptional" : "0",
19
+ "dataType" : "Float32",
20
+ "formattedType" : "MultiArray (Float32 1 × 1024)",
21
+ "shortDescription" : "The version of the `last_hidden_state` output after pooling",
22
+ "shape" : "[1, 1024]",
23
+ "name" : "pooled_outputs",
24
+ "type" : "MultiArray"
25
+ }
26
+ ],
27
+ "version" : "stabilityai\/stable-diffusion-2-1-base",
28
+ "modelParameters" : [
29
+
30
+ ],
31
+ "author" : "Please refer to the Model Card available at huggingface.co\/stabilityai\/stable-diffusion-2-1-base",
32
+ "specificationVersion" : 7,
33
+ "storagePrecision" : "Mixed (Float16, Palettized (2 bits))",
34
+ "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
35
+ "mlProgramOperationTypeHistogram" : {
36
+ "Ios16.cast" : 3,
37
+ "Ios16.mul" : 23,
38
+ "Ios16.layerNorm" : 47,
39
+ "Ios16.constexprLutToDense" : 163,
40
+ "Stack" : 1,
41
+ "Transpose" : 115,
42
+ "Ios16.linear" : 138,
43
+ "Ios16.add" : 70,
44
+ "Ios16.matmul" : 46,
45
+ "Ios16.gelu" : 23,
46
+ "Ios16.softmax" : 23,
47
+ "Ios16.gatherNd" : 1,
48
+ "Ios16.gather" : 1,
49
+ "Ios16.reshape" : 230,
50
+ "Ios16.reduceArgmax" : 1
51
+ },
52
+ "computePrecision" : "Mixed (Float16, Float32, Int32)",
53
+ "isUpdatable" : "0",
54
+ "availability" : {
55
+ "macOS" : "13.0",
56
+ "tvOS" : "16.0",
57
+ "visionOS" : "1.0",
58
+ "watchOS" : "9.0",
59
+ "iOS" : "16.0",
60
+ "macCatalyst" : "16.0"
61
+ },
62
+ "modelType" : {
63
+ "name" : "MLModelType_mlProgram"
64
+ },
65
+ "inputSchema" : [
66
+ {
67
+ "hasShapeFlexibility" : "0",
68
+ "isOptional" : "0",
69
+ "dataType" : "Float32",
70
+ "formattedType" : "MultiArray (Float32 1 × 77)",
71
+ "shortDescription" : "The token ids that represent the input text",
72
+ "shape" : "[1, 77]",
73
+ "name" : "input_ids",
74
+ "type" : "MultiArray"
75
+ }
76
+ ],
77
+ "userDefinedMetadata" : {
78
+ "com.github.apple.coremltools.version" : "7.0",
79
+ "com.github.apple.coremltools.source" : "torch==2.0.0"
80
+ },
81
+ "generatedClassName" : "Stable_Diffusion_version_stabilityai_stable_diffusion_2_1_base_text_encoder",
82
+ "method" : "predict"
83
+ }
84
+ ]
TextEncoder.mlmodelc/model.mil ADDED
The diff for this file is too large to render. See raw diff
 
TextEncoder.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce910048d3a79dcbbd1a0dc902a0e54846764f43cfeadad873d018902ac0f2c9
3
+ size 174036096
Unet.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c49fb4696b48d5268002dfc2a837a6f970a870f190d5e807d2e753afa3dea20e
3
+ size 243
Unet.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fed8a3480712df21867ca0d0ae912e402a0f7b3d421f41bee689d1b0e11d6936
3
+ size 1281
Unet.mlmodelc/metadata.json ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "shortDescription" : "Stable Diffusion generates images conditioned on text or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
4
+ "metadataOutputVersion" : "3.0",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float32",
10
+ "formattedType" : "MultiArray (Float32 2 × 4 × 64 × 64)",
11
+ "shortDescription" : "Same shape and dtype as the `sample` input. The predicted noise to facilitate the reverse diffusion (denoising) process",
12
+ "shape" : "[2, 4, 64, 64]",
13
+ "name" : "noise_pred",
14
+ "type" : "MultiArray"
15
+ }
16
+ ],
17
+ "version" : "stabilityai\/stable-diffusion-2-1-base",
18
+ "modelParameters" : [
19
+
20
+ ],
21
+ "author" : "Please refer to the Model Card available at huggingface.co\/stabilityai\/stable-diffusion-2-1-base",
22
+ "specificationVersion" : 7,
23
+ "storagePrecision" : "Mixed (Float16, Palettized (2 bits))",
24
+ "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
25
+ "mlProgramOperationTypeHistogram" : {
26
+ "Transpose" : 32,
27
+ "UpsampleNearestNeighbor" : 3,
28
+ "Ios16.reduceMean" : 218,
29
+ "Ios16.sin" : 1,
30
+ "Ios16.softmax" : 840,
31
+ "Split" : 16,
32
+ "Ios16.add" : 265,
33
+ "Concat" : 196,
34
+ "Ios16.realDiv" : 61,
35
+ "Ios16.square" : 61,
36
+ "ExpandDims" : 3,
37
+ "Ios16.sub" : 109,
38
+ "Ios16.cast" : 1,
39
+ "Ios16.conv" : 282,
40
+ "Ios16.constexprLutToDense" : 310,
41
+ "Ios16.einsum" : 1680,
42
+ "Ios16.gelu" : 16,
43
+ "Ios16.batchNorm" : 61,
44
+ "Ios16.reshape" : 154,
45
+ "Ios16.rsqrt" : 48,
46
+ "Ios16.silu" : 47,
47
+ "Ios16.sqrt" : 61,
48
+ "Ios16.mul" : 1001,
49
+ "Ios16.cos" : 1,
50
+ "SliceByIndex" : 1772
51
+ },
52
+ "computePrecision" : "Mixed (Float16, Float32, Int32)",
53
+ "isUpdatable" : "0",
54
+ "availability" : {
55
+ "macOS" : "13.0",
56
+ "tvOS" : "16.0",
57
+ "visionOS" : "1.0",
58
+ "watchOS" : "9.0",
59
+ "iOS" : "16.0",
60
+ "macCatalyst" : "16.0"
61
+ },
62
+ "modelType" : {
63
+ "name" : "MLModelType_mlProgram"
64
+ },
65
+ "inputSchema" : [
66
+ {
67
+ "hasShapeFlexibility" : "0",
68
+ "isOptional" : "0",
69
+ "dataType" : "Float16",
70
+ "formattedType" : "MultiArray (Float16 2 × 4 × 64 × 64)",
71
+ "shortDescription" : "The low resolution latent feature maps being denoised through reverse diffusion",
72
+ "shape" : "[2, 4, 64, 64]",
73
+ "name" : "sample",
74
+ "type" : "MultiArray"
75
+ },
76
+ {
77
+ "hasShapeFlexibility" : "0",
78
+ "isOptional" : "0",
79
+ "dataType" : "Float16",
80
+ "formattedType" : "MultiArray (Float16 2)",
81
+ "shortDescription" : "A value emitted by the associated scheduler object to condition the model on a given noise schedule",
82
+ "shape" : "[2]",
83
+ "name" : "timestep",
84
+ "type" : "MultiArray"
85
+ },
86
+ {
87
+ "hasShapeFlexibility" : "0",
88
+ "isOptional" : "0",
89
+ "dataType" : "Float16",
90
+ "formattedType" : "MultiArray (Float16 2 × 1024 × 1 × 77)",
91
+ "shortDescription" : "Output embeddings from the associated text_encoder model to condition the generated image on text. A maximum of 77 tokens (~40 words) are allowed. Longer text is truncated. Shorter text does not reduce computation.",
92
+ "shape" : "[2, 1024, 1, 77]",
93
+ "name" : "encoder_hidden_states",
94
+ "type" : "MultiArray"
95
+ }
96
+ ],
97
+ "userDefinedMetadata" : {
98
+ "com.github.apple.coremltools.version" : "7.0",
99
+ "com.github.apple.coremltools.source" : "torch==2.0.0",
100
+ "com.github.apple.ml-stable-diffusion.version" : "1.1.0"
101
+ },
102
+ "generatedClassName" : "Stable_Diffusion_version_stabilityai_stable_diffusion_2_1_base_unet",
103
+ "method" : "predict"
104
+ }
105
+ ]
Unet.mlmodelc/model.mil ADDED
The diff for this file is too large to render. See raw diff
 
Unet.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7e0f7d21a5d8f37474854c83ebf55ce8dc1b872a63e9022cb05375d621ea359
3
+ size 217101696
VAEDecoder.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cecb86254a5fa4e2233ac8588b0ba32c830f16a8e711e6242eb9d8eb449ee66b
3
+ size 243
VAEDecoder.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a14171592a8031331c432f8dff9504622f702065240d18325414cae688d68e8
3
+ size 775
VAEDecoder.mlmodelc/metadata.json ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
4
+ "metadataOutputVersion" : "3.0",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float32",
10
+ "formattedType" : "MultiArray (Float32 1 × 3 × 512 × 512)",
11
+ "shortDescription" : "Generated image normalized to range [-1, 1]",
12
+ "shape" : "[1, 3, 512, 512]",
13
+ "name" : "image",
14
+ "type" : "MultiArray"
15
+ }
16
+ ],
17
+ "version" : "stabilityai\/stable-diffusion-2-1-base",
18
+ "modelParameters" : [
19
+
20
+ ],
21
+ "author" : "Please refer to the Model Card available at huggingface.co\/stabilityai\/stable-diffusion-2-1-base",
22
+ "specificationVersion" : 7,
23
+ "storagePrecision" : "Float16",
24
+ "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
25
+ "mlProgramOperationTypeHistogram" : {
26
+ "Ios16.cast" : 1,
27
+ "Ios16.mul" : 2,
28
+ "Ios16.sqrt" : 30,
29
+ "Ios16.sub" : 30,
30
+ "Transpose" : 6,
31
+ "UpsampleNearestNeighbor" : 3,
32
+ "Ios16.conv" : 36,
33
+ "Ios16.add" : 46,
34
+ "Ios16.linear" : 4,
35
+ "Ios16.matmul" : 2,
36
+ "Ios16.realDiv" : 30,
37
+ "Ios16.reduceMean" : 60,
38
+ "Ios16.softmax" : 1,
39
+ "Ios16.batchNorm" : 29,
40
+ "Ios16.square" : 30,
41
+ "Ios16.reshape" : 65,
42
+ "Ios16.silu" : 29
43
+ },
44
+ "computePrecision" : "Mixed (Float16, Float32, Int32)",
45
+ "isUpdatable" : "0",
46
+ "availability" : {
47
+ "macOS" : "13.0",
48
+ "tvOS" : "16.0",
49
+ "visionOS" : "1.0",
50
+ "watchOS" : "9.0",
51
+ "iOS" : "16.0",
52
+ "macCatalyst" : "16.0"
53
+ },
54
+ "modelType" : {
55
+ "name" : "MLModelType_mlProgram"
56
+ },
57
+ "inputSchema" : [
58
+ {
59
+ "hasShapeFlexibility" : "0",
60
+ "isOptional" : "0",
61
+ "dataType" : "Float16",
62
+ "formattedType" : "MultiArray (Float16 1 × 4 × 64 × 64)",
63
+ "shortDescription" : "The denoised latent embeddings from the unet model after the last step of reverse diffusion",
64
+ "shape" : "[1, 4, 64, 64]",
65
+ "name" : "z",
66
+ "type" : "MultiArray"
67
+ }
68
+ ],
69
+ "userDefinedMetadata" : {
70
+ "com.github.apple.coremltools.version" : "7.0",
71
+ "com.github.apple.coremltools.source" : "torch==2.0.0"
72
+ },
73
+ "generatedClassName" : "Stable_Diffusion_version_stabilityai_stable_diffusion_2_1_base_vae_decoder",
74
+ "method" : "predict"
75
+ }
76
+ ]
VAEDecoder.mlmodelc/model.mil ADDED
The diff for this file is too large to render. See raw diff
 
VAEDecoder.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccc8ff9d007a62958b367dfdaaee208e1f842e2cdc432d484d2f8297c9b0afe3
3
+ size 98993280
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
vocab.json ADDED
The diff for this file is too large to render. See raw diff