Upload folder using huggingface_hub

Browse files

Files changed (18) hide show

.DS_Store +0 -0
TextEncoder.mlmodelc/analytics/coremldata.bin +3 -0
TextEncoder.mlmodelc/coremldata.bin +3 -0
TextEncoder.mlmodelc/metadata.json +84 -0
TextEncoder.mlmodelc/model.mil +0 -0
TextEncoder.mlmodelc/weights/weight.bin +3 -0
Unet.mlmodelc/analytics/coremldata.bin +3 -0
Unet.mlmodelc/coremldata.bin +3 -0
Unet.mlmodelc/metadata.json +105 -0
Unet.mlmodelc/model.mil +0 -0
Unet.mlmodelc/weights/weight.bin +3 -0
VAEDecoder.mlmodelc/analytics/coremldata.bin +3 -0
VAEDecoder.mlmodelc/coremldata.bin +3 -0
VAEDecoder.mlmodelc/metadata.json +76 -0
VAEDecoder.mlmodelc/model.mil +0 -0
VAEDecoder.mlmodelc/weights/weight.bin +3 -0
merges.txt +0 -0
vocab.json +0 -0

.DS_Store ADDED Viewed

Binary file (6.15 kB). View file

TextEncoder.mlmodelc/analytics/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8dac4ccc46f3c5e8ffa0a19511039b8ceadd239791fabb5623b822bce8063275
+size 243

TextEncoder.mlmodelc/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:13e580e4ef472512859174485e27ab173759522d91e225a1db35ceee09acae66
+size 848

TextEncoder.mlmodelc/metadata.json ADDED Viewed

	@@ -0,0 +1,84 @@

+[
+  {
+    "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
+    "metadataOutputVersion" : "3.0",
+    "outputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32 1 × 77 × 1024)",
+        "shortDescription" : "The token embeddings as encoded by the Transformer model",
+        "shape" : "[1, 77, 1024]",
+        "name" : "last_hidden_state",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32 1 × 1024)",
+        "shortDescription" : "The version of the `last_hidden_state` output after pooling",
+        "shape" : "[1, 1024]",
+        "name" : "pooled_outputs",
+        "type" : "MultiArray"
+      }
+    ],
+    "version" : "stabilityai\/stable-diffusion-2-1-base",
+    "modelParameters" : [
+    ],
+    "author" : "Please refer to the Model Card available at huggingface.co\/stabilityai\/stable-diffusion-2-1-base",
+    "specificationVersion" : 7,
+    "storagePrecision" : "Mixed (Float16, Palettized (2 bits))",
+    "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
+    "mlProgramOperationTypeHistogram" : {
+      "Ios16.cast" : 3,
+      "Ios16.mul" : 23,
+      "Ios16.layerNorm" : 47,
+      "Ios16.constexprLutToDense" : 163,
+      "Stack" : 1,
+      "Transpose" : 115,
+      "Ios16.linear" : 138,
+      "Ios16.add" : 70,
+      "Ios16.matmul" : 46,
+      "Ios16.gelu" : 23,
+      "Ios16.softmax" : 23,
+      "Ios16.gatherNd" : 1,
+      "Ios16.gather" : 1,
+      "Ios16.reshape" : 230,
+      "Ios16.reduceArgmax" : 1
+    },
+    "computePrecision" : "Mixed (Float16, Float32, Int32)",
+    "isUpdatable" : "0",
+    "availability" : {
+      "macOS" : "13.0",
+      "tvOS" : "16.0",
+      "visionOS" : "1.0",
+      "watchOS" : "9.0",
+      "iOS" : "16.0",
+      "macCatalyst" : "16.0"
+    },
+    "modelType" : {
+      "name" : "MLModelType_mlProgram"
+    },
+    "inputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32 1 × 77)",
+        "shortDescription" : "The token ids that represent the input text",
+        "shape" : "[1, 77]",
+        "name" : "input_ids",
+        "type" : "MultiArray"
+      }
+    ],
+    "userDefinedMetadata" : {
+      "com.github.apple.coremltools.version" : "7.0",
+      "com.github.apple.coremltools.source" : "torch==2.0.0"
+    },
+    "generatedClassName" : "Stable_Diffusion_version_stabilityai_stable_diffusion_2_1_base_text_encoder",
+    "method" : "predict"
+  }
+]

TextEncoder.mlmodelc/model.mil ADDED Viewed

The diff for this file is too large to render. See raw diff

TextEncoder.mlmodelc/weights/weight.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ce910048d3a79dcbbd1a0dc902a0e54846764f43cfeadad873d018902ac0f2c9
+size 174036096

Unet.mlmodelc/analytics/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c49fb4696b48d5268002dfc2a837a6f970a870f190d5e807d2e753afa3dea20e
+size 243

Unet.mlmodelc/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fed8a3480712df21867ca0d0ae912e402a0f7b3d421f41bee689d1b0e11d6936
+size 1281

Unet.mlmodelc/metadata.json ADDED Viewed

	@@ -0,0 +1,105 @@

+[
+  {
+    "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
+    "metadataOutputVersion" : "3.0",
+    "outputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32 2 × 4 × 64 × 64)",
+        "shortDescription" : "Same shape and dtype as the `sample` input. The predicted noise to facilitate the reverse diffusion (denoising) process",
+        "shape" : "[2, 4, 64, 64]",
+        "name" : "noise_pred",
+        "type" : "MultiArray"
+      }
+    ],
+    "version" : "stabilityai\/stable-diffusion-2-1-base",
+    "modelParameters" : [
+    ],
+    "author" : "Please refer to the Model Card available at huggingface.co\/stabilityai\/stable-diffusion-2-1-base",
+    "specificationVersion" : 7,
+    "storagePrecision" : "Mixed (Float16, Palettized (2 bits))",
+    "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
+    "mlProgramOperationTypeHistogram" : {
+      "Transpose" : 32,
+      "UpsampleNearestNeighbor" : 3,
+      "Ios16.reduceMean" : 218,
+      "Ios16.sin" : 1,
+      "Ios16.softmax" : 840,
+      "Split" : 16,
+      "Ios16.add" : 265,
+      "Concat" : 196,
+      "Ios16.realDiv" : 61,
+      "Ios16.square" : 61,
+      "ExpandDims" : 3,
+      "Ios16.sub" : 109,
+      "Ios16.cast" : 1,
+      "Ios16.conv" : 282,
+      "Ios16.constexprLutToDense" : 310,
+      "Ios16.einsum" : 1680,
+      "Ios16.gelu" : 16,
+      "Ios16.batchNorm" : 61,
+      "Ios16.reshape" : 154,
+      "Ios16.rsqrt" : 48,
+      "Ios16.silu" : 47,
+      "Ios16.sqrt" : 61,
+      "Ios16.mul" : 1001,
+      "Ios16.cos" : 1,
+      "SliceByIndex" : 1772
+    },
+    "computePrecision" : "Mixed (Float16, Float32, Int32)",
+    "isUpdatable" : "0",
+    "availability" : {
+      "macOS" : "13.0",
+      "tvOS" : "16.0",
+      "visionOS" : "1.0",
+      "watchOS" : "9.0",
+      "iOS" : "16.0",
+      "macCatalyst" : "16.0"
+    },
+    "modelType" : {
+      "name" : "MLModelType_mlProgram"
+    },
+    "inputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 2 × 4 × 64 × 64)",
+        "shortDescription" : "The low resolution latent feature maps being denoised through reverse diffusion",
+        "shape" : "[2, 4, 64, 64]",
+        "name" : "sample",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 2)",
+        "shortDescription" : "A value emitted by the associated scheduler object to condition the model on a given noise schedule",
+        "shape" : "[2]",
+        "name" : "timestep",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 2 × 1024 × 1 × 77)",
+        "shortDescription" : "Output embeddings from the associated text_encoder model to condition the generated image on text. A maximum of 77 tokens (~40 words) are allowed. Longer text is truncated. Shorter text does not reduce computation.",
+        "shape" : "[2, 1024, 1, 77]",
+        "name" : "encoder_hidden_states",
+        "type" : "MultiArray"
+      }
+    ],
+    "userDefinedMetadata" : {
+      "com.github.apple.coremltools.version" : "7.0",
+      "com.github.apple.coremltools.source" : "torch==2.0.0",
+      "com.github.apple.ml-stable-diffusion.version" : "1.1.0"
+    },
+    "generatedClassName" : "Stable_Diffusion_version_stabilityai_stable_diffusion_2_1_base_unet",
+    "method" : "predict"
+  }
+]

Unet.mlmodelc/model.mil ADDED Viewed

The diff for this file is too large to render. See raw diff

Unet.mlmodelc/weights/weight.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e7e0f7d21a5d8f37474854c83ebf55ce8dc1b872a63e9022cb05375d621ea359
+size 217101696

VAEDecoder.mlmodelc/analytics/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cecb86254a5fa4e2233ac8588b0ba32c830f16a8e711e6242eb9d8eb449ee66b
+size 243

VAEDecoder.mlmodelc/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2a14171592a8031331c432f8dff9504622f702065240d18325414cae688d68e8
+size 775

VAEDecoder.mlmodelc/metadata.json ADDED Viewed

	@@ -0,0 +1,76 @@

+[
+  {
+    "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
+    "metadataOutputVersion" : "3.0",
+    "outputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32 1 × 3 × 512 × 512)",
+        "shortDescription" : "Generated image normalized to range [-1, 1]",
+        "shape" : "[1, 3, 512, 512]",
+        "name" : "image",
+        "type" : "MultiArray"
+      }
+    ],
+    "version" : "stabilityai\/stable-diffusion-2-1-base",
+    "modelParameters" : [
+    ],
+    "author" : "Please refer to the Model Card available at huggingface.co\/stabilityai\/stable-diffusion-2-1-base",
+    "specificationVersion" : 7,
+    "storagePrecision" : "Float16",
+    "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
+    "mlProgramOperationTypeHistogram" : {
+      "Ios16.cast" : 1,
+      "Ios16.mul" : 2,
+      "Ios16.sqrt" : 30,
+      "Ios16.sub" : 30,
+      "Transpose" : 6,
+      "UpsampleNearestNeighbor" : 3,
+      "Ios16.conv" : 36,
+      "Ios16.add" : 46,
+      "Ios16.linear" : 4,
+      "Ios16.matmul" : 2,
+      "Ios16.realDiv" : 30,
+      "Ios16.reduceMean" : 60,
+      "Ios16.softmax" : 1,
+      "Ios16.batchNorm" : 29,
+      "Ios16.square" : 30,
+      "Ios16.reshape" : 65,
+      "Ios16.silu" : 29
+    },
+    "computePrecision" : "Mixed (Float16, Float32, Int32)",
+    "isUpdatable" : "0",
+    "availability" : {
+      "macOS" : "13.0",
+      "tvOS" : "16.0",
+      "visionOS" : "1.0",
+      "watchOS" : "9.0",
+      "iOS" : "16.0",
+      "macCatalyst" : "16.0"
+    },
+    "modelType" : {
+      "name" : "MLModelType_mlProgram"
+    },
+    "inputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 1 × 4 × 64 × 64)",
+        "shortDescription" : "The denoised latent embeddings from the unet model after the last step of reverse diffusion",
+        "shape" : "[1, 4, 64, 64]",
+        "name" : "z",
+        "type" : "MultiArray"
+      }
+    ],
+    "userDefinedMetadata" : {
+      "com.github.apple.coremltools.version" : "7.0",
+      "com.github.apple.coremltools.source" : "torch==2.0.0"
+    },
+    "generatedClassName" : "Stable_Diffusion_version_stabilityai_stable_diffusion_2_1_base_vae_decoder",
+    "method" : "predict"
+  }
+]

VAEDecoder.mlmodelc/model.mil ADDED Viewed

The diff for this file is too large to render. See raw diff

VAEDecoder.mlmodelc/weights/weight.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ccc8ff9d007a62958b367dfdaaee208e1f842e2cdc432d484d2f8297c9b0afe3
+size 98993280

merges.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff