pcuenq HF staff committed on Jun 14, 2023

Commit

bf4734c

1 Parent(s): 9f5706e

Final zip and uncompressed versions with encoder.

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

coreml-stable-diffusion-2-1-base-palettized_original_compiled.zip +2 -2
coreml-stable-diffusion-2-1-base-palettized_split_einsum_v2_compiled.zip +2 -2
original/compiled/TextEncoder.mlmodelc/analytics/coremldata.bin +3 -0
original/compiled/TextEncoder.mlmodelc/coremldata.bin +3 -0
original/compiled/TextEncoder.mlmodelc/metadata.json +83 -0
original/compiled/TextEncoder.mlmodelc/model.mil +0 -0
original/compiled/TextEncoder.mlmodelc/weights/weight.bin +3 -0
original/compiled/Unet.mlmodelc/analytics/coremldata.bin +3 -0
original/compiled/Unet.mlmodelc/coremldata.bin +3 -0
original/compiled/Unet.mlmodelc/metadata.json +102 -0
original/compiled/Unet.mlmodelc/model.mil +0 -0
original/compiled/Unet.mlmodelc/weights/weight.bin +3 -0
original/compiled/VAEDecoder.mlmodelc/analytics/coremldata.bin +3 -0
original/compiled/VAEDecoder.mlmodelc/coremldata.bin +3 -0
original/compiled/VAEDecoder.mlmodelc/metadata.json +75 -0
original/compiled/VAEDecoder.mlmodelc/model.mil +0 -0
original/compiled/VAEDecoder.mlmodelc/weights/weight.bin +3 -0
original/compiled/VAEEncoder.mlmodelc/analytics/coremldata.bin +3 -0
original/compiled/VAEEncoder.mlmodelc/coremldata.bin +3 -0
original/compiled/VAEEncoder.mlmodelc/metadata.json +75 -0
original/compiled/VAEEncoder.mlmodelc/model.mil +0 -0
original/compiled/VAEEncoder.mlmodelc/weights/weight.bin +3 -0
original/compiled/merges.txt +0 -0
original/compiled/vocab.json +0 -0
original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_text_encoder.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_text_encoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_text_encoder.mlpackage/Manifest.json +18 -0
original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_unet.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_unet.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_unet.mlpackage/Manifest.json +18 -0
original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_vae_decoder.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_vae_decoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_vae_decoder.mlpackage/Manifest.json +18 -0
original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_vae_encoder.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_vae_encoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_vae_encoder.mlpackage/Manifest.json +18 -0
split_einsum_v2/compiled/TextEncoder.mlmodelc/analytics/coremldata.bin +3 -0
split_einsum_v2/compiled/TextEncoder.mlmodelc/coremldata.bin +3 -0
split_einsum_v2/compiled/TextEncoder.mlmodelc/metadata.json +83 -0
split_einsum_v2/compiled/TextEncoder.mlmodelc/model.mil +0 -0
split_einsum_v2/compiled/TextEncoder.mlmodelc/weights/weight.bin +3 -0
split_einsum_v2/compiled/Unet.mlmodelc/analytics/coremldata.bin +3 -0
split_einsum_v2/compiled/Unet.mlmodelc/coremldata.bin +3 -0
split_einsum_v2/compiled/Unet.mlmodelc/metadata.json +103 -0
split_einsum_v2/compiled/Unet.mlmodelc/model.mil +0 -0
split_einsum_v2/compiled/Unet.mlmodelc/weights/weight.bin +3 -0
split_einsum_v2/compiled/VAEDecoder.mlmodelc/analytics/coremldata.bin +3 -0
split_einsum_v2/compiled/VAEDecoder.mlmodelc/coremldata.bin +3 -0
split_einsum_v2/compiled/VAEDecoder.mlmodelc/metadata.json +75 -0
split_einsum_v2/compiled/VAEDecoder.mlmodelc/model.mil +0 -0

coreml-stable-diffusion-2-1-base-palettized_original_compiled.zip CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:75d6a8416b593e63042259036faa326c01c9621cbca0ddbebbca3c2247060417
-size 1070762141

 version https://git-lfs.github.com/spec/v1
+oid sha256:3769cd509f62f0ad3d326c6592864138ce0fdfc536d3d4e67fd65bea40eb5d7c
+size 1139245980

coreml-stable-diffusion-2-1-base-palettized_split_einsum_v2_compiled.zip CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f346c3fd19bcfcbb9561f65e53f9f417339f66a7dcc3282e033a8b9717bf5eaa
-size 1072895985

 version https://git-lfs.github.com/spec/v1
+oid sha256:90c532943d460c559a8d84b7a0f05a4d265fee78ca355fdd5aa734fd43e08972
+size 1141379936

original/compiled/TextEncoder.mlmodelc/analytics/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a26bdd792e919ca3412c0685e74ea507a6de835532f0ec58d780c99b0a7a0193
+size 207

original/compiled/TextEncoder.mlmodelc/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2f0484a1a04e023da06787de4140cf215f9ccd67f93d916dc388b846d8607899
+size 839

original/compiled/TextEncoder.mlmodelc/metadata.json ADDED Viewed

	@@ -0,0 +1,83 @@

+[
+  {
+    "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
+    "metadataOutputVersion" : "3.0",
+    "outputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32)",
+        "shortDescription" : "The token embeddings as encoded by the Transformer model",
+        "shape" : "[]",
+        "name" : "last_hidden_state",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32)",
+        "shortDescription" : "The version of the `last_hidden_state` output after pooling",
+        "shape" : "[]",
+        "name" : "pooled_outputs",
+        "type" : "MultiArray"
+      }
+    ],
+    "version" : "stabilityai\/stable-diffusion-2-1-base",
+    "modelParameters" : [
+    ],
+    "author" : "Please refer to the Model Card available at huggingface.co\/stabilityai\/stable-diffusion-2-1-base",
+    "specificationVersion" : 7,
+    "storagePrecision" : "Mixed (Float16, Palettized (6 bits))",
+    "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
+    "mlProgramOperationTypeHistogram" : {
+      "Ios16.cast" : 3,
+      "Ios16.mul" : 23,
+      "Ios16.layerNorm" : 47,
+      "Ios16.constexprLutToDense" : 163,
+      "Stack" : 1,
+      "Transpose" : 115,
+      "Ios16.linear" : 138,
+      "Ios16.add" : 70,
+      "Ios16.matmul" : 46,
+      "Ios16.gelu" : 23,
+      "Ios16.softmax" : 23,
+      "Ios16.gatherNd" : 1,
+      "Ios16.gather" : 1,
+      "Ios16.reshape" : 230,
+      "Ios16.reduceArgmax" : 1
+    },
+    "computePrecision" : "Mixed (Float16, Float32, Int32)",
+    "isUpdatable" : "0",
+    "availability" : {
+      "macOS" : "13.0",
+      "tvOS" : "16.0",
+      "watchOS" : "9.0",
+      "iOS" : "16.0",
+      "macCatalyst" : "16.0"
+    },
+    "modelType" : {
+      "name" : "MLModelType_mlProgram"
+    },
+    "inputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32 1 × 77)",
+        "shortDescription" : "The token ids that represent the input text",
+        "shape" : "[1, 77]",
+        "name" : "input_ids",
+        "type" : "MultiArray"
+      }
+    ],
+    "userDefinedMetadata" : {
+      "com.github.apple.coremltools.version" : "7.0b1",
+      "com.github.apple.coremltools.source" : "torch==2.0.1"
+    },
+    "generatedClassName" : "Stable_Diffusion_version_stabilityai_stable_diffusion_2_1_base_text_encoder",
+    "method" : "predict"
+  }
+]

original/compiled/TextEncoder.mlmodelc/model.mil ADDED Viewed

The diff for this file is too large to render. See raw diff

original/compiled/TextEncoder.mlmodelc/weights/weight.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4e5ac135bb5f002401ffea7766e8f2231ebb75dd2deee90893eb11a9c1a07d35
+size 318860352

original/compiled/Unet.mlmodelc/analytics/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fb7e6fb835c839f3651203e04393bf965d36b9fd374b4738622b17129fd93b6f
+size 207

original/compiled/Unet.mlmodelc/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5bc742d03b80b46feaa6f9e2159a5c89acda3ed2c1562f2b4f781bb7bfbce110
+size 1221

original/compiled/Unet.mlmodelc/metadata.json ADDED Viewed

	@@ -0,0 +1,102 @@

+[
+  {
+    "shortDescription" : "Stable Diffusion generates images conditioned on text or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
+    "metadataOutputVersion" : "3.0",
+    "outputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32)",
+        "shortDescription" : "Same shape and dtype as the `sample` input. The predicted noise to facilitate the reverse diffusion (denoising) process",
+        "shape" : "[]",
+        "name" : "noise_pred",
+        "type" : "MultiArray"
+      }
+    ],
+    "version" : "stabilityai\/stable-diffusion-2-1-base",
+    "modelParameters" : [
+    ],
+    "author" : "Please refer to the Model Card available at huggingface.co\/stabilityai\/stable-diffusion-2-1-base",
+    "specificationVersion" : 7,
+    "storagePrecision" : "Mixed (Float16, Palettized (6 bits))",
+    "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
+    "mlProgramOperationTypeHistogram" : {
+      "UpsampleNearestNeighbor" : 3,
+      "Ios16.reduceMean" : 218,
+      "Ios16.sin" : 1,
+      "Ios16.softmax" : 32,
+      "Split" : 16,
+      "Ios16.add" : 265,
+      "Concat" : 14,
+      "Ios16.realDiv" : 61,
+      "Ios16.square" : 61,
+      "ExpandDims" : 3,
+      "Ios16.sub" : 109,
+      "Ios16.cast" : 1,
+      "Ios16.conv" : 282,
+      "Ios16.constexprLutToDense" : 310,
+      "Ios16.gelu" : 16,
+      "Ios16.matmul" : 64,
+      "Ios16.batchNorm" : 61,
+      "Ios16.reshape" : 282,
+      "Ios16.rsqrt" : 48,
+      "Ios16.silu" : 47,
+      "Ios16.sqrt" : 61,
+      "Ios16.mul" : 193,
+      "Ios16.cos" : 1,
+      "SliceByIndex" : 2
+    },
+    "computePrecision" : "Mixed (Float16, Float32, Int32)",
+    "isUpdatable" : "0",
+    "availability" : {
+      "macOS" : "13.0",
+      "tvOS" : "16.0",
+      "watchOS" : "9.0",
+      "iOS" : "16.0",
+      "macCatalyst" : "16.0"
+    },
+    "modelType" : {
+      "name" : "MLModelType_mlProgram"
+    },
+    "inputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 2 × 4 × 64 × 64)",
+        "shortDescription" : "The low resolution latent feature maps being denoised through reverse diffusion",
+        "shape" : "[2, 4, 64, 64]",
+        "name" : "sample",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 2)",
+        "shortDescription" : "A value emitted by the associated scheduler object to condition the model on a given noise schedule",
+        "shape" : "[2]",
+        "name" : "timestep",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 2 × 1024 × 1 × 77)",
+        "shortDescription" : "Output embeddings from the associated text_encoder model to condition the generated image on text. A maximum of 77 tokens (~40 words) are allowed. Longer text is truncated. Shorter text does not reduce computation.",
+        "shape" : "[2, 1024, 1, 77]",
+        "name" : "encoder_hidden_states",
+        "type" : "MultiArray"
+      }
+    ],
+    "userDefinedMetadata" : {
+      "com.github.apple.coremltools.version" : "7.0b1",
+      "com.github.apple.coremltools.source" : "torch==2.0.1"
+    },
+    "generatedClassName" : "Stable_Diffusion_version_stabilityai_stable_diffusion_2_1_base_unet",
+    "method" : "predict"
+  }
+]

original/compiled/Unet.mlmodelc/model.mil ADDED Viewed

The diff for this file is too large to render. See raw diff

original/compiled/Unet.mlmodelc/weights/weight.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:45bf0fd5713dc4f15bf1d14788e33bb6ad27796c80cffbe52e157cf398bbae0b
+size 649959936

original/compiled/VAEDecoder.mlmodelc/analytics/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:682f30dbd27b8c96fae9dd5d7cec36e85812e370cc2a920d9a6cef7a908e29d3
+size 207

original/compiled/VAEDecoder.mlmodelc/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:57555bee9ff5d60c5b6fd48564eac43523d954a2d34101273b8e3fa8f1aee3d0
+size 769

original/compiled/VAEDecoder.mlmodelc/metadata.json ADDED Viewed

	@@ -0,0 +1,75 @@

+[
+  {
+    "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
+    "metadataOutputVersion" : "3.0",
+    "outputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32)",
+        "shortDescription" : "Generated image normalized to range [-1, 1]",
+        "shape" : "[]",
+        "name" : "image",
+        "type" : "MultiArray"
+      }
+    ],
+    "version" : "stabilityai\/stable-diffusion-2-1-base",
+    "modelParameters" : [
+    ],
+    "author" : "Please refer to the Model Card available at huggingface.co\/stabilityai\/stable-diffusion-2-1-base",
+    "specificationVersion" : 7,
+    "storagePrecision" : "Float16",
+    "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
+    "mlProgramOperationTypeHistogram" : {
+      "Ios16.cast" : 1,
+      "Ios16.mul" : 1,
+      "Ios16.sqrt" : 30,
+      "Ios16.sub" : 30,
+      "Transpose" : 7,
+      "UpsampleNearestNeighbor" : 3,
+      "Ios16.conv" : 36,
+      "Ios16.add" : 45,
+      "Ios16.linear" : 4,
+      "Ios16.matmul" : 2,
+      "Ios16.realDiv" : 30,
+      "Ios16.reduceMean" : 60,
+      "Ios16.softmax" : 1,
+      "Ios16.batchNorm" : 30,
+      "Ios16.square" : 30,
+      "Ios16.reshape" : 70,
+      "Ios16.silu" : 29
+    },
+    "computePrecision" : "Mixed (Float16, Float32, Int32)",
+    "isUpdatable" : "0",
+    "availability" : {
+      "macOS" : "13.0",
+      "tvOS" : "16.0",
+      "watchOS" : "9.0",
+      "iOS" : "16.0",
+      "macCatalyst" : "16.0"
+    },
+    "modelType" : {
+      "name" : "MLModelType_mlProgram"
+    },
+    "inputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 1 × 4 × 64 × 64)",
+        "shortDescription" : "The denoised latent embeddings from the unet model after the last step of reverse diffusion",
+        "shape" : "[1, 4, 64, 64]",
+        "name" : "z",
+        "type" : "MultiArray"
+      }
+    ],
+    "userDefinedMetadata" : {
+      "com.github.apple.coremltools.version" : "7.0b1",
+      "com.github.apple.coremltools.source" : "torch==2.0.1"
+    },
+    "generatedClassName" : "Stable_Diffusion_version_stabilityai_stable_diffusion_2_1_base_vae_decoder",
+    "method" : "predict"
+  }
+]

original/compiled/VAEDecoder.mlmodelc/model.mil ADDED Viewed

The diff for this file is too large to render. See raw diff

original/compiled/VAEDecoder.mlmodelc/weights/weight.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1fc0794d5ffad51b5599d2e978ee3351638edeab6753a3f6e5453fa612772286
+size 98993280

original/compiled/VAEEncoder.mlmodelc/analytics/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:15f5816e1040cbb9124d5d3d9b17ea7cee1e32adda5322b45d992b072bfa352a
+size 207

original/compiled/VAEEncoder.mlmodelc/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d8d5fe5e99e6989b1ea29a9da7a6938025f9a7253e81ef722c6accca4594ae36
+size 775

original/compiled/VAEEncoder.mlmodelc/metadata.json ADDED Viewed

	@@ -0,0 +1,75 @@

+[
+  {
+    "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
+    "metadataOutputVersion" : "3.0",
+    "outputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32)",
+        "shortDescription" : "The latent embeddings from the unet model from the input image.",
+        "shape" : "[]",
+        "name" : "latent",
+        "type" : "MultiArray"
+      }
+    ],
+    "version" : "stabilityai\/stable-diffusion-2-1-base",
+    "modelParameters" : [
+    ],
+    "author" : "Please refer to the Model Card available at huggingface.co\/stabilityai\/stable-diffusion-2-1-base",
+    "specificationVersion" : 7,
+    "storagePrecision" : "Float16",
+    "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
+    "mlProgramOperationTypeHistogram" : {
+      "Pad" : 3,
+      "Ios16.cast" : 1,
+      "Ios16.mul" : 1,
+      "Ios16.sqrt" : 22,
+      "Ios16.sub" : 22,
+      "Transpose" : 7,
+      "Ios16.conv" : 28,
+      "Ios16.add" : 33,
+      "Ios16.linear" : 4,
+      "Ios16.matmul" : 2,
+      "Ios16.realDiv" : 22,
+      "Ios16.reduceMean" : 44,
+      "Ios16.softmax" : 1,
+      "Ios16.batchNorm" : 22,
+      "Ios16.square" : 22,
+      "Ios16.reshape" : 54,
+      "Ios16.silu" : 21
+    },
+    "computePrecision" : "Mixed (Float16, Float32, Int32)",
+    "isUpdatable" : "0",
+    "availability" : {
+      "macOS" : "13.0",
+      "tvOS" : "16.0",
+      "watchOS" : "9.0",
+      "iOS" : "16.0",
+      "macCatalyst" : "16.0"
+    },
+    "modelType" : {
+      "name" : "MLModelType_mlProgram"
+    },
+    "inputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 1 × 3 × 512 × 512)",
+        "shortDescription" : "The input image to base the initial latents on normalized to range [-1, 1]",
+        "shape" : "[1, 3, 512, 512]",
+        "name" : "z",
+        "type" : "MultiArray"
+      }
+    ],
+    "userDefinedMetadata" : {
+      "com.github.apple.coremltools.version" : "7.0b1",
+      "com.github.apple.coremltools.source" : "torch==2.0.1"
+    },
+    "generatedClassName" : "Stable_Diffusion_version_stabilityai_stable_diffusion_2_1_base_vae_encoder",
+    "method" : "predict"
+  }
+]

original/compiled/VAEEncoder.mlmodelc/model.mil ADDED Viewed

The diff for this file is too large to render. See raw diff

original/compiled/VAEEncoder.mlmodelc/weights/weight.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6f2d9d29b46a29008068665a44b921c661baea9be0443e1ff5bf12cd7032e516
+size 68338112

original/compiled/merges.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

original/compiled/vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff

original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_text_encoder.mlpackage/Data/com.apple.CoreML/model.mlmodel ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e01d9bc98cfe3bd805dab8d2cbf4a48348de0849969ca809abd46bcf0793fb57
+size 325428

original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_text_encoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4e5ac135bb5f002401ffea7766e8f2231ebb75dd2deee90893eb11a9c1a07d35
+size 318860352

original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_text_encoder.mlpackage/Manifest.json ADDED Viewed

	@@ -0,0 +1,18 @@

+{
+    "fileFormatVersion": "1.0.0",
+    "itemInfoEntries": {
+        "4E390967-A1B3-4867-95AF-D4C37FC150E6": {
+            "author": "com.apple.CoreML",
+            "description": "CoreML Model Specification",
+            "name": "model.mlmodel",
+            "path": "com.apple.CoreML/model.mlmodel"
+        },
+        "F818F547-4536-4699-AE30-389FE0DFE215": {
+            "author": "com.apple.CoreML",
+            "description": "CoreML Model Weights",
+            "name": "weights",
+            "path": "com.apple.CoreML/weights"
+        }
+    },
+    "rootModelIdentifier": "4E390967-A1B3-4867-95AF-D4C37FC150E6"
+}

original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_unet.mlpackage/Data/com.apple.CoreML/model.mlmodel ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:36cbf4d2fc2d40cf7bf9cbaaf69bbd6f2c97249893212f25d56efab1369fdc70
+size 822548

original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_unet.mlpackage/Data/com.apple.CoreML/weights/weight.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:45bf0fd5713dc4f15bf1d14788e33bb6ad27796c80cffbe52e157cf398bbae0b
+size 649959936

original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_unet.mlpackage/Manifest.json ADDED Viewed

	@@ -0,0 +1,18 @@

+{
+    "fileFormatVersion": "1.0.0",
+    "itemInfoEntries": {
+        "9588C4DE-C362-45E3-8069-9188B08D251F": {
+            "author": "com.apple.CoreML",
+            "description": "CoreML Model Specification",
+            "name": "model.mlmodel",
+            "path": "com.apple.CoreML/model.mlmodel"
+        },
+        "B0E56A57-C91D-4EC6-AE9E-AA0973BA672B": {
+            "author": "com.apple.CoreML",
+            "description": "CoreML Model Weights",
+            "name": "weights",
+            "path": "com.apple.CoreML/weights"
+        }
+    },
+    "rootModelIdentifier": "9588C4DE-C362-45E3-8069-9188B08D251F"
+}

original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_vae_decoder.mlpackage/Data/com.apple.CoreML/model.mlmodel ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f51c78e72da77a882a7ffc5b290b73ca67bdb762ba7849075a83f07fe2773a22
+size 156826

original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_vae_decoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1fc0794d5ffad51b5599d2e978ee3351638edeab6753a3f6e5453fa612772286
+size 98993280

original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_vae_decoder.mlpackage/Manifest.json ADDED Viewed

	@@ -0,0 +1,18 @@

+{
+    "fileFormatVersion": "1.0.0",
+    "itemInfoEntries": {
+        "CDEF2CCF-0ABB-4574-A995-095B2C7DEA9F": {
+            "author": "com.apple.CoreML",
+            "description": "CoreML Model Weights",
+            "name": "weights",
+            "path": "com.apple.CoreML/weights"
+        },
+        "DF6E69CD-88D9-4A19-B45F-560BE165DF49": {
+            "author": "com.apple.CoreML",
+            "description": "CoreML Model Specification",
+            "name": "model.mlmodel",
+            "path": "com.apple.CoreML/model.mlmodel"
+        }
+    },
+    "rootModelIdentifier": "DF6E69CD-88D9-4A19-B45F-560BE165DF49"
+}

original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_vae_encoder.mlpackage/Data/com.apple.CoreML/model.mlmodel ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:150f221a9c11ffe64367885a3c0883bab651342aea45743234df4881c9c6091b
+size 120695

original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_vae_encoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6f2d9d29b46a29008068665a44b921c661baea9be0443e1ff5bf12cd7032e516
+size 68338112

original/packages/Stable_Diffusion_version_stabilityai_stable-diffusion-2-1-base_vae_encoder.mlpackage/Manifest.json ADDED Viewed

	@@ -0,0 +1,18 @@

+{
+    "fileFormatVersion": "1.0.0",
+    "itemInfoEntries": {
+        "020F5B51-5C87-41D5-80DF-5325AF2B6675": {
+            "author": "com.apple.CoreML",
+            "description": "CoreML Model Specification",
+            "name": "model.mlmodel",
+            "path": "com.apple.CoreML/model.mlmodel"
+        },
+        "4904B9B1-0D93-46AC-A850-C57C42392CA7": {
+            "author": "com.apple.CoreML",
+            "description": "CoreML Model Weights",
+            "name": "weights",
+            "path": "com.apple.CoreML/weights"
+        }
+    },
+    "rootModelIdentifier": "020F5B51-5C87-41D5-80DF-5325AF2B6675"
+}

split_einsum_v2/compiled/TextEncoder.mlmodelc/analytics/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a26bdd792e919ca3412c0685e74ea507a6de835532f0ec58d780c99b0a7a0193
+size 207

split_einsum_v2/compiled/TextEncoder.mlmodelc/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2f0484a1a04e023da06787de4140cf215f9ccd67f93d916dc388b846d8607899
+size 839

split_einsum_v2/compiled/TextEncoder.mlmodelc/metadata.json ADDED Viewed

	@@ -0,0 +1,83 @@

+[
+  {
+    "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
+    "metadataOutputVersion" : "3.0",
+    "outputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32)",
+        "shortDescription" : "The token embeddings as encoded by the Transformer model",
+        "shape" : "[]",
+        "name" : "last_hidden_state",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32)",
+        "shortDescription" : "The version of the `last_hidden_state` output after pooling",
+        "shape" : "[]",
+        "name" : "pooled_outputs",
+        "type" : "MultiArray"
+      }
+    ],
+    "version" : "stabilityai\/stable-diffusion-2-1-base",
+    "modelParameters" : [
+    ],
+    "author" : "Please refer to the Model Card available at huggingface.co\/stabilityai\/stable-diffusion-2-1-base",
+    "specificationVersion" : 7,
+    "storagePrecision" : "Mixed (Float16, Palettized (6 bits))",
+    "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
+    "mlProgramOperationTypeHistogram" : {
+      "Ios16.cast" : 3,
+      "Ios16.mul" : 23,
+      "Ios16.layerNorm" : 47,
+      "Ios16.constexprLutToDense" : 163,
+      "Stack" : 1,
+      "Transpose" : 115,
+      "Ios16.linear" : 138,
+      "Ios16.add" : 70,
+      "Ios16.matmul" : 46,
+      "Ios16.gelu" : 23,
+      "Ios16.softmax" : 23,
+      "Ios16.gatherNd" : 1,
+      "Ios16.gather" : 1,
+      "Ios16.reshape" : 230,
+      "Ios16.reduceArgmax" : 1
+    },
+    "computePrecision" : "Mixed (Float16, Float32, Int32)",
+    "isUpdatable" : "0",
+    "availability" : {
+      "macOS" : "13.0",
+      "tvOS" : "16.0",
+      "watchOS" : "9.0",
+      "iOS" : "16.0",
+      "macCatalyst" : "16.0"
+    },
+    "modelType" : {
+      "name" : "MLModelType_mlProgram"
+    },
+    "inputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32 1 × 77)",
+        "shortDescription" : "The token ids that represent the input text",
+        "shape" : "[1, 77]",
+        "name" : "input_ids",
+        "type" : "MultiArray"
+      }
+    ],
+    "userDefinedMetadata" : {
+      "com.github.apple.coremltools.version" : "7.0b1",
+      "com.github.apple.coremltools.source" : "torch==2.0.1"
+    },
+    "generatedClassName" : "Stable_Diffusion_version_stabilityai_stable_diffusion_2_1_base_text_encoder",
+    "method" : "predict"
+  }
+]

split_einsum_v2/compiled/TextEncoder.mlmodelc/model.mil ADDED Viewed

The diff for this file is too large to render. See raw diff

split_einsum_v2/compiled/TextEncoder.mlmodelc/weights/weight.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3be3ff19e2ed53774d8c4c22f58bb4f9d37a44c2d6d34955e72decef86aa8615
+size 318860352

split_einsum_v2/compiled/Unet.mlmodelc/analytics/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7432befba40c728344d55ededaedcbeebf04eca023437afb4418e655515c066c
+size 207

split_einsum_v2/compiled/Unet.mlmodelc/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5bc742d03b80b46feaa6f9e2159a5c89acda3ed2c1562f2b4f781bb7bfbce110
+size 1221

split_einsum_v2/compiled/Unet.mlmodelc/metadata.json ADDED Viewed

	@@ -0,0 +1,103 @@

+[
+  {
+    "shortDescription" : "Stable Diffusion generates images conditioned on text or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
+    "metadataOutputVersion" : "3.0",
+    "outputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32)",
+        "shortDescription" : "Same shape and dtype as the `sample` input. The predicted noise to facilitate the reverse diffusion (denoising) process",
+        "shape" : "[]",
+        "name" : "noise_pred",
+        "type" : "MultiArray"
+      }
+    ],
+    "version" : "stabilityai\/stable-diffusion-2-1-base",
+    "modelParameters" : [
+    ],
+    "author" : "Please refer to the Model Card available at huggingface.co\/stabilityai\/stable-diffusion-2-1-base",
+    "specificationVersion" : 7,
+    "storagePrecision" : "Mixed (Float16, Palettized (6 bits))",
+    "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
+    "mlProgramOperationTypeHistogram" : {
+      "Transpose" : 32,
+      "UpsampleNearestNeighbor" : 3,
+      "Ios16.reduceMean" : 218,
+      "Ios16.sin" : 1,
+      "Ios16.softmax" : 840,
+      "Split" : 16,
+      "Ios16.add" : 265,
+      "Concat" : 196,
+      "Ios16.realDiv" : 61,
+      "Ios16.square" : 61,
+      "ExpandDims" : 3,
+      "Ios16.sub" : 109,
+      "Ios16.cast" : 1,
+      "Ios16.conv" : 282,
+      "Ios16.constexprLutToDense" : 310,
+      "Ios16.einsum" : 1680,
+      "Ios16.gelu" : 16,
+      "Ios16.batchNorm" : 61,
+      "Ios16.reshape" : 154,
+      "Ios16.rsqrt" : 48,
+      "Ios16.silu" : 47,
+      "Ios16.sqrt" : 61,
+      "Ios16.mul" : 1001,
+      "Ios16.cos" : 1,
+      "SliceByIndex" : 1772
+    },
+    "computePrecision" : "Mixed (Float16, Float32, Int32)",
+    "isUpdatable" : "0",
+    "availability" : {
+      "macOS" : "13.0",
+      "tvOS" : "16.0",
+      "watchOS" : "9.0",
+      "iOS" : "16.0",
+      "macCatalyst" : "16.0"
+    },
+    "modelType" : {
+      "name" : "MLModelType_mlProgram"
+    },
+    "inputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 2 × 4 × 64 × 64)",
+        "shortDescription" : "The low resolution latent feature maps being denoised through reverse diffusion",
+        "shape" : "[2, 4, 64, 64]",
+        "name" : "sample",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 2)",
+        "shortDescription" : "A value emitted by the associated scheduler object to condition the model on a given noise schedule",
+        "shape" : "[2]",
+        "name" : "timestep",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 2 × 1024 × 1 × 77)",
+        "shortDescription" : "Output embeddings from the associated text_encoder model to condition the generated image on text. A maximum of 77 tokens (~40 words) are allowed. Longer text is truncated. Shorter text does not reduce computation.",
+        "shape" : "[2, 1024, 1, 77]",
+        "name" : "encoder_hidden_states",
+        "type" : "MultiArray"
+      }
+    ],
+    "userDefinedMetadata" : {
+      "com.github.apple.coremltools.version" : "7.0b1",
+      "com.github.apple.coremltools.source" : "torch==2.0.1"
+    },
+    "generatedClassName" : "Stable_Diffusion_version_stabilityai_stable_diffusion_2_1_base_unet",
+    "method" : "predict"
+  }
+]

split_einsum_v2/compiled/Unet.mlmodelc/model.mil ADDED Viewed

The diff for this file is too large to render. See raw diff

split_einsum_v2/compiled/Unet.mlmodelc/weights/weight.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a4bfeb078744274ac2000593ae80522c8e3363bec8a4cf5e35ef93e3f7b14056
+size 649959936

split_einsum_v2/compiled/VAEDecoder.mlmodelc/analytics/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:682f30dbd27b8c96fae9dd5d7cec36e85812e370cc2a920d9a6cef7a908e29d3
+size 207

split_einsum_v2/compiled/VAEDecoder.mlmodelc/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:57555bee9ff5d60c5b6fd48564eac43523d954a2d34101273b8e3fa8f1aee3d0
+size 769

split_einsum_v2/compiled/VAEDecoder.mlmodelc/metadata.json ADDED Viewed

	@@ -0,0 +1,75 @@

+[
+  {
+    "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
+    "metadataOutputVersion" : "3.0",
+    "outputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32)",
+        "shortDescription" : "Generated image normalized to range [-1, 1]",
+        "shape" : "[]",
+        "name" : "image",
+        "type" : "MultiArray"
+      }
+    ],
+    "version" : "stabilityai\/stable-diffusion-2-1-base",
+    "modelParameters" : [
+    ],
+    "author" : "Please refer to the Model Card available at huggingface.co\/stabilityai\/stable-diffusion-2-1-base",
+    "specificationVersion" : 7,
+    "storagePrecision" : "Float16",
+    "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
+    "mlProgramOperationTypeHistogram" : {
+      "Ios16.cast" : 1,
+      "Ios16.mul" : 1,
+      "Ios16.sqrt" : 30,
+      "Ios16.sub" : 30,
+      "Transpose" : 7,
+      "UpsampleNearestNeighbor" : 3,
+      "Ios16.conv" : 36,
+      "Ios16.add" : 45,
+      "Ios16.linear" : 4,
+      "Ios16.matmul" : 2,
+      "Ios16.realDiv" : 30,
+      "Ios16.reduceMean" : 60,
+      "Ios16.softmax" : 1,
+      "Ios16.batchNorm" : 30,
+      "Ios16.square" : 30,
+      "Ios16.reshape" : 70,
+      "Ios16.silu" : 29
+    },
+    "computePrecision" : "Mixed (Float16, Float32, Int32)",
+    "isUpdatable" : "0",
+    "availability" : {
+      "macOS" : "13.0",
+      "tvOS" : "16.0",
+      "watchOS" : "9.0",
+      "iOS" : "16.0",
+      "macCatalyst" : "16.0"
+    },
+    "modelType" : {
+      "name" : "MLModelType_mlProgram"
+    },
+    "inputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 1 × 4 × 64 × 64)",
+        "shortDescription" : "The denoised latent embeddings from the unet model after the last step of reverse diffusion",
+        "shape" : "[1, 4, 64, 64]",
+        "name" : "z",
+        "type" : "MultiArray"
+      }
+    ],
+    "userDefinedMetadata" : {
+      "com.github.apple.coremltools.version" : "7.0b1",
+      "com.github.apple.coremltools.source" : "torch==2.0.1"
+    },
+    "generatedClassName" : "Stable_Diffusion_version_stabilityai_stable_diffusion_2_1_base_vae_decoder",
+    "method" : "predict"
+  }
+]

split_einsum_v2/compiled/VAEDecoder.mlmodelc/model.mil ADDED Viewed

The diff for this file is too large to render. See raw diff