adds bundle resources for split_einsum_v2 version of the model

Browse files

Files changed (17) hide show

split_einsum_v2/Resources/TextEncoder.mlmodelc/analytics/coremldata.bin +3 -0
split_einsum_v2/Resources/TextEncoder.mlmodelc/coremldata.bin +3 -0
split_einsum_v2/Resources/TextEncoder.mlmodelc/metadata.json +84 -0
split_einsum_v2/Resources/TextEncoder.mlmodelc/model.mil +0 -0
split_einsum_v2/Resources/TextEncoder.mlmodelc/weights/weight.bin +3 -0
split_einsum_v2/Resources/Unet.mlmodelc/analytics/coremldata.bin +3 -0
split_einsum_v2/Resources/Unet.mlmodelc/coremldata.bin +3 -0
split_einsum_v2/Resources/Unet.mlmodelc/metadata.json +105 -0
split_einsum_v2/Resources/Unet.mlmodelc/model.mil +0 -0
split_einsum_v2/Resources/Unet.mlmodelc/weights/weight.bin +3 -0
split_einsum_v2/Resources/VAEDecoder.mlmodelc/analytics/coremldata.bin +3 -0
split_einsum_v2/Resources/VAEDecoder.mlmodelc/coremldata.bin +3 -0
split_einsum_v2/Resources/VAEDecoder.mlmodelc/metadata.json +76 -0
split_einsum_v2/Resources/VAEDecoder.mlmodelc/model.mil +0 -0
split_einsum_v2/Resources/VAEDecoder.mlmodelc/weights/weight.bin +3 -0
split_einsum_v2/Resources/merges.txt +0 -0
split_einsum_v2/Resources/vocab.json +0 -0

split_einsum_v2/Resources/TextEncoder.mlmodelc/analytics/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0ee238459cac95d6ad3417d5e458417c1be2ce57f41c4974bb51491fed4e179a
+size 243

split_einsum_v2/Resources/TextEncoder.mlmodelc/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8947814e2b89c777ee684effb9f7cd481b85bd5f9a0e384e06b6b5b73642a416
+size 889

split_einsum_v2/Resources/TextEncoder.mlmodelc/metadata.json ADDED Viewed

	@@ -0,0 +1,84 @@

+[
+  {
+    "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
+    "metadataOutputVersion" : "3.0",
+    "outputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32 1 × 77 × 768)",
+        "shortDescription" : "The token embeddings as encoded by the Transformer model",
+        "shape" : "[1, 77, 768]",
+        "name" : "last_hidden_state",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32 1 × 768)",
+        "shortDescription" : "The version of the `last_hidden_state` output after pooling",
+        "shape" : "[1, 768]",
+        "name" : "pooled_outputs",
+        "type" : "MultiArray"
+      }
+    ],
+    "version" : "wavymulder\/Analog-Diffusion",
+    "modelParameters" : [
+    ],
+    "author" : "Please refer to the Model Card available at huggingface.co\/wavymulder\/Analog-Diffusion",
+    "specificationVersion" : 7,
+    "storagePrecision" : "Float16",
+    "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
+    "mlProgramOperationTypeHistogram" : {
+      "Ios16.cast" : 3,
+      "Ios16.mul" : 36,
+      "Ios16.layerNorm" : 25,
+      "Stack" : 1,
+      "Transpose" : 48,
+      "Ios16.sigmoid" : 12,
+      "Ios16.linear" : 72,
+      "Ios16.add" : 37,
+      "Ios16.matmul" : 24,
+      "Ios16.softmax" : 12,
+      "Ios16.gatherNd" : 1,
+      "Ios16.gather" : 1,
+      "Ios16.reshape" : 120,
+      "Ios16.reduceArgmax" : 1
+    },
+    "computePrecision" : "Mixed (Float16, Float32, Int32)",
+    "isUpdatable" : "0",
+    "availability" : {
+      "macOS" : "13.0",
+      "tvOS" : "16.0",
+      "visionOS" : "1.0",
+      "watchOS" : "9.0",
+      "iOS" : "16.0",
+      "macCatalyst" : "16.0"
+    },
+    "modelType" : {
+      "name" : "MLModelType_mlProgram"
+    },
+    "inputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32 1 × 77)",
+        "shortDescription" : "The token ids that represent the input text",
+        "shape" : "[1, 77]",
+        "name" : "input_ids",
+        "type" : "MultiArray"
+      }
+    ],
+    "userDefinedMetadata" : {
+      "com.github.apple.coremltools.source_dialect" : "TorchScript",
+      "com.github.apple.coremltools.source" : "torch==2.2.0",
+      "com.github.apple.coremltools.version" : "7.2"
+    },
+    "generatedClassName" : "Stable_Diffusion_version_wavymulder_Analog_Diffusion_text_encoder",
+    "method" : "predict"
+  }
+]

split_einsum_v2/Resources/TextEncoder.mlmodelc/model.mil ADDED Viewed

The diff for this file is too large to render. See raw diff

split_einsum_v2/Resources/TextEncoder.mlmodelc/weights/weight.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:be0a4ff787df1627fc5d1627817eb745ec09e0d47b574c39293d12871ecaa961
+size 246145536

split_einsum_v2/Resources/Unet.mlmodelc/analytics/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:31a187a2eaab48fcc9d654359900bbabf8bfc8537a7bff7226ff6886e6ee8661
+size 243

split_einsum_v2/Resources/Unet.mlmodelc/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2038763af87361e253dd1e6d314252b8bf496dca7ed4ec96a8ddc72ce60283b1
+size 1322

split_einsum_v2/Resources/Unet.mlmodelc/metadata.json ADDED Viewed

	@@ -0,0 +1,105 @@

+[
+  {
+    "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
+    "metadataOutputVersion" : "3.0",
+    "outputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32 2 × 4 × 64 × 64)",
+        "shortDescription" : "Same shape and dtype as the `sample` input. The predicted noise to facilitate the reverse diffusion (denoising) process",
+        "shape" : "[2, 4, 64, 64]",
+        "name" : "noise_pred",
+        "type" : "MultiArray"
+      }
+    ],
+    "version" : "wavymulder\/Analog-Diffusion",
+    "modelParameters" : [
+    ],
+    "author" : "Please refer to the Model Card available at huggingface.co\/wavymulder\/Analog-Diffusion",
+    "specificationVersion" : 7,
+    "storagePrecision" : "Float16",
+    "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
+    "mlProgramOperationTypeHistogram" : {
+      "Transpose" : 32,
+      "UpsampleNearestNeighbor" : 3,
+      "Ios16.reduceMean" : 122,
+      "Ios16.sin" : 1,
+      "Ios16.softmax" : 896,
+      "Split" : 16,
+      "Ios16.add" : 169,
+      "Concat" : 206,
+      "Ios16.realDiv" : 61,
+      "Ios16.square" : 61,
+      "ExpandDims" : 3,
+      "Ios16.sub" : 61,
+      "Ios16.cast" : 1,
+      "Ios16.conv" : 282,
+      "Ios16.einsum" : 1792,
+      "Ios16.gelu" : 16,
+      "Ios16.layerNorm" : 48,
+      "Ios16.batchNorm" : 61,
+      "Ios16.reshape" : 154,
+      "Ios16.silu" : 47,
+      "Ios16.sqrt" : 61,
+      "SliceByIndex" : 1570,
+      "Ios16.mul" : 913,
+      "Ios16.cos" : 1
+    },
+    "computePrecision" : "Mixed (Float16, Float32, Int32)",
+    "isUpdatable" : "0",
+    "availability" : {
+      "macOS" : "13.0",
+      "tvOS" : "16.0",
+      "visionOS" : "1.0",
+      "watchOS" : "9.0",
+      "iOS" : "16.0",
+      "macCatalyst" : "16.0"
+    },
+    "modelType" : {
+      "name" : "MLModelType_mlProgram"
+    },
+    "inputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 2 × 4 × 64 × 64)",
+        "shortDescription" : "The low resolution latent feature maps being denoised through reverse diffusion",
+        "shape" : "[2, 4, 64, 64]",
+        "name" : "sample",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 2)",
+        "shortDescription" : "A value emitted by the associated scheduler object to condition the model on a given noise schedule",
+        "shape" : "[2]",
+        "name" : "timestep",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 2 × 768 × 1 × 77)",
+        "shortDescription" : "Output embeddings from the associated text_encoder model to condition the generated image on text. A maximum of 77 tokens (~40 words) are allowed. Longer text is truncated. Shorter text does not reduce computation.",
+        "shape" : "[2, 768, 1, 77]",
+        "name" : "encoder_hidden_states",
+        "type" : "MultiArray"
+      }
+    ],
+    "userDefinedMetadata" : {
+      "com.github.apple.ml-stable-diffusion.version" : "1.1.0",
+      "com.github.apple.coremltools.source" : "torch==2.2.0",
+      "com.github.apple.coremltools.version" : "7.2",
+      "com.github.apple.coremltools.source_dialect" : "TorchScript"
+    },
+    "generatedClassName" : "Stable_Diffusion_version_wavymulder_Analog_Diffusion_unet",
+    "method" : "predict"
+  }
+]

split_einsum_v2/Resources/Unet.mlmodelc/model.mil ADDED Viewed

The diff for this file is too large to render. See raw diff

split_einsum_v2/Resources/Unet.mlmodelc/weights/weight.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7f25879bd54ad589d1085c2a53d6f7285b7c48f89548303e0d6c89f01432f9c8
+size 1719117696

split_einsum_v2/Resources/VAEDecoder.mlmodelc/analytics/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7e3ff162d1108e3dfc5cf1fd787abcd48436ee79f21eb0e83a37743836e8f5c8
+size 243

split_einsum_v2/Resources/VAEDecoder.mlmodelc/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:57030ec7d19bda416ddb0caf678a18a6896ce5292419aa3e91d41d2e44819fc8
+size 842

split_einsum_v2/Resources/VAEDecoder.mlmodelc/metadata.json ADDED Viewed

	@@ -0,0 +1,76 @@

+[
+  {
+    "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
+    "metadataOutputVersion" : "3.0",
+    "outputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32 1 × 3 × 512 × 512)",
+        "shortDescription" : "Generated image normalized to range [-1, 1]",
+        "shape" : "[1, 3, 512, 512]",
+        "name" : "image",
+        "type" : "MultiArray"
+      }
+    ],
+    "version" : "wavymulder\/Analog-Diffusion",
+    "modelParameters" : [
+    ],
+    "author" : "Please refer to the Model Card available at huggingface.co\/wavymulder\/Analog-Diffusion",
+    "specificationVersion" : 7,
+    "storagePrecision" : "Float32",
+    "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
+    "mlProgramOperationTypeHistogram" : {
+      "Ios16.mul" : 2,
+      "Ios16.sqrt" : 30,
+      "Ios16.sub" : 30,
+      "Transpose" : 6,
+      "UpsampleNearestNeighbor" : 3,
+      "Ios16.conv" : 36,
+      "Ios16.add" : 46,
+      "Ios16.linear" : 4,
+      "Ios16.matmul" : 2,
+      "Ios16.realDiv" : 30,
+      "Ios16.reduceMean" : 60,
+      "Ios16.softmax" : 1,
+      "Ios16.batchNorm" : 29,
+      "Ios16.square" : 30,
+      "Ios16.reshape" : 65,
+      "Ios16.silu" : 29
+    },
+    "computePrecision" : "Mixed (Float32, Int32)",
+    "isUpdatable" : "0",
+    "availability" : {
+      "macOS" : "13.0",
+      "tvOS" : "16.0",
+      "visionOS" : "1.0",
+      "watchOS" : "9.0",
+      "iOS" : "16.0",
+      "macCatalyst" : "16.0"
+    },
+    "modelType" : {
+      "name" : "MLModelType_mlProgram"
+    },
+    "inputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32 1 × 4 × 64 × 64)",
+        "shortDescription" : "The denoised latent embeddings from the unet model after the last step of reverse diffusion",
+        "shape" : "[1, 4, 64, 64]",
+        "name" : "z",
+        "type" : "MultiArray"
+      }
+    ],
+    "userDefinedMetadata" : {
+      "com.github.apple.coremltools.source_dialect" : "TorchScript",
+      "com.github.apple.coremltools.source" : "torch==2.2.0",
+      "com.github.apple.coremltools.version" : "7.2"
+    },
+    "generatedClassName" : "Stable_Diffusion_version_wavymulder_Analog_Diffusion_vae_decoder",
+    "method" : "predict"
+  }
+]

split_einsum_v2/Resources/VAEDecoder.mlmodelc/model.mil ADDED Viewed

The diff for this file is too large to render. See raw diff

split_einsum_v2/Resources/VAEDecoder.mlmodelc/weights/weight.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:65c78025e1ffb7ec954fbb878564d0b041186ea08601ce87ea62fb25e356fca5
+size 197977216

split_einsum_v2/Resources/merges.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

split_einsum_v2/Resources/vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff