c2p-cmd committed on
Commit
bf14973
1 Parent(s): 79bcea8

adds bundle resources for split_einsum_v2 version of the model

Browse files
split_einsum_v2/Resources/TextEncoder.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ee238459cac95d6ad3417d5e458417c1be2ce57f41c4974bb51491fed4e179a
3
+ size 243
split_einsum_v2/Resources/TextEncoder.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8947814e2b89c777ee684effb9f7cd481b85bd5f9a0e384e06b6b5b73642a416
3
+ size 889
split_einsum_v2/Resources/TextEncoder.mlmodelc/metadata.json ADDED
@@ -0,0 +1,84 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
4
+ "metadataOutputVersion" : "3.0",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float32",
10
+ "formattedType" : "MultiArray (Float32 1 × 77 × 768)",
11
+ "shortDescription" : "The token embeddings as encoded by the Transformer model",
12
+ "shape" : "[1, 77, 768]",
13
+ "name" : "last_hidden_state",
14
+ "type" : "MultiArray"
15
+ },
16
+ {
17
+ "hasShapeFlexibility" : "0",
18
+ "isOptional" : "0",
19
+ "dataType" : "Float32",
20
+ "formattedType" : "MultiArray (Float32 1 × 768)",
21
+ "shortDescription" : "The version of the `last_hidden_state` output after pooling",
22
+ "shape" : "[1, 768]",
23
+ "name" : "pooled_outputs",
24
+ "type" : "MultiArray"
25
+ }
26
+ ],
27
+ "version" : "wavymulder\/Analog-Diffusion",
28
+ "modelParameters" : [
29
+
30
+ ],
31
+ "author" : "Please refer to the Model Card available at huggingface.co\/wavymulder\/Analog-Diffusion",
32
+ "specificationVersion" : 7,
33
+ "storagePrecision" : "Float16",
34
+ "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
35
+ "mlProgramOperationTypeHistogram" : {
36
+ "Ios16.cast" : 3,
37
+ "Ios16.mul" : 36,
38
+ "Ios16.layerNorm" : 25,
39
+ "Stack" : 1,
40
+ "Transpose" : 48,
41
+ "Ios16.sigmoid" : 12,
42
+ "Ios16.linear" : 72,
43
+ "Ios16.add" : 37,
44
+ "Ios16.matmul" : 24,
45
+ "Ios16.softmax" : 12,
46
+ "Ios16.gatherNd" : 1,
47
+ "Ios16.gather" : 1,
48
+ "Ios16.reshape" : 120,
49
+ "Ios16.reduceArgmax" : 1
50
+ },
51
+ "computePrecision" : "Mixed (Float16, Float32, Int32)",
52
+ "isUpdatable" : "0",
53
+ "availability" : {
54
+ "macOS" : "13.0",
55
+ "tvOS" : "16.0",
56
+ "visionOS" : "1.0",
57
+ "watchOS" : "9.0",
58
+ "iOS" : "16.0",
59
+ "macCatalyst" : "16.0"
60
+ },
61
+ "modelType" : {
62
+ "name" : "MLModelType_mlProgram"
63
+ },
64
+ "inputSchema" : [
65
+ {
66
+ "hasShapeFlexibility" : "0",
67
+ "isOptional" : "0",
68
+ "dataType" : "Float32",
69
+ "formattedType" : "MultiArray (Float32 1 × 77)",
70
+ "shortDescription" : "The token ids that represent the input text",
71
+ "shape" : "[1, 77]",
72
+ "name" : "input_ids",
73
+ "type" : "MultiArray"
74
+ }
75
+ ],
76
+ "userDefinedMetadata" : {
77
+ "com.github.apple.coremltools.source_dialect" : "TorchScript",
78
+ "com.github.apple.coremltools.source" : "torch==2.2.0",
79
+ "com.github.apple.coremltools.version" : "7.2"
80
+ },
81
+ "generatedClassName" : "Stable_Diffusion_version_wavymulder_Analog_Diffusion_text_encoder",
82
+ "method" : "predict"
83
+ }
84
+ ]
split_einsum_v2/Resources/TextEncoder.mlmodelc/model.mil ADDED
The diff for this file is too large to render. See raw diff
 
split_einsum_v2/Resources/TextEncoder.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be0a4ff787df1627fc5d1627817eb745ec09e0d47b574c39293d12871ecaa961
3
+ size 246145536
split_einsum_v2/Resources/Unet.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31a187a2eaab48fcc9d654359900bbabf8bfc8537a7bff7226ff6886e6ee8661
3
+ size 243
split_einsum_v2/Resources/Unet.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2038763af87361e253dd1e6d314252b8bf496dca7ed4ec96a8ddc72ce60283b1
3
+ size 1322
split_einsum_v2/Resources/Unet.mlmodelc/metadata.json ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
4
+ "metadataOutputVersion" : "3.0",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float32",
10
+ "formattedType" : "MultiArray (Float32 2 × 4 × 64 × 64)",
11
+ "shortDescription" : "Same shape and dtype as the `sample` input. The predicted noise to facilitate the reverse diffusion (denoising) process",
12
+ "shape" : "[2, 4, 64, 64]",
13
+ "name" : "noise_pred",
14
+ "type" : "MultiArray"
15
+ }
16
+ ],
17
+ "version" : "wavymulder\/Analog-Diffusion",
18
+ "modelParameters" : [
19
+
20
+ ],
21
+ "author" : "Please refer to the Model Card available at huggingface.co\/wavymulder\/Analog-Diffusion",
22
+ "specificationVersion" : 7,
23
+ "storagePrecision" : "Float16",
24
+ "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
25
+ "mlProgramOperationTypeHistogram" : {
26
+ "Transpose" : 32,
27
+ "UpsampleNearestNeighbor" : 3,
28
+ "Ios16.reduceMean" : 122,
29
+ "Ios16.sin" : 1,
30
+ "Ios16.softmax" : 896,
31
+ "Split" : 16,
32
+ "Ios16.add" : 169,
33
+ "Concat" : 206,
34
+ "Ios16.realDiv" : 61,
35
+ "Ios16.square" : 61,
36
+ "ExpandDims" : 3,
37
+ "Ios16.sub" : 61,
38
+ "Ios16.cast" : 1,
39
+ "Ios16.conv" : 282,
40
+ "Ios16.einsum" : 1792,
41
+ "Ios16.gelu" : 16,
42
+ "Ios16.layerNorm" : 48,
43
+ "Ios16.batchNorm" : 61,
44
+ "Ios16.reshape" : 154,
45
+ "Ios16.silu" : 47,
46
+ "Ios16.sqrt" : 61,
47
+ "SliceByIndex" : 1570,
48
+ "Ios16.mul" : 913,
49
+ "Ios16.cos" : 1
50
+ },
51
+ "computePrecision" : "Mixed (Float16, Float32, Int32)",
52
+ "isUpdatable" : "0",
53
+ "availability" : {
54
+ "macOS" : "13.0",
55
+ "tvOS" : "16.0",
56
+ "visionOS" : "1.0",
57
+ "watchOS" : "9.0",
58
+ "iOS" : "16.0",
59
+ "macCatalyst" : "16.0"
60
+ },
61
+ "modelType" : {
62
+ "name" : "MLModelType_mlProgram"
63
+ },
64
+ "inputSchema" : [
65
+ {
66
+ "hasShapeFlexibility" : "0",
67
+ "isOptional" : "0",
68
+ "dataType" : "Float16",
69
+ "formattedType" : "MultiArray (Float16 2 × 4 × 64 × 64)",
70
+ "shortDescription" : "The low resolution latent feature maps being denoised through reverse diffusion",
71
+ "shape" : "[2, 4, 64, 64]",
72
+ "name" : "sample",
73
+ "type" : "MultiArray"
74
+ },
75
+ {
76
+ "hasShapeFlexibility" : "0",
77
+ "isOptional" : "0",
78
+ "dataType" : "Float16",
79
+ "formattedType" : "MultiArray (Float16 2)",
80
+ "shortDescription" : "A value emitted by the associated scheduler object to condition the model on a given noise schedule",
81
+ "shape" : "[2]",
82
+ "name" : "timestep",
83
+ "type" : "MultiArray"
84
+ },
85
+ {
86
+ "hasShapeFlexibility" : "0",
87
+ "isOptional" : "0",
88
+ "dataType" : "Float16",
89
+ "formattedType" : "MultiArray (Float16 2 × 768 × 1 × 77)",
90
+ "shortDescription" : "Output embeddings from the associated text_encoder model to condition the generated image on text. A maximum of 77 tokens (~40 words) are allowed. Longer text is truncated. Shorter text does not reduce computation.",
91
+ "shape" : "[2, 768, 1, 77]",
92
+ "name" : "encoder_hidden_states",
93
+ "type" : "MultiArray"
94
+ }
95
+ ],
96
+ "userDefinedMetadata" : {
97
+ "com.github.apple.ml-stable-diffusion.version" : "1.1.0",
98
+ "com.github.apple.coremltools.source" : "torch==2.2.0",
99
+ "com.github.apple.coremltools.version" : "7.2",
100
+ "com.github.apple.coremltools.source_dialect" : "TorchScript"
101
+ },
102
+ "generatedClassName" : "Stable_Diffusion_version_wavymulder_Analog_Diffusion_unet",
103
+ "method" : "predict"
104
+ }
105
+ ]
split_einsum_v2/Resources/Unet.mlmodelc/model.mil ADDED
The diff for this file is too large to render. See raw diff
 
split_einsum_v2/Resources/Unet.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f25879bd54ad589d1085c2a53d6f7285b7c48f89548303e0d6c89f01432f9c8
3
+ size 1719117696
split_einsum_v2/Resources/VAEDecoder.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e3ff162d1108e3dfc5cf1fd787abcd48436ee79f21eb0e83a37743836e8f5c8
3
+ size 243
split_einsum_v2/Resources/VAEDecoder.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57030ec7d19bda416ddb0caf678a18a6896ce5292419aa3e91d41d2e44819fc8
3
+ size 842
split_einsum_v2/Resources/VAEDecoder.mlmodelc/metadata.json ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
4
+ "metadataOutputVersion" : "3.0",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float32",
10
+ "formattedType" : "MultiArray (Float32 1 × 3 × 512 × 512)",
11
+ "shortDescription" : "Generated image normalized to range [-1, 1]",
12
+ "shape" : "[1, 3, 512, 512]",
13
+ "name" : "image",
14
+ "type" : "MultiArray"
15
+ }
16
+ ],
17
+ "version" : "wavymulder\/Analog-Diffusion",
18
+ "modelParameters" : [
19
+
20
+ ],
21
+ "author" : "Please refer to the Model Card available at huggingface.co\/wavymulder\/Analog-Diffusion",
22
+ "specificationVersion" : 7,
23
+ "storagePrecision" : "Float32",
24
+ "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
25
+ "mlProgramOperationTypeHistogram" : {
26
+ "Ios16.mul" : 2,
27
+ "Ios16.sqrt" : 30,
28
+ "Ios16.sub" : 30,
29
+ "Transpose" : 6,
30
+ "UpsampleNearestNeighbor" : 3,
31
+ "Ios16.conv" : 36,
32
+ "Ios16.add" : 46,
33
+ "Ios16.linear" : 4,
34
+ "Ios16.matmul" : 2,
35
+ "Ios16.realDiv" : 30,
36
+ "Ios16.reduceMean" : 60,
37
+ "Ios16.softmax" : 1,
38
+ "Ios16.batchNorm" : 29,
39
+ "Ios16.square" : 30,
40
+ "Ios16.reshape" : 65,
41
+ "Ios16.silu" : 29
42
+ },
43
+ "computePrecision" : "Mixed (Float32, Int32)",
44
+ "isUpdatable" : "0",
45
+ "availability" : {
46
+ "macOS" : "13.0",
47
+ "tvOS" : "16.0",
48
+ "visionOS" : "1.0",
49
+ "watchOS" : "9.0",
50
+ "iOS" : "16.0",
51
+ "macCatalyst" : "16.0"
52
+ },
53
+ "modelType" : {
54
+ "name" : "MLModelType_mlProgram"
55
+ },
56
+ "inputSchema" : [
57
+ {
58
+ "hasShapeFlexibility" : "0",
59
+ "isOptional" : "0",
60
+ "dataType" : "Float32",
61
+ "formattedType" : "MultiArray (Float32 1 × 4 × 64 × 64)",
62
+ "shortDescription" : "The denoised latent embeddings from the unet model after the last step of reverse diffusion",
63
+ "shape" : "[1, 4, 64, 64]",
64
+ "name" : "z",
65
+ "type" : "MultiArray"
66
+ }
67
+ ],
68
+ "userDefinedMetadata" : {
69
+ "com.github.apple.coremltools.source_dialect" : "TorchScript",
70
+ "com.github.apple.coremltools.source" : "torch==2.2.0",
71
+ "com.github.apple.coremltools.version" : "7.2"
72
+ },
73
+ "generatedClassName" : "Stable_Diffusion_version_wavymulder_Analog_Diffusion_vae_decoder",
74
+ "method" : "predict"
75
+ }
76
+ ]
split_einsum_v2/Resources/VAEDecoder.mlmodelc/model.mil ADDED
The diff for this file is too large to render. See raw diff
 
split_einsum_v2/Resources/VAEDecoder.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65c78025e1ffb7ec954fbb878564d0b041186ea08601ce87ea62fb25e356fca5
3
+ size 197977216
split_einsum_v2/Resources/merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
split_einsum_v2/Resources/vocab.json ADDED
The diff for this file is too large to render. See raw diff