jblalock30 commited on
Commit
7f5979d
1 Parent(s): cb99a64

Upload folder using huggingface_hub

Browse files
Files changed (22) hide show
  1. sd-turbo/compiled/quantize-2-bit/ORIGINAL/TextEncoder.mlmodelc/analytics/coremldata.bin +3 -0
  2. sd-turbo/compiled/quantize-2-bit/ORIGINAL/TextEncoder.mlmodelc/coremldata.bin +3 -0
  3. sd-turbo/compiled/quantize-2-bit/ORIGINAL/TextEncoder.mlmodelc/metadata.json +85 -0
  4. sd-turbo/compiled/quantize-2-bit/ORIGINAL/TextEncoder.mlmodelc/model.mil +0 -0
  5. sd-turbo/compiled/quantize-2-bit/ORIGINAL/Unet.mlmodelc/analytics/coremldata.bin +3 -0
  6. sd-turbo/compiled/quantize-2-bit/ORIGINAL/Unet.mlmodelc/coremldata.bin +3 -0
  7. sd-turbo/compiled/quantize-2-bit/ORIGINAL/Unet.mlmodelc/metadata.json +105 -0
  8. sd-turbo/compiled/quantize-2-bit/ORIGINAL/Unet.mlmodelc/model.mil +0 -0
  9. sd-turbo/compiled/quantize-2-bit/ORIGINAL/UnetChunk1.mlmodelc/analytics/coremldata.bin +3 -0
  10. sd-turbo/compiled/quantize-2-bit/ORIGINAL/UnetChunk1.mlmodelc/coremldata.bin +3 -0
  11. sd-turbo/compiled/quantize-2-bit/ORIGINAL/UnetChunk1.mlmodelc/metadata.json +217 -0
  12. sd-turbo/compiled/quantize-2-bit/ORIGINAL/UnetChunk1.mlmodelc/model.mil +0 -0
  13. sd-turbo/compiled/quantize-2-bit/ORIGINAL/UnetChunk2.mlmodelc/analytics/coremldata.bin +3 -0
  14. sd-turbo/compiled/quantize-2-bit/ORIGINAL/UnetChunk2.mlmodelc/coremldata.bin +3 -0
  15. sd-turbo/compiled/quantize-2-bit/ORIGINAL/UnetChunk2.mlmodelc/metadata.json +204 -0
  16. sd-turbo/compiled/quantize-2-bit/ORIGINAL/UnetChunk2.mlmodelc/model.mil +0 -0
  17. sd-turbo/compiled/quantize-2-bit/ORIGINAL/VAEDecoder.mlmodelc/analytics/coremldata.bin +3 -0
  18. sd-turbo/compiled/quantize-2-bit/ORIGINAL/VAEDecoder.mlmodelc/coremldata.bin +3 -0
  19. sd-turbo/compiled/quantize-2-bit/ORIGINAL/VAEDecoder.mlmodelc/metadata.json +77 -0
  20. sd-turbo/compiled/quantize-2-bit/ORIGINAL/VAEDecoder.mlmodelc/model.mil +0 -0
  21. sd-turbo/compiled/quantize-2-bit/ORIGINAL/merges.txt +0 -0
  22. sd-turbo/compiled/quantize-2-bit/ORIGINAL/vocab.json +0 -0
sd-turbo/compiled/quantize-2-bit/ORIGINAL/TextEncoder.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8dc74ba7028c27f065c92303e1521672070188d27652a0fd65174028d1074bf7
3
+ size 243
sd-turbo/compiled/quantize-2-bit/ORIGINAL/TextEncoder.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2adfe4b49c2fe0d0d254ce00efa7586387a556936b356b87818b7b52dc97a8b
3
+ size 881
sd-turbo/compiled/quantize-2-bit/ORIGINAL/TextEncoder.mlmodelc/metadata.json ADDED
@@ -0,0 +1,85 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
4
+ "metadataOutputVersion" : "3.0",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float32",
10
+ "formattedType" : "MultiArray (Float32 1 × 77 × 1024)",
11
+ "shortDescription" : "The token embeddings as encoded by the Transformer model",
12
+ "shape" : "[1, 77, 1024]",
13
+ "name" : "last_hidden_state",
14
+ "type" : "MultiArray"
15
+ },
16
+ {
17
+ "hasShapeFlexibility" : "0",
18
+ "isOptional" : "0",
19
+ "dataType" : "Float32",
20
+ "formattedType" : "MultiArray (Float32 1 × 1024)",
21
+ "shortDescription" : "The version of the `last_hidden_state` output after pooling",
22
+ "shape" : "[1, 1024]",
23
+ "name" : "pooled_outputs",
24
+ "type" : "MultiArray"
25
+ }
26
+ ],
27
+ "version" : "stabilityai\/sd-turbo",
28
+ "modelParameters" : [
29
+
30
+ ],
31
+ "author" : "Please refer to the Model Card available at huggingface.co\/stabilityai\/sd-turbo",
32
+ "specificationVersion" : 7,
33
+ "storagePrecision" : "Mixed (Float16, Palettized (2 bits))",
34
+ "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
35
+ "mlProgramOperationTypeHistogram" : {
36
+ "Ios16.cast" : 3,
37
+ "Ios16.mul" : 23,
38
+ "Ios16.layerNorm" : 47,
39
+ "Ios16.constexprLutToDense" : 163,
40
+ "Stack" : 1,
41
+ "Transpose" : 115,
42
+ "Ios16.linear" : 138,
43
+ "Ios16.add" : 70,
44
+ "Ios16.matmul" : 46,
45
+ "Ios16.gelu" : 23,
46
+ "Ios16.softmax" : 23,
47
+ "Ios16.gatherNd" : 1,
48
+ "Ios16.gather" : 1,
49
+ "Ios16.reshape" : 230,
50
+ "Ios16.reduceArgmax" : 1
51
+ },
52
+ "computePrecision" : "Mixed (Float16, Float32, Int32)",
53
+ "isUpdatable" : "0",
54
+ "availability" : {
55
+ "macOS" : "13.0",
56
+ "tvOS" : "16.0",
57
+ "visionOS" : "1.0",
58
+ "watchOS" : "9.0",
59
+ "iOS" : "16.0",
60
+ "macCatalyst" : "16.0"
61
+ },
62
+ "modelType" : {
63
+ "name" : "MLModelType_mlProgram"
64
+ },
65
+ "inputSchema" : [
66
+ {
67
+ "hasShapeFlexibility" : "0",
68
+ "isOptional" : "0",
69
+ "dataType" : "Float32",
70
+ "formattedType" : "MultiArray (Float32 1 × 77)",
71
+ "shortDescription" : "The token ids that represent the input text",
72
+ "shape" : "[1, 77]",
73
+ "name" : "input_ids",
74
+ "type" : "MultiArray"
75
+ }
76
+ ],
77
+ "userDefinedMetadata" : {
78
+ "com.github.apple.coremltools.version" : "7.1",
79
+ "com.github.apple.coremltools.source" : "torch==2.1.0+cu121",
80
+ "com.github.apple.coremltools.source_dialect" : "TorchScript"
81
+ },
82
+ "generatedClassName" : "Stable_Diffusion_version_stabilityai_sd_turbo_text_encoder",
83
+ "method" : "predict"
84
+ }
85
+ ]
sd-turbo/compiled/quantize-2-bit/ORIGINAL/TextEncoder.mlmodelc/model.mil ADDED
The diff for this file is too large to render. See raw diff
 
sd-turbo/compiled/quantize-2-bit/ORIGINAL/Unet.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9838025d53a13bd2c2a86b1f9c5eba3a7c70c2a3d04845117b16612cbf79bd99
3
+ size 243
sd-turbo/compiled/quantize-2-bit/ORIGINAL/Unet.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5af13cf115bdd42e40aeffaf2b6e0bf270c837c8edcba344938c66e779520e15
3
+ size 1314
sd-turbo/compiled/quantize-2-bit/ORIGINAL/Unet.mlmodelc/metadata.json ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "shortDescription" : "Stable Diffusion generates images conditioned on text or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
4
+ "metadataOutputVersion" : "3.0",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float32",
10
+ "formattedType" : "MultiArray (Float32 2 × 4 × 64 × 64)",
11
+ "shortDescription" : "Same shape and dtype as the `sample` input. The predicted noise to facilitate the reverse diffusion (denoising) process",
12
+ "shape" : "[2, 4, 64, 64]",
13
+ "name" : "noise_pred",
14
+ "type" : "MultiArray"
15
+ }
16
+ ],
17
+ "version" : "stabilityai\/sd-turbo",
18
+ "modelParameters" : [
19
+
20
+ ],
21
+ "author" : "Please refer to the Model Card available at huggingface.co\/stabilityai\/sd-turbo",
22
+ "specificationVersion" : 7,
23
+ "storagePrecision" : "Mixed (Float16, Palettized (2 bits))",
24
+ "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
25
+ "mlProgramOperationTypeHistogram" : {
26
+ "UpsampleNearestNeighbor" : 3,
27
+ "Ios16.reduceMean" : 218,
28
+ "Ios16.sin" : 1,
29
+ "Ios16.softmax" : 32,
30
+ "Split" : 16,
31
+ "Ios16.add" : 265,
32
+ "Concat" : 14,
33
+ "Ios16.realDiv" : 61,
34
+ "Ios16.square" : 61,
35
+ "ExpandDims" : 3,
36
+ "Ios16.sub" : 109,
37
+ "Ios16.cast" : 1,
38
+ "Ios16.conv" : 282,
39
+ "Ios16.constexprLutToDense" : 310,
40
+ "Ios16.gelu" : 16,
41
+ "Ios16.matmul" : 64,
42
+ "Ios16.batchNorm" : 61,
43
+ "Ios16.reshape" : 282,
44
+ "Ios16.rsqrt" : 48,
45
+ "Ios16.silu" : 47,
46
+ "Ios16.sqrt" : 61,
47
+ "Ios16.mul" : 193,
48
+ "Ios16.cos" : 1,
49
+ "SliceByIndex" : 2
50
+ },
51
+ "computePrecision" : "Mixed (Float16, Float32, Int32)",
52
+ "isUpdatable" : "0",
53
+ "availability" : {
54
+ "macOS" : "13.0",
55
+ "tvOS" : "16.0",
56
+ "visionOS" : "1.0",
57
+ "watchOS" : "9.0",
58
+ "iOS" : "16.0",
59
+ "macCatalyst" : "16.0"
60
+ },
61
+ "modelType" : {
62
+ "name" : "MLModelType_mlProgram"
63
+ },
64
+ "inputSchema" : [
65
+ {
66
+ "hasShapeFlexibility" : "0",
67
+ "isOptional" : "0",
68
+ "dataType" : "Float16",
69
+ "formattedType" : "MultiArray (Float16 2 × 4 × 64 × 64)",
70
+ "shortDescription" : "The low resolution latent feature maps being denoised through reverse diffusion",
71
+ "shape" : "[2, 4, 64, 64]",
72
+ "name" : "sample",
73
+ "type" : "MultiArray"
74
+ },
75
+ {
76
+ "hasShapeFlexibility" : "0",
77
+ "isOptional" : "0",
78
+ "dataType" : "Float16",
79
+ "formattedType" : "MultiArray (Float16 2)",
80
+ "shortDescription" : "A value emitted by the associated scheduler object to condition the model on a given noise schedule",
81
+ "shape" : "[2]",
82
+ "name" : "timestep",
83
+ "type" : "MultiArray"
84
+ },
85
+ {
86
+ "hasShapeFlexibility" : "0",
87
+ "isOptional" : "0",
88
+ "dataType" : "Float16",
89
+ "formattedType" : "MultiArray (Float16 2 × 1024 × 1 × 77)",
90
+ "shortDescription" : "Output embeddings from the associated text_encoder model to condition to generated image on text. A maximum of 77 tokens (~40 words) are allowed. Longer text is truncated. Shorter text does not reduce computation.",
91
+ "shape" : "[2, 1024, 1, 77]",
92
+ "name" : "encoder_hidden_states",
93
+ "type" : "MultiArray"
94
+ }
95
+ ],
96
+ "userDefinedMetadata" : {
97
+ "com.github.apple.ml-stable-diffusion.version" : "1.1.0",
98
+ "com.github.apple.coremltools.source" : "torch==2.1.0+cu121",
99
+ "com.github.apple.coremltools.version" : "7.1",
100
+ "com.github.apple.coremltools.source_dialect" : "TorchScript"
101
+ },
102
+ "generatedClassName" : "Stable_Diffusion_version_stabilityai_sd_turbo_unet",
103
+ "method" : "predict"
104
+ }
105
+ ]
sd-turbo/compiled/quantize-2-bit/ORIGINAL/Unet.mlmodelc/model.mil ADDED
The diff for this file is too large to render. See raw diff
 
sd-turbo/compiled/quantize-2-bit/ORIGINAL/UnetChunk1.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e87e72c6538b66cfd06e87878f7dec702341a5e8bdbedc9f2089ff475489733
3
+ size 243
sd-turbo/compiled/quantize-2-bit/ORIGINAL/UnetChunk1.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:945f6e795739315745e2ed10aeef235b7878018f06faa55a3c1fdfeb56128977
3
+ size 783
sd-turbo/compiled/quantize-2-bit/ORIGINAL/UnetChunk1.mlmodelc/metadata.json ADDED
@@ -0,0 +1,217 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "metadataOutputVersion" : "3.0",
4
+ "storagePrecision" : "Float16",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float32",
10
+ "formattedType" : "MultiArray (Float32 2 × 320 × 64 × 64)",
11
+ "shortDescription" : "",
12
+ "shape" : "[2, 320, 64, 64]",
13
+ "name" : "input_7_cast_fp16",
14
+ "type" : "MultiArray"
15
+ },
16
+ {
17
+ "hasShapeFlexibility" : "0",
18
+ "isOptional" : "0",
19
+ "dataType" : "Float32",
20
+ "formattedType" : "MultiArray (Float32 2 × 320 × 64 × 64)",
21
+ "shortDescription" : "",
22
+ "shape" : "[2, 320, 64, 64]",
23
+ "name" : "input_61_cast_fp16",
24
+ "type" : "MultiArray"
25
+ },
26
+ {
27
+ "hasShapeFlexibility" : "0",
28
+ "isOptional" : "0",
29
+ "dataType" : "Float32",
30
+ "formattedType" : "MultiArray (Float32 2 × 1280 × 8 × 8)",
31
+ "shortDescription" : "",
32
+ "shape" : "[2, 1280, 8, 8]",
33
+ "name" : "input_171_cast_fp16",
34
+ "type" : "MultiArray"
35
+ },
36
+ {
37
+ "hasShapeFlexibility" : "0",
38
+ "isOptional" : "0",
39
+ "dataType" : "Float32",
40
+ "formattedType" : "MultiArray (Float32 2 × 1280 × 1 × 1)",
41
+ "shortDescription" : "",
42
+ "shape" : "[2, 1280, 1, 1]",
43
+ "name" : "input_15_cast_fp16",
44
+ "type" : "MultiArray"
45
+ },
46
+ {
47
+ "hasShapeFlexibility" : "0",
48
+ "isOptional" : "0",
49
+ "dataType" : "Float32",
50
+ "formattedType" : "MultiArray (Float32 2 × 320 × 64 × 64)",
51
+ "shortDescription" : "",
52
+ "shape" : "[2, 320, 64, 64]",
53
+ "name" : "input_35_cast_fp16",
54
+ "type" : "MultiArray"
55
+ },
56
+ {
57
+ "hasShapeFlexibility" : "0",
58
+ "isOptional" : "0",
59
+ "dataType" : "Float32",
60
+ "formattedType" : "MultiArray (Float32 2 × 640 × 32 × 32)",
61
+ "shortDescription" : "",
62
+ "shape" : "[2, 640, 32, 32]",
63
+ "name" : "input_89_cast_fp16",
64
+ "type" : "MultiArray"
65
+ },
66
+ {
67
+ "hasShapeFlexibility" : "0",
68
+ "isOptional" : "0",
69
+ "dataType" : "Float32",
70
+ "formattedType" : "MultiArray (Float32 2 × 1280 × 16 × 16)",
71
+ "shortDescription" : "",
72
+ "shape" : "[2, 1280, 16, 16]",
73
+ "name" : "input_143_cast_fp16",
74
+ "type" : "MultiArray"
75
+ },
76
+ {
77
+ "hasShapeFlexibility" : "0",
78
+ "isOptional" : "0",
79
+ "dataType" : "Float32",
80
+ "formattedType" : "MultiArray (Float32 2 × 320 × 32 × 32)",
81
+ "shortDescription" : "",
82
+ "shape" : "[2, 320, 32, 32]",
83
+ "name" : "input_63_cast_fp16",
84
+ "type" : "MultiArray"
85
+ },
86
+ {
87
+ "hasShapeFlexibility" : "0",
88
+ "isOptional" : "0",
89
+ "dataType" : "Float32",
90
+ "formattedType" : "MultiArray (Float32 2 × 1280 × 16 × 16)",
91
+ "shortDescription" : "",
92
+ "shape" : "[2, 1280, 16, 16]",
93
+ "name" : "input_169_cast_fp16",
94
+ "type" : "MultiArray"
95
+ },
96
+ {
97
+ "hasShapeFlexibility" : "0",
98
+ "isOptional" : "0",
99
+ "dataType" : "Float32",
100
+ "formattedType" : "MultiArray (Float32 2 × 1280 × 8 × 8)",
101
+ "shortDescription" : "",
102
+ "shape" : "[2, 1280, 8, 8]",
103
+ "name" : "hidden_states_149_cast_fp16",
104
+ "type" : "MultiArray"
105
+ },
106
+ {
107
+ "hasShapeFlexibility" : "0",
108
+ "isOptional" : "0",
109
+ "dataType" : "Float32",
110
+ "formattedType" : "MultiArray (Float32 2 × 640 × 16 × 16)",
111
+ "shortDescription" : "",
112
+ "shape" : "[2, 640, 16, 16]",
113
+ "name" : "input_117_cast_fp16",
114
+ "type" : "MultiArray"
115
+ },
116
+ {
117
+ "hasShapeFlexibility" : "0",
118
+ "isOptional" : "0",
119
+ "dataType" : "Float32",
120
+ "formattedType" : "MultiArray (Float32 2 × 640 × 32 × 32)",
121
+ "shortDescription" : "",
122
+ "shape" : "[2, 640, 32, 32]",
123
+ "name" : "input_115_cast_fp16",
124
+ "type" : "MultiArray"
125
+ },
126
+ {
127
+ "hasShapeFlexibility" : "0",
128
+ "isOptional" : "0",
129
+ "dataType" : "Float32",
130
+ "formattedType" : "MultiArray (Float32 2 × 2560 × 8 × 8)",
131
+ "shortDescription" : "",
132
+ "shape" : "[2, 2560, 8, 8]",
133
+ "name" : "input_253_cast_fp16",
134
+ "type" : "MultiArray"
135
+ }
136
+ ],
137
+ "modelParameters" : [
138
+
139
+ ],
140
+ "specificationVersion" : 7,
141
+ "mlProgramOperationTypeHistogram" : {
142
+ "Ios16.reduceMean" : 104,
143
+ "Ios16.sin" : 1,
144
+ "Ios16.softmax" : 14,
145
+ "Split" : 7,
146
+ "Ios16.add" : 124,
147
+ "Concat" : 4,
148
+ "Ios16.realDiv" : 31,
149
+ "Ios16.square" : 31,
150
+ "ExpandDims" : 3,
151
+ "Ios16.sub" : 52,
152
+ "Ios16.cast" : 13,
153
+ "Ios16.conv" : 129,
154
+ "Ios16.gelu" : 7,
155
+ "Ios16.matmul" : 28,
156
+ "Ios16.reshape" : 132,
157
+ "Ios16.batchNorm" : 31,
158
+ "Ios16.rsqrt" : 21,
159
+ "Ios16.silu" : 26,
160
+ "Ios16.sqrt" : 31,
161
+ "SliceByIndex" : 2,
162
+ "Ios16.mul" : 85,
163
+ "Ios16.cos" : 1
164
+ },
165
+ "computePrecision" : "Mixed (Float16, Float32, Int32)",
166
+ "isUpdatable" : "0",
167
+ "availability" : {
168
+ "macOS" : "13.0",
169
+ "tvOS" : "16.0",
170
+ "visionOS" : "1.0",
171
+ "watchOS" : "9.0",
172
+ "iOS" : "16.0",
173
+ "macCatalyst" : "16.0"
174
+ },
175
+ "modelType" : {
176
+ "name" : "MLModelType_mlProgram"
177
+ },
178
+ "userDefinedMetadata" : {
179
+ "com.github.apple.coremltools.version" : "7.1",
180
+ "com.github.apple.coremltools.source" : "milinternal"
181
+ },
182
+ "inputSchema" : [
183
+ {
184
+ "hasShapeFlexibility" : "0",
185
+ "isOptional" : "0",
186
+ "dataType" : "Float16",
187
+ "formattedType" : "MultiArray (Float16 2 × 4 × 64 × 64)",
188
+ "shortDescription" : "",
189
+ "shape" : "[2, 4, 64, 64]",
190
+ "name" : "sample",
191
+ "type" : "MultiArray"
192
+ },
193
+ {
194
+ "hasShapeFlexibility" : "0",
195
+ "isOptional" : "0",
196
+ "dataType" : "Float16",
197
+ "formattedType" : "MultiArray (Float16 2)",
198
+ "shortDescription" : "",
199
+ "shape" : "[2]",
200
+ "name" : "timestep",
201
+ "type" : "MultiArray"
202
+ },
203
+ {
204
+ "hasShapeFlexibility" : "0",
205
+ "isOptional" : "0",
206
+ "dataType" : "Float16",
207
+ "formattedType" : "MultiArray (Float16 2 × 1024 × 1 × 77)",
208
+ "shortDescription" : "",
209
+ "shape" : "[2, 1024, 1, 77]",
210
+ "name" : "encoder_hidden_states",
211
+ "type" : "MultiArray"
212
+ }
213
+ ],
214
+ "generatedClassName" : "Stable_Diffusion_version_stabilityai_sd_turbo_unet_chunk1",
215
+ "method" : "predict"
216
+ }
217
+ ]
sd-turbo/compiled/quantize-2-bit/ORIGINAL/UnetChunk1.mlmodelc/model.mil ADDED
The diff for this file is too large to render. See raw diff
 
sd-turbo/compiled/quantize-2-bit/ORIGINAL/UnetChunk2.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c81557e4f40e1c3b06586b9f32be564bbebe9e9fc6df661421b059ca35caf8a
3
+ size 243
sd-turbo/compiled/quantize-2-bit/ORIGINAL/UnetChunk2.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d4a8655637d03406f91370c047e5dcc4264ba0ba57a79c6322ffc37f4764d98
3
+ size 764
sd-turbo/compiled/quantize-2-bit/ORIGINAL/UnetChunk2.mlmodelc/metadata.json ADDED
@@ -0,0 +1,204 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "metadataOutputVersion" : "3.0",
4
+ "storagePrecision" : "Float16",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float32",
10
+ "formattedType" : "MultiArray (Float32 2 × 4 × 64 × 64)",
11
+ "shortDescription" : "",
12
+ "shape" : "[2, 4, 64, 64]",
13
+ "name" : "noise_pred",
14
+ "type" : "MultiArray"
15
+ }
16
+ ],
17
+ "modelParameters" : [
18
+
19
+ ],
20
+ "specificationVersion" : 7,
21
+ "mlProgramOperationTypeHistogram" : {
22
+ "Split" : 9,
23
+ "Concat" : 10,
24
+ "Ios16.cast" : 14,
25
+ "Ios16.mul" : 108,
26
+ "Ios16.rsqrt" : 27,
27
+ "Ios16.sqrt" : 30,
28
+ "Ios16.sub" : 57,
29
+ "UpsampleNearestNeighbor" : 3,
30
+ "Ios16.conv" : 153,
31
+ "Ios16.add" : 141,
32
+ "Ios16.realDiv" : 30,
33
+ "Ios16.matmul" : 36,
34
+ "Ios16.gelu" : 9,
35
+ "Ios16.reduceMean" : 114,
36
+ "Ios16.softmax" : 18,
37
+ "Ios16.batchNorm" : 30,
38
+ "Ios16.square" : 30,
39
+ "Ios16.reshape" : 150,
40
+ "Ios16.silu" : 21
41
+ },
42
+ "computePrecision" : "Mixed (Float16, Float32, Int32)",
43
+ "isUpdatable" : "0",
44
+ "availability" : {
45
+ "macOS" : "13.0",
46
+ "tvOS" : "16.0",
47
+ "visionOS" : "1.0",
48
+ "watchOS" : "9.0",
49
+ "iOS" : "16.0",
50
+ "macCatalyst" : "16.0"
51
+ },
52
+ "modelType" : {
53
+ "name" : "MLModelType_mlProgram"
54
+ },
55
+ "userDefinedMetadata" : {
56
+ "com.github.apple.coremltools.version" : "7.1",
57
+ "com.github.apple.coremltools.source" : "milinternal"
58
+ },
59
+ "inputSchema" : [
60
+ {
61
+ "hasShapeFlexibility" : "0",
62
+ "isOptional" : "0",
63
+ "dataType" : "Float16",
64
+ "formattedType" : "MultiArray (Float16 2 × 1024 × 1 × 77)",
65
+ "shortDescription" : "",
66
+ "shape" : "[2, 1024, 1, 77]",
67
+ "name" : "encoder_hidden_states",
68
+ "type" : "MultiArray"
69
+ },
70
+ {
71
+ "hasShapeFlexibility" : "0",
72
+ "isOptional" : "0",
73
+ "dataType" : "Float32",
74
+ "formattedType" : "MultiArray (Float32 2 × 320 × 64 × 64)",
75
+ "shortDescription" : "",
76
+ "shape" : "[2, 320, 64, 64]",
77
+ "name" : "input_7_cast_fp16",
78
+ "type" : "MultiArray"
79
+ },
80
+ {
81
+ "hasShapeFlexibility" : "0",
82
+ "isOptional" : "0",
83
+ "dataType" : "Float32",
84
+ "formattedType" : "MultiArray (Float32 2 × 1280 × 8 × 8)",
85
+ "shortDescription" : "",
86
+ "shape" : "[2, 1280, 8, 8]",
87
+ "name" : "input_171_cast_fp16",
88
+ "type" : "MultiArray"
89
+ },
90
+ {
91
+ "hasShapeFlexibility" : "0",
92
+ "isOptional" : "0",
93
+ "dataType" : "Float32",
94
+ "formattedType" : "MultiArray (Float32 2 × 1280 × 8 × 8)",
95
+ "shortDescription" : "",
96
+ "shape" : "[2, 1280, 8, 8]",
97
+ "name" : "hidden_states_149_cast_fp16",
98
+ "type" : "MultiArray"
99
+ },
100
+ {
101
+ "hasShapeFlexibility" : "0",
102
+ "isOptional" : "0",
103
+ "dataType" : "Float32",
104
+ "formattedType" : "MultiArray (Float32 2 × 640 × 32 × 32)",
105
+ "shortDescription" : "",
106
+ "shape" : "[2, 640, 32, 32]",
107
+ "name" : "input_89_cast_fp16",
108
+ "type" : "MultiArray"
109
+ },
110
+ {
111
+ "hasShapeFlexibility" : "0",
112
+ "isOptional" : "0",
113
+ "dataType" : "Float32",
114
+ "formattedType" : "MultiArray (Float32 2 × 1280 × 16 × 16)",
115
+ "shortDescription" : "",
116
+ "shape" : "[2, 1280, 16, 16]",
117
+ "name" : "input_143_cast_fp16",
118
+ "type" : "MultiArray"
119
+ },
120
+ {
121
+ "hasShapeFlexibility" : "0",
122
+ "isOptional" : "0",
123
+ "dataType" : "Float32",
124
+ "formattedType" : "MultiArray (Float32 2 × 320 × 64 × 64)",
125
+ "shortDescription" : "",
126
+ "shape" : "[2, 320, 64, 64]",
127
+ "name" : "input_61_cast_fp16",
128
+ "type" : "MultiArray"
129
+ },
130
+ {
131
+ "hasShapeFlexibility" : "0",
132
+ "isOptional" : "0",
133
+ "dataType" : "Float32",
134
+ "formattedType" : "MultiArray (Float32 2 × 320 × 64 × 64)",
135
+ "shortDescription" : "",
136
+ "shape" : "[2, 320, 64, 64]",
137
+ "name" : "input_35_cast_fp16",
138
+ "type" : "MultiArray"
139
+ },
140
+ {
141
+ "hasShapeFlexibility" : "0",
142
+ "isOptional" : "0",
143
+ "dataType" : "Float32",
144
+ "formattedType" : "MultiArray (Float32 2 × 640 × 32 × 32)",
145
+ "shortDescription" : "",
146
+ "shape" : "[2, 640, 32, 32]",
147
+ "name" : "input_115_cast_fp16",
148
+ "type" : "MultiArray"
149
+ },
150
+ {
151
+ "hasShapeFlexibility" : "0",
152
+ "isOptional" : "0",
153
+ "dataType" : "Float32",
154
+ "formattedType" : "MultiArray (Float32 2 × 1280 × 1 × 1)",
155
+ "shortDescription" : "",
156
+ "shape" : "[2, 1280, 1, 1]",
157
+ "name" : "input_15_cast_fp16",
158
+ "type" : "MultiArray"
159
+ },
160
+ {
161
+ "hasShapeFlexibility" : "0",
162
+ "isOptional" : "0",
163
+ "dataType" : "Float32",
164
+ "formattedType" : "MultiArray (Float32 2 × 1280 × 16 × 16)",
165
+ "shortDescription" : "",
166
+ "shape" : "[2, 1280, 16, 16]",
167
+ "name" : "input_169_cast_fp16",
168
+ "type" : "MultiArray"
169
+ },
170
+ {
171
+ "hasShapeFlexibility" : "0",
172
+ "isOptional" : "0",
173
+ "dataType" : "Float32",
174
+ "formattedType" : "MultiArray (Float32 2 × 2560 × 8 × 8)",
175
+ "shortDescription" : "",
176
+ "shape" : "[2, 2560, 8, 8]",
177
+ "name" : "input_253_cast_fp16",
178
+ "type" : "MultiArray"
179
+ },
180
+ {
181
+ "hasShapeFlexibility" : "0",
182
+ "isOptional" : "0",
183
+ "dataType" : "Float32",
184
+ "formattedType" : "MultiArray (Float32 2 × 320 × 32 × 32)",
185
+ "shortDescription" : "",
186
+ "shape" : "[2, 320, 32, 32]",
187
+ "name" : "input_63_cast_fp16",
188
+ "type" : "MultiArray"
189
+ },
190
+ {
191
+ "hasShapeFlexibility" : "0",
192
+ "isOptional" : "0",
193
+ "dataType" : "Float32",
194
+ "formattedType" : "MultiArray (Float32 2 × 640 × 16 × 16)",
195
+ "shortDescription" : "",
196
+ "shape" : "[2, 640, 16, 16]",
197
+ "name" : "input_117_cast_fp16",
198
+ "type" : "MultiArray"
199
+ }
200
+ ],
201
+ "generatedClassName" : "Stable_Diffusion_version_stabilityai_sd_turbo_unet_chunk2",
202
+ "method" : "predict"
203
+ }
204
+ ]
sd-turbo/compiled/quantize-2-bit/ORIGINAL/UnetChunk2.mlmodelc/model.mil ADDED
The diff for this file is too large to render. See raw diff
 
sd-turbo/compiled/quantize-2-bit/ORIGINAL/VAEDecoder.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:926ecbbeafe5b09ea617a9eb99884249a4fbb60f0ee8404233141a79e491d023
3
+ size 243
sd-turbo/compiled/quantize-2-bit/ORIGINAL/VAEDecoder.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98ab0e617864c2082eaec54b1db16239b6f3f084fe710346c4a2d1280afc02e7
3
+ size 808
sd-turbo/compiled/quantize-2-bit/ORIGINAL/VAEDecoder.mlmodelc/metadata.json ADDED
@@ -0,0 +1,77 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
4
+ "metadataOutputVersion" : "3.0",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float32",
10
+ "formattedType" : "MultiArray (Float32 1 × 3 × 512 × 512)",
11
+ "shortDescription" : "Generated image normalized to range [-1, 1]",
12
+ "shape" : "[1, 3, 512, 512]",
13
+ "name" : "image",
14
+ "type" : "MultiArray"
15
+ }
16
+ ],
17
+ "version" : "stabilityai\/sd-turbo",
18
+ "modelParameters" : [
19
+
20
+ ],
21
+ "author" : "Please refer to the Model Card available at huggingface.co\/stabilityai\/sd-turbo",
22
+ "specificationVersion" : 7,
23
+ "storagePrecision" : "Float16",
24
+ "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
25
+ "mlProgramOperationTypeHistogram" : {
26
+ "Ios16.cast" : 1,
27
+ "Ios16.mul" : 2,
28
+ "Ios16.sqrt" : 30,
29
+ "Ios16.sub" : 30,
30
+ "Transpose" : 6,
31
+ "UpsampleNearestNeighbor" : 3,
32
+ "Ios16.conv" : 36,
33
+ "Ios16.add" : 46,
34
+ "Ios16.linear" : 4,
35
+ "Ios16.matmul" : 2,
36
+ "Ios16.realDiv" : 30,
37
+ "Ios16.reduceMean" : 60,
38
+ "Ios16.softmax" : 1,
39
+ "Ios16.batchNorm" : 29,
40
+ "Ios16.square" : 30,
41
+ "Ios16.reshape" : 65,
42
+ "Ios16.silu" : 29
43
+ },
44
+ "computePrecision" : "Mixed (Float16, Float32, Int32)",
45
+ "isUpdatable" : "0",
46
+ "availability" : {
47
+ "macOS" : "13.0",
48
+ "tvOS" : "16.0",
49
+ "visionOS" : "1.0",
50
+ "watchOS" : "9.0",
51
+ "iOS" : "16.0",
52
+ "macCatalyst" : "16.0"
53
+ },
54
+ "modelType" : {
55
+ "name" : "MLModelType_mlProgram"
56
+ },
57
+ "inputSchema" : [
58
+ {
59
+ "hasShapeFlexibility" : "0",
60
+ "isOptional" : "0",
61
+ "dataType" : "Float16",
62
+ "formattedType" : "MultiArray (Float16 1 × 4 × 64 × 64)",
63
+ "shortDescription" : "The denoised latent embeddings from the unet model after the last step of reverse diffusion",
64
+ "shape" : "[1, 4, 64, 64]",
65
+ "name" : "z",
66
+ "type" : "MultiArray"
67
+ }
68
+ ],
69
+ "userDefinedMetadata" : {
70
+ "com.github.apple.coremltools.source_dialect" : "TorchScript",
71
+ "com.github.apple.coremltools.source" : "torch==2.1.0+cu121",
72
+ "com.github.apple.coremltools.version" : "7.1"
73
+ },
74
+ "generatedClassName" : "Stable_Diffusion_version_stabilityai_sd_turbo_vae_decoder",
75
+ "method" : "predict"
76
+ }
77
+ ]
sd-turbo/compiled/quantize-2-bit/ORIGINAL/VAEDecoder.mlmodelc/model.mil ADDED
The diff for this file is too large to render. See raw diff
 
sd-turbo/compiled/quantize-2-bit/ORIGINAL/merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
sd-turbo/compiled/quantize-2-bit/ORIGINAL/vocab.json ADDED
The diff for this file is too large to render. See raw diff