digitalbrain79 commited on
Commit
d65f954
·
verified ·
1 Parent(s): 947d7b8

Upload 6 files

Browse files
config.json ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "ControlNetModel",
3
+ "_diffusers_version": "0.27.2",
4
+ "act_fn": "silu",
5
+ "addition_embed_type": "text_time",
6
+ "addition_embed_type_num_heads": 64,
7
+ "addition_time_embed_dim": 256,
8
+ "attention_head_dim": [
9
+ 5,
10
+ 10,
11
+ 20
12
+ ],
13
+ "block_out_channels": [
14
+ 320,
15
+ 640,
16
+ 1280
17
+ ],
18
+ "class_embed_type": null,
19
+ "conditioning_channels": 3,
20
+ "conditioning_embedding_out_channels": [
21
+ 16,
22
+ 32,
23
+ 96,
24
+ 256
25
+ ],
26
+ "controlnet_conditioning_channel_order": "rgb",
27
+ "cross_attention_dim": 2048,
28
+ "down_block_types": [
29
+ "DownBlock2D",
30
+ "CrossAttnDownBlock2D",
31
+ "CrossAttnDownBlock2D"
32
+ ],
33
+ "downsample_padding": 1,
34
+ "encoder_hid_dim": null,
35
+ "encoder_hid_dim_type": null,
36
+ "flip_sin_to_cos": true,
37
+ "freq_shift": 0,
38
+ "global_pool_conditions": false,
39
+ "in_channels": 4,
40
+ "layers_per_block": 2,
41
+ "mid_block_scale_factor": 1,
42
+ "mid_block_type": "UNetMidBlock2DCrossAttn",
43
+ "norm_eps": 1e-05,
44
+ "norm_num_groups": 32,
45
+ "num_attention_heads": null,
46
+ "num_class_embeds": null,
47
+ "only_cross_attention": false,
48
+ "projection_class_embeddings_input_dim": 2816,
49
+ "resnet_time_scale_shift": "default",
50
+ "transformer_layers_per_block": [
51
+ 1,
52
+ 2,
53
+ 10
54
+ ],
55
+ "upcast_attention": false,
56
+ "use_linear_projection": true
57
+ }
coreml_model.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e515a0a803963196140e6b79c2a7fb9c38fcf88a241f442e69ef17c28aeea565
3
+ size 243
coreml_model.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebbf714378063c9665ff365cfffcc7eb5abf281443d1d49e8fb07ce271392a2e
3
+ size 2923
coreml_model.mlmodelc/metadata.json ADDED
@@ -0,0 +1,235 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "shortDescription" : "ControlNet is a neural network structure to control diffusion models by adding extra conditions. Please refer to https:\/\/arxiv.org\/abs\/2302.05543 for details.",
4
+ "metadataOutputVersion" : "3.0",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float32",
10
+ "formattedType" : "MultiArray (Float32 1 × 320 × 128 × 128)",
11
+ "shortDescription" : "One of the outputs of each downsampling block in ControlNet. The value added to the corresponding resnet output in UNet.",
12
+ "shape" : "[1, 320, 128, 128]",
13
+ "name" : "additional_residual_0",
14
+ "type" : "MultiArray"
15
+ },
16
+ {
17
+ "hasShapeFlexibility" : "0",
18
+ "isOptional" : "0",
19
+ "dataType" : "Float32",
20
+ "formattedType" : "MultiArray (Float32 1 × 320 × 128 × 128)",
21
+ "shortDescription" : "One of the outputs of each downsampling block in ControlNet. The value added to the corresponding resnet output in UNet.",
22
+ "shape" : "[1, 320, 128, 128]",
23
+ "name" : "additional_residual_1",
24
+ "type" : "MultiArray"
25
+ },
26
+ {
27
+ "hasShapeFlexibility" : "0",
28
+ "isOptional" : "0",
29
+ "dataType" : "Float32",
30
+ "formattedType" : "MultiArray (Float32 1 × 320 × 128 × 128)",
31
+ "shortDescription" : "One of the outputs of each downsampling block in ControlNet. The value added to the corresponding resnet output in UNet.",
32
+ "shape" : "[1, 320, 128, 128]",
33
+ "name" : "additional_residual_2",
34
+ "type" : "MultiArray"
35
+ },
36
+ {
37
+ "hasShapeFlexibility" : "0",
38
+ "isOptional" : "0",
39
+ "dataType" : "Float32",
40
+ "formattedType" : "MultiArray (Float32 1 × 320 × 64 × 64)",
41
+ "shortDescription" : "One of the outputs of each downsampling block in ControlNet. The value added to the corresponding resnet output in UNet.",
42
+ "shape" : "[1, 320, 64, 64]",
43
+ "name" : "additional_residual_3",
44
+ "type" : "MultiArray"
45
+ },
46
+ {
47
+ "hasShapeFlexibility" : "0",
48
+ "isOptional" : "0",
49
+ "dataType" : "Float32",
50
+ "formattedType" : "MultiArray (Float32 1 × 640 × 64 × 64)",
51
+ "shortDescription" : "One of the outputs of each downsampling block in ControlNet. The value added to the corresponding resnet output in UNet.",
52
+ "shape" : "[1, 640, 64, 64]",
53
+ "name" : "additional_residual_4",
54
+ "type" : "MultiArray"
55
+ },
56
+ {
57
+ "hasShapeFlexibility" : "0",
58
+ "isOptional" : "0",
59
+ "dataType" : "Float32",
60
+ "formattedType" : "MultiArray (Float32 1 × 640 × 64 × 64)",
61
+ "shortDescription" : "One of the outputs of each downsampling block in ControlNet. The value added to the corresponding resnet output in UNet.",
62
+ "shape" : "[1, 640, 64, 64]",
63
+ "name" : "additional_residual_5",
64
+ "type" : "MultiArray"
65
+ },
66
+ {
67
+ "hasShapeFlexibility" : "0",
68
+ "isOptional" : "0",
69
+ "dataType" : "Float32",
70
+ "formattedType" : "MultiArray (Float32 1 × 640 × 32 × 32)",
71
+ "shortDescription" : "One of the outputs of each downsampling block in ControlNet. The value added to the corresponding resnet output in UNet.",
72
+ "shape" : "[1, 640, 32, 32]",
73
+ "name" : "additional_residual_6",
74
+ "type" : "MultiArray"
75
+ },
76
+ {
77
+ "hasShapeFlexibility" : "0",
78
+ "isOptional" : "0",
79
+ "dataType" : "Float32",
80
+ "formattedType" : "MultiArray (Float32 1 × 1280 × 32 × 32)",
81
+ "shortDescription" : "One of the outputs of each downsampling block in ControlNet. The value added to the corresponding resnet output in UNet.",
82
+ "shape" : "[1, 1280, 32, 32]",
83
+ "name" : "additional_residual_7",
84
+ "type" : "MultiArray"
85
+ },
86
+ {
87
+ "hasShapeFlexibility" : "0",
88
+ "isOptional" : "0",
89
+ "dataType" : "Float32",
90
+ "formattedType" : "MultiArray (Float32 1 × 1280 × 32 × 32)",
91
+ "shortDescription" : "One of the outputs of each downsampling block in ControlNet. The value added to the corresponding resnet output in UNet.",
92
+ "shape" : "[1, 1280, 32, 32]",
93
+ "name" : "additional_residual_8",
94
+ "type" : "MultiArray"
95
+ },
96
+ {
97
+ "hasShapeFlexibility" : "0",
98
+ "isOptional" : "0",
99
+ "dataType" : "Float32",
100
+ "formattedType" : "MultiArray (Float32 1 × 1280 × 32 × 32)",
101
+ "shortDescription" : "One of the outputs of each downsampling block in ControlNet. The value added to the corresponding resnet output in UNet.",
102
+ "shape" : "[1, 1280, 32, 32]",
103
+ "name" : "additional_residual_9",
104
+ "type" : "MultiArray"
105
+ }
106
+ ],
107
+ "version" : "TheMistoAI\/MistoLine",
108
+ "modelParameters" : [
109
+
110
+ ],
111
+ "author" : "Please refer to the Model Card available at huggingface.co\/TheMistoAI\/MistoLine",
112
+ "specificationVersion" : 7,
113
+ "storagePrecision" : "Mixed (Float16, Palettized (6 bits))",
114
+ "license" : "OpenRAIL (https:\/\/huggingface.co\/spaces\/CompVis\/stable-diffusion-license)",
115
+ "mlProgramOperationTypeHistogram" : {
116
+ "Transpose" : 282,
117
+ "Ios16.reduceMean" : 42,
118
+ "Ios16.sin" : 2,
119
+ "Ios16.softmax" : 68,
120
+ "Split" : 34,
121
+ "Ios16.linear" : 362,
122
+ "Ios16.add" : 146,
123
+ "Concat" : 5,
124
+ "Ios16.realDiv" : 21,
125
+ "Ios16.square" : 21,
126
+ "ExpandDims" : 18,
127
+ "Ios16.sub" : 21,
128
+ "Ios16.cast" : 10,
129
+ "Ios16.conv" : 39,
130
+ "Ios16.constexprLutToDense" : 434,
131
+ "Ios16.gelu" : 34,
132
+ "Ios16.layerNorm" : 102,
133
+ "Ios16.batchNorm" : 21,
134
+ "Ios16.matmul" : 136,
135
+ "Ios16.reshape" : 326,
136
+ "Ios16.silu" : 26,
137
+ "Ios16.sqrt" : 21,
138
+ "Ios16.mul" : 114,
139
+ "Ios16.cos" : 2,
140
+ "SliceByIndex" : 4
141
+ },
142
+ "computePrecision" : "Mixed (Float16, Float32, Int32)",
143
+ "isUpdatable" : "0",
144
+ "availability" : {
145
+ "macOS" : "13.0",
146
+ "tvOS" : "16.0",
147
+ "visionOS" : "1.0",
148
+ "watchOS" : "9.0",
149
+ "iOS" : "16.0",
150
+ "macCatalyst" : "16.0"
151
+ },
152
+ "modelType" : {
153
+ "name" : "MLModelType_mlProgram"
154
+ },
155
+ "inputSchema" : [
156
+ {
157
+ "hasShapeFlexibility" : "0",
158
+ "isOptional" : "0",
159
+ "dataType" : "Float16",
160
+ "formattedType" : "MultiArray (Float16 1 × 4 × 128 × 128)",
161
+ "shortDescription" : "The low resolution latent feature maps being denoised through reverse diffusion",
162
+ "shape" : "[1, 4, 128, 128]",
163
+ "name" : "sample",
164
+ "type" : "MultiArray"
165
+ },
166
+ {
167
+ "hasShapeFlexibility" : "0",
168
+ "isOptional" : "0",
169
+ "dataType" : "Float16",
170
+ "formattedType" : "MultiArray (Float16 1)",
171
+ "shortDescription" : "A value emitted by the associated scheduler object to condition the model on a given noise schedule",
172
+ "shape" : "[1]",
173
+ "name" : "timestep",
174
+ "type" : "MultiArray"
175
+ },
176
+ {
177
+ "hasShapeFlexibility" : "0",
178
+ "isOptional" : "0",
179
+ "dataType" : "Float16",
180
+ "formattedType" : "MultiArray (Float16 1 × 77 × 2048)",
181
+ "shortDescription" : "Output embeddings from the associated text_encoder model to condition to generated image on text. A maximum of 77 tokens (~40 words) are allowed. Longer text is truncated. Shorter text does not reduce computation.",
182
+ "shape" : "[1, 77, 2048]",
183
+ "name" : "encoder_hidden_states",
184
+ "type" : "MultiArray"
185
+ },
186
+ {
187
+ "hasShapeFlexibility" : "0",
188
+ "isOptional" : "0",
189
+ "dataType" : "Float16",
190
+ "formattedType" : "MultiArray (Float16 1 × 3 × 1024 × 1024)",
191
+ "shortDescription" : "An additional input image for ControlNet to condition the generated images.",
192
+ "shape" : "[1, 3, 1024, 1024]",
193
+ "name" : "controlnet_cond",
194
+ "type" : "MultiArray"
195
+ },
196
+ {
197
+ "hasShapeFlexibility" : "0",
198
+ "isOptional" : "0",
199
+ "dataType" : "Float16",
200
+ "formattedType" : "MultiArray (Float16 1)",
201
+ "shortDescription" : "",
202
+ "shape" : "[1]",
203
+ "name" : "conditioning_scale",
204
+ "type" : "MultiArray"
205
+ },
206
+ {
207
+ "hasShapeFlexibility" : "0",
208
+ "isOptional" : "0",
209
+ "dataType" : "Float16",
210
+ "formattedType" : "MultiArray (Float16 1 × 1280)",
211
+ "shortDescription" : "",
212
+ "shape" : "[1, 1280]",
213
+ "name" : "text_embeds",
214
+ "type" : "MultiArray"
215
+ },
216
+ {
217
+ "hasShapeFlexibility" : "0",
218
+ "isOptional" : "0",
219
+ "dataType" : "Float16",
220
+ "formattedType" : "MultiArray (Float16 1 × 6)",
221
+ "shortDescription" : "",
222
+ "shape" : "[1, 6]",
223
+ "name" : "time_ids",
224
+ "type" : "MultiArray"
225
+ }
226
+ ],
227
+ "userDefinedMetadata" : {
228
+ "com.github.apple.coremltools.source_dialect" : "TorchScript",
229
+ "com.github.apple.coremltools.source" : "torch==2.2.0",
230
+ "com.github.apple.coremltools.version" : "7.2"
231
+ },
232
+ "generatedClassName" : "ControlNet_TheMistoAI_MistoLine",
233
+ "method" : "predict"
234
+ }
235
+ ]
coreml_model.mlmodelc/model.mil ADDED
The diff for this file is too large to render. See raw diff
 
coreml_model.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aaf8ae4cc2b9fc12b45cf4a34bbe3bc3aa05840031aa0e382c40fe1c3e034a72
3
+ size 938974592