digitalbrain79
commited on
Upload 12 files
Browse files- vae_decoder/config.json +32 -0
- vae_decoder/coreml_model.mlmodelc/analytics/coremldata.bin +3 -0
- vae_decoder/coreml_model.mlmodelc/coremldata.bin +3 -0
- vae_decoder/coreml_model.mlmodelc/metadata.json +77 -0
- vae_decoder/coreml_model.mlmodelc/model.mil +0 -0
- vae_decoder/coreml_model.mlmodelc/weights/weight.bin +3 -0
- vae_encoder/config.json +32 -0
- vae_encoder/coreml_model.mlmodelc/analytics/coremldata.bin +3 -0
- vae_encoder/coreml_model.mlmodelc/coremldata.bin +3 -0
- vae_encoder/coreml_model.mlmodelc/metadata.json +76 -0
- vae_encoder/coreml_model.mlmodelc/model.mil +0 -0
- vae_encoder/coreml_model.mlmodelc/weights/weight.bin +3 -0
vae_decoder/config.json
ADDED
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "AutoencoderKL",
|
3 |
+
"_diffusers_version": "0.19.0.dev0",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"block_out_channels": [
|
6 |
+
128,
|
7 |
+
256,
|
8 |
+
512,
|
9 |
+
512
|
10 |
+
],
|
11 |
+
"down_block_types": [
|
12 |
+
"DownEncoderBlock2D",
|
13 |
+
"DownEncoderBlock2D",
|
14 |
+
"DownEncoderBlock2D",
|
15 |
+
"DownEncoderBlock2D"
|
16 |
+
],
|
17 |
+
"force_upcast": false,
|
18 |
+
"in_channels": 3,
|
19 |
+
"latent_channels": 4,
|
20 |
+
"layers_per_block": 2,
|
21 |
+
"norm_num_groups": 32,
|
22 |
+
"out_channels": 3,
|
23 |
+
"sample_size": 1024,
|
24 |
+
"scaling_factor": 0.13025,
|
25 |
+
"up_block_types": [
|
26 |
+
"UpDecoderBlock2D",
|
27 |
+
"UpDecoderBlock2D",
|
28 |
+
"UpDecoderBlock2D",
|
29 |
+
"UpDecoderBlock2D"
|
30 |
+
]
|
31 |
+
}
|
32 |
+
|
vae_decoder/coreml_model.mlmodelc/analytics/coremldata.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:334026589a5d44461397828b5365d2cb0fe8e4e0746efe7ff23432e84330091d
|
3 |
+
size 243
|
vae_decoder/coreml_model.mlmodelc/coremldata.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:416ed5dcb73ffc557f85b0f448bd8775b76b15094f7df58a2d4b96bc4134454b
|
3 |
+
size 870
|
vae_decoder/coreml_model.mlmodelc/metadata.json
ADDED
@@ -0,0 +1,77 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
|
4 |
+
"metadataOutputVersion" : "3.0",
|
5 |
+
"outputSchema" : [
|
6 |
+
{
|
7 |
+
"hasShapeFlexibility" : "0",
|
8 |
+
"isOptional" : "0",
|
9 |
+
"dataType" : "Float32",
|
10 |
+
"formattedType" : "MultiArray (Float32 1 × 3 × 1024 × 1024)",
|
11 |
+
"shortDescription" : "Generated image normalized to range [-1, 1]",
|
12 |
+
"shape" : "[1, 3, 1024, 1024]",
|
13 |
+
"name" : "image",
|
14 |
+
"type" : "MultiArray"
|
15 |
+
}
|
16 |
+
],
|
17 |
+
"version" : "stabilityai\/stable-diffusion-xl-base-1.0",
|
18 |
+
"modelParameters" : [
|
19 |
+
|
20 |
+
],
|
21 |
+
"author" : "Please refer to the Model Card available at huggingface.co\/stabilityai\/stable-diffusion-xl-base-1.0",
|
22 |
+
"specificationVersion" : 7,
|
23 |
+
"storagePrecision" : "Float16",
|
24 |
+
"license" : "OpenRAIL++-M (https:\/\/huggingface.co\/stabilityai\/stable-diffusion-xl-base-1.0\/blob\/main\/LICENSE.md)",
|
25 |
+
"mlProgramOperationTypeHistogram" : {
|
26 |
+
"Ios16.cast" : 1,
|
27 |
+
"Ios16.mul" : 2,
|
28 |
+
"Ios16.sqrt" : 30,
|
29 |
+
"Ios16.sub" : 30,
|
30 |
+
"Transpose" : 6,
|
31 |
+
"UpsampleNearestNeighbor" : 3,
|
32 |
+
"Ios16.conv" : 36,
|
33 |
+
"Ios16.add" : 46,
|
34 |
+
"Ios16.linear" : 4,
|
35 |
+
"Ios16.matmul" : 2,
|
36 |
+
"Ios16.realDiv" : 30,
|
37 |
+
"Ios16.reduceMean" : 60,
|
38 |
+
"Ios16.softmax" : 1,
|
39 |
+
"Ios16.batchNorm" : 29,
|
40 |
+
"Ios16.square" : 30,
|
41 |
+
"Ios16.reshape" : 65,
|
42 |
+
"Ios16.silu" : 29
|
43 |
+
},
|
44 |
+
"computePrecision" : "Mixed (Float16, Float32, Int32)",
|
45 |
+
"isUpdatable" : "0",
|
46 |
+
"availability" : {
|
47 |
+
"macOS" : "13.0",
|
48 |
+
"tvOS" : "16.0",
|
49 |
+
"visionOS" : "1.0",
|
50 |
+
"watchOS" : "9.0",
|
51 |
+
"iOS" : "16.0",
|
52 |
+
"macCatalyst" : "16.0"
|
53 |
+
},
|
54 |
+
"modelType" : {
|
55 |
+
"name" : "MLModelType_mlProgram"
|
56 |
+
},
|
57 |
+
"inputSchema" : [
|
58 |
+
{
|
59 |
+
"hasShapeFlexibility" : "0",
|
60 |
+
"isOptional" : "0",
|
61 |
+
"dataType" : "Float16",
|
62 |
+
"formattedType" : "MultiArray (Float16 1 × 4 × 128 × 128)",
|
63 |
+
"shortDescription" : "The denoised latent embeddings from the unet model after the last step of reverse diffusion",
|
64 |
+
"shape" : "[1, 4, 128, 128]",
|
65 |
+
"name" : "z",
|
66 |
+
"type" : "MultiArray"
|
67 |
+
}
|
68 |
+
],
|
69 |
+
"userDefinedMetadata" : {
|
70 |
+
"com.github.apple.coremltools.source_dialect" : "TorchScript",
|
71 |
+
"com.github.apple.coremltools.source" : "torch==2.2.0",
|
72 |
+
"com.github.apple.coremltools.version" : "7.2"
|
73 |
+
},
|
74 |
+
"generatedClassName" : "Stable_Diffusion_version_stabilityai_stable_diffusion_xl_base_1_0_vae_decoder",
|
75 |
+
"method" : "predict"
|
76 |
+
}
|
77 |
+
]
|
vae_decoder/coreml_model.mlmodelc/model.mil
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vae_decoder/coreml_model.mlmodelc/weights/weight.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b6dced84df022c469c52e6369393bcd62bd47df2327e7eedaa750e9a705332a
|
3 |
+
size 98993280
|
vae_encoder/config.json
ADDED
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "AutoencoderKL",
|
3 |
+
"_diffusers_version": "0.19.0.dev0",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"block_out_channels": [
|
6 |
+
128,
|
7 |
+
256,
|
8 |
+
512,
|
9 |
+
512
|
10 |
+
],
|
11 |
+
"down_block_types": [
|
12 |
+
"DownEncoderBlock2D",
|
13 |
+
"DownEncoderBlock2D",
|
14 |
+
"DownEncoderBlock2D",
|
15 |
+
"DownEncoderBlock2D"
|
16 |
+
],
|
17 |
+
"force_upcast": false,
|
18 |
+
"in_channels": 3,
|
19 |
+
"latent_channels": 4,
|
20 |
+
"layers_per_block": 2,
|
21 |
+
"norm_num_groups": 32,
|
22 |
+
"out_channels": 3,
|
23 |
+
"sample_size": 1024,
|
24 |
+
"scaling_factor": 0.13025,
|
25 |
+
"up_block_types": [
|
26 |
+
"UpDecoderBlock2D",
|
27 |
+
"UpDecoderBlock2D",
|
28 |
+
"UpDecoderBlock2D",
|
29 |
+
"UpDecoderBlock2D"
|
30 |
+
]
|
31 |
+
}
|
32 |
+
|
vae_encoder/coreml_model.mlmodelc/analytics/coremldata.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e44d9c0d47fd3c820932cb3fd5a709c70694f479f12c048a1367f655d21aa1cb
|
3 |
+
size 243
|
vae_encoder/coreml_model.mlmodelc/coremldata.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc44873ad4c7ab4d3a0c951b65616d2bb4e633f1c1835af8041dfcd97d0f73e2
|
3 |
+
size 874
|
vae_encoder/coreml_model.mlmodelc/metadata.json
ADDED
@@ -0,0 +1,76 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
|
4 |
+
"metadataOutputVersion" : "3.0",
|
5 |
+
"outputSchema" : [
|
6 |
+
{
|
7 |
+
"hasShapeFlexibility" : "0",
|
8 |
+
"isOptional" : "0",
|
9 |
+
"dataType" : "Float32",
|
10 |
+
"formattedType" : "MultiArray (Float32 1 × 8 × 128 × 128)",
|
11 |
+
"shortDescription" : "The latent embeddings from the unet model from the input image.",
|
12 |
+
"shape" : "[1, 8, 128, 128]",
|
13 |
+
"name" : "latent",
|
14 |
+
"type" : "MultiArray"
|
15 |
+
}
|
16 |
+
],
|
17 |
+
"version" : "stabilityai\/stable-diffusion-xl-base-1.0",
|
18 |
+
"modelParameters" : [
|
19 |
+
|
20 |
+
],
|
21 |
+
"author" : "Please refer to the Model Card available at huggingface.co\/stabilityai\/stable-diffusion-xl-base-1.0",
|
22 |
+
"specificationVersion" : 7,
|
23 |
+
"storagePrecision" : "Float32",
|
24 |
+
"license" : "OpenRAIL++-M (https:\/\/huggingface.co\/stabilityai\/stable-diffusion-xl-base-1.0\/blob\/main\/LICENSE.md)",
|
25 |
+
"mlProgramOperationTypeHistogram" : {
|
26 |
+
"Pad" : 3,
|
27 |
+
"Ios16.mul" : 2,
|
28 |
+
"Ios16.sqrt" : 22,
|
29 |
+
"Ios16.sub" : 22,
|
30 |
+
"Transpose" : 6,
|
31 |
+
"Ios16.conv" : 28,
|
32 |
+
"Ios16.add" : 34,
|
33 |
+
"Ios16.linear" : 4,
|
34 |
+
"Ios16.matmul" : 2,
|
35 |
+
"Ios16.realDiv" : 22,
|
36 |
+
"Ios16.reduceMean" : 44,
|
37 |
+
"Ios16.softmax" : 1,
|
38 |
+
"Ios16.batchNorm" : 21,
|
39 |
+
"Ios16.square" : 22,
|
40 |
+
"Ios16.reshape" : 49,
|
41 |
+
"Ios16.silu" : 21
|
42 |
+
},
|
43 |
+
"computePrecision" : "Mixed (Float32, Int32)",
|
44 |
+
"isUpdatable" : "0",
|
45 |
+
"availability" : {
|
46 |
+
"macOS" : "13.0",
|
47 |
+
"tvOS" : "16.0",
|
48 |
+
"visionOS" : "1.0",
|
49 |
+
"watchOS" : "9.0",
|
50 |
+
"iOS" : "16.0",
|
51 |
+
"macCatalyst" : "16.0"
|
52 |
+
},
|
53 |
+
"modelType" : {
|
54 |
+
"name" : "MLModelType_mlProgram"
|
55 |
+
},
|
56 |
+
"inputSchema" : [
|
57 |
+
{
|
58 |
+
"hasShapeFlexibility" : "0",
|
59 |
+
"isOptional" : "0",
|
60 |
+
"dataType" : "Float32",
|
61 |
+
"formattedType" : "MultiArray (Float32 1 × 3 × 1024 × 1024)",
|
62 |
+
"shortDescription" : "The input image to base the initial latents on normalized to range [-1, 1]",
|
63 |
+
"shape" : "[1, 3, 1024, 1024]",
|
64 |
+
"name" : "x",
|
65 |
+
"type" : "MultiArray"
|
66 |
+
}
|
67 |
+
],
|
68 |
+
"userDefinedMetadata" : {
|
69 |
+
"com.github.apple.coremltools.source_dialect" : "TorchScript",
|
70 |
+
"com.github.apple.coremltools.version" : "7.2",
|
71 |
+
"com.github.apple.coremltools.source" : "torch==2.2.0"
|
72 |
+
},
|
73 |
+
"generatedClassName" : "Stable_Diffusion_version_stabilityai_stable_diffusion_xl_base_1_0_vae_encoder",
|
74 |
+
"method" : "predict"
|
75 |
+
}
|
76 |
+
]
|
vae_encoder/coreml_model.mlmodelc/model.mil
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vae_encoder/coreml_model.mlmodelc/weights/weight.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a5eade1f3e6997e664a65e26ac86ba2a3205674910e151f98a9d91f13cd272b
|
3 |
+
size 136668992
|