Upload 12 files

Browse files

Files changed (12) hide show

vae_decoder/config.json +32 -0
vae_decoder/coreml_model.mlmodelc/analytics/coremldata.bin +3 -0
vae_decoder/coreml_model.mlmodelc/coremldata.bin +3 -0
vae_decoder/coreml_model.mlmodelc/metadata.json +77 -0
vae_decoder/coreml_model.mlmodelc/model.mil +0 -0
vae_decoder/coreml_model.mlmodelc/weights/weight.bin +3 -0
vae_encoder/config.json +32 -0
vae_encoder/coreml_model.mlmodelc/analytics/coremldata.bin +3 -0
vae_encoder/coreml_model.mlmodelc/coremldata.bin +3 -0
vae_encoder/coreml_model.mlmodelc/metadata.json +76 -0
vae_encoder/coreml_model.mlmodelc/model.mil +0 -0
vae_encoder/coreml_model.mlmodelc/weights/weight.bin +3 -0

vae_decoder/config.json ADDED Viewed

	@@ -0,0 +1,32 @@

+{
+  "_class_name": "AutoencoderKL",
+  "_diffusers_version": "0.19.0.dev0",
+  "act_fn": "silu",
+  "block_out_channels": [
+    128,
+    256,
+    512,
+    512
+  ],
+  "down_block_types": [
+    "DownEncoderBlock2D",
+    "DownEncoderBlock2D",
+    "DownEncoderBlock2D",
+    "DownEncoderBlock2D"
+  ],
+  "force_upcast": false,
+  "in_channels": 3,
+  "latent_channels": 4,
+  "layers_per_block": 2,
+  "norm_num_groups": 32,
+  "out_channels": 3,
+  "sample_size": 1024,
+  "scaling_factor": 0.13025,
+  "up_block_types": [
+    "UpDecoderBlock2D",
+    "UpDecoderBlock2D",
+    "UpDecoderBlock2D",
+    "UpDecoderBlock2D"
+  ]
+}

vae_decoder/coreml_model.mlmodelc/analytics/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:334026589a5d44461397828b5365d2cb0fe8e4e0746efe7ff23432e84330091d
+size 243

vae_decoder/coreml_model.mlmodelc/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:416ed5dcb73ffc557f85b0f448bd8775b76b15094f7df58a2d4b96bc4134454b
+size 870

vae_decoder/coreml_model.mlmodelc/metadata.json ADDED Viewed

	@@ -0,0 +1,77 @@

+[
+  {
+    "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
+    "metadataOutputVersion" : "3.0",
+    "outputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32 1 × 3 × 1024 × 1024)",
+        "shortDescription" : "Generated image normalized to range [-1, 1]",
+        "shape" : "[1, 3, 1024, 1024]",
+        "name" : "image",
+        "type" : "MultiArray"
+      }
+    ],
+    "version" : "stabilityai\/stable-diffusion-xl-base-1.0",
+    "modelParameters" : [
+    ],
+    "author" : "Please refer to the Model Card available at huggingface.co\/stabilityai\/stable-diffusion-xl-base-1.0",
+    "specificationVersion" : 7,
+    "storagePrecision" : "Float16",
+    "license" : "OpenRAIL++-M (https:\/\/huggingface.co\/stabilityai\/stable-diffusion-xl-base-1.0\/blob\/main\/LICENSE.md)",
+    "mlProgramOperationTypeHistogram" : {
+      "Ios16.cast" : 1,
+      "Ios16.mul" : 2,
+      "Ios16.sqrt" : 30,
+      "Ios16.sub" : 30,
+      "Transpose" : 6,
+      "UpsampleNearestNeighbor" : 3,
+      "Ios16.conv" : 36,
+      "Ios16.add" : 46,
+      "Ios16.linear" : 4,
+      "Ios16.matmul" : 2,
+      "Ios16.realDiv" : 30,
+      "Ios16.reduceMean" : 60,
+      "Ios16.softmax" : 1,
+      "Ios16.batchNorm" : 29,
+      "Ios16.square" : 30,
+      "Ios16.reshape" : 65,
+      "Ios16.silu" : 29
+    },
+    "computePrecision" : "Mixed (Float16, Float32, Int32)",
+    "isUpdatable" : "0",
+    "availability" : {
+      "macOS" : "13.0",
+      "tvOS" : "16.0",
+      "visionOS" : "1.0",
+      "watchOS" : "9.0",
+      "iOS" : "16.0",
+      "macCatalyst" : "16.0"
+    },
+    "modelType" : {
+      "name" : "MLModelType_mlProgram"
+    },
+    "inputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 1 × 4 × 128 × 128)",
+        "shortDescription" : "The denoised latent embeddings from the unet model after the last step of reverse diffusion",
+        "shape" : "[1, 4, 128, 128]",
+        "name" : "z",
+        "type" : "MultiArray"
+      }
+    ],
+    "userDefinedMetadata" : {
+      "com.github.apple.coremltools.source_dialect" : "TorchScript",
+      "com.github.apple.coremltools.source" : "torch==2.2.0",
+      "com.github.apple.coremltools.version" : "7.2"
+    },
+    "generatedClassName" : "Stable_Diffusion_version_stabilityai_stable_diffusion_xl_base_1_0_vae_decoder",
+    "method" : "predict"
+  }
+]

vae_decoder/coreml_model.mlmodelc/model.mil ADDED Viewed

The diff for this file is too large to render. See raw diff

vae_decoder/coreml_model.mlmodelc/weights/weight.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5b6dced84df022c469c52e6369393bcd62bd47df2327e7eedaa750e9a705332a
+size 98993280

vae_encoder/config.json ADDED Viewed

	@@ -0,0 +1,32 @@

+{
+  "_class_name": "AutoencoderKL",
+  "_diffusers_version": "0.19.0.dev0",
+  "act_fn": "silu",
+  "block_out_channels": [
+    128,
+    256,
+    512,
+    512
+  ],
+  "down_block_types": [
+    "DownEncoderBlock2D",
+    "DownEncoderBlock2D",
+    "DownEncoderBlock2D",
+    "DownEncoderBlock2D"
+  ],
+  "force_upcast": false,
+  "in_channels": 3,
+  "latent_channels": 4,
+  "layers_per_block": 2,
+  "norm_num_groups": 32,
+  "out_channels": 3,
+  "sample_size": 1024,
+  "scaling_factor": 0.13025,
+  "up_block_types": [
+    "UpDecoderBlock2D",
+    "UpDecoderBlock2D",
+    "UpDecoderBlock2D",
+    "UpDecoderBlock2D"
+  ]
+}

vae_encoder/coreml_model.mlmodelc/analytics/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e44d9c0d47fd3c820932cb3fd5a709c70694f479f12c048a1367f655d21aa1cb
+size 243

vae_encoder/coreml_model.mlmodelc/coremldata.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cc44873ad4c7ab4d3a0c951b65616d2bb4e633f1c1835af8041dfcd97d0f73e2
+size 874

vae_encoder/coreml_model.mlmodelc/metadata.json ADDED Viewed

	@@ -0,0 +1,76 @@

+[
+  {
+    "shortDescription" : "Stable Diffusion generates images conditioned on text and\/or other images as input through the diffusion process. Please refer to https:\/\/arxiv.org\/abs\/2112.10752 for details.",
+    "metadataOutputVersion" : "3.0",
+    "outputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32 1 × 8 × 128 × 128)",
+        "shortDescription" : "The latent embeddings from the unet model from the input image.",
+        "shape" : "[1, 8, 128, 128]",
+        "name" : "latent",
+        "type" : "MultiArray"
+      }
+    ],
+    "version" : "stabilityai\/stable-diffusion-xl-base-1.0",
+    "modelParameters" : [
+    ],
+    "author" : "Please refer to the Model Card available at huggingface.co\/stabilityai\/stable-diffusion-xl-base-1.0",
+    "specificationVersion" : 7,
+    "storagePrecision" : "Float32",
+    "license" : "OpenRAIL++-M (https:\/\/huggingface.co\/stabilityai\/stable-diffusion-xl-base-1.0\/blob\/main\/LICENSE.md)",
+    "mlProgramOperationTypeHistogram" : {
+      "Pad" : 3,
+      "Ios16.mul" : 2,
+      "Ios16.sqrt" : 22,
+      "Ios16.sub" : 22,
+      "Transpose" : 6,
+      "Ios16.conv" : 28,
+      "Ios16.add" : 34,
+      "Ios16.linear" : 4,
+      "Ios16.matmul" : 2,
+      "Ios16.realDiv" : 22,
+      "Ios16.reduceMean" : 44,
+      "Ios16.softmax" : 1,
+      "Ios16.batchNorm" : 21,
+      "Ios16.square" : 22,
+      "Ios16.reshape" : 49,
+      "Ios16.silu" : 21
+    },
+    "computePrecision" : "Mixed (Float32, Int32)",
+    "isUpdatable" : "0",
+    "availability" : {
+      "macOS" : "13.0",
+      "tvOS" : "16.0",
+      "visionOS" : "1.0",
+      "watchOS" : "9.0",
+      "iOS" : "16.0",
+      "macCatalyst" : "16.0"
+    },
+    "modelType" : {
+      "name" : "MLModelType_mlProgram"
+    },
+    "inputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float32",
+        "formattedType" : "MultiArray (Float32 1 × 3 × 1024 × 1024)",
+        "shortDescription" : "The input image to base the initial latents on normalized to range [-1, 1]",
+        "shape" : "[1, 3, 1024, 1024]",
+        "name" : "x",
+        "type" : "MultiArray"
+      }
+    ],
+    "userDefinedMetadata" : {
+      "com.github.apple.coremltools.source_dialect" : "TorchScript",
+      "com.github.apple.coremltools.version" : "7.2",
+      "com.github.apple.coremltools.source" : "torch==2.2.0"
+    },
+    "generatedClassName" : "Stable_Diffusion_version_stabilityai_stable_diffusion_xl_base_1_0_vae_encoder",
+    "method" : "predict"
+  }
+]

vae_encoder/coreml_model.mlmodelc/model.mil ADDED Viewed

The diff for this file is too large to render. See raw diff

vae_encoder/coreml_model.mlmodelc/weights/weight.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7a5eade1f3e6997e664a65e26ac86ba2a3205674910e151f98a9d91f13cd272b
+size 136668992