nousr
/

robo-diffusion-2-base

StableDiffusionPipeline

stable-diffusion

Inference Endpoints

Model card Files Files and versions Community

webuickpt

#5

by flowwolf - opened Nov 30, 2022

base: refs/heads/main

←

from: refs/pr/5

Discussion Files changed

Files changed (3) hide show

robo-diffusion-v2-base.ckpt +0 -3
robo-diffusion-v2-base.yaml +0 -67
vae/config.json +0 -1

robo-diffusion-v2-base.ckpt DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:60c4ea708f4648e5be9d8b1edadc0784d9fd97281f1bd88b6c92208ec36e312e
-size 2580250968

robo-diffusion-v2-base.yaml DELETED Viewed

@@ -1,67 +0,0 @@
-model:
-  base_learning_rate: 1.0e-4
-  target: ldm.models.diffusion.ddpm.LatentDiffusion
-  params:
-    linear_start: 0.00085
-    linear_end: 0.0120
-    num_timesteps_cond: 1
-    log_every_t: 200
-    timesteps: 1000
-    first_stage_key: "jpg"
-    cond_stage_key: "txt"
-    image_size: 64
-    channels: 4
-    cond_stage_trainable: false
-    conditioning_key: crossattn
-    monitor: val/loss_simple_ema
-    scale_factor: 0.18215
-    use_ema: False # we set this to false because this is an inference only config
-    unet_config:
-      target: ldm.modules.diffusionmodules.openaimodel.UNetModel
-      params:
-        use_checkpoint: True
-        use_fp16: True
-        image_size: 32 # unused
-        in_channels: 4
-        out_channels: 4
-        model_channels: 320
-        attention_resolutions: [ 4, 2, 1 ]
-        num_res_blocks: 2
-        channel_mult: [ 1, 2, 4, 4 ]
-        num_head_channels: 64 # need to fix for flash-attn
-        use_spatial_transformer: True
-        use_linear_in_transformer: True
-        transformer_depth: 1
-        context_dim: 1024
-        legacy: False
-    first_stage_config:
-      target: ldm.models.autoencoder.AutoencoderKL
-      params:
-        embed_dim: 4
-        monitor: val/rec_loss
-        ddconfig:
-          #attn_type: "vanilla-xformers"
-          double_z: true
-          z_channels: 4
-          resolution: 256
-          in_channels: 3
-          out_ch: 3
-          ch: 128
-          ch_mult:
-          - 1
-          - 2
-          - 4
-          - 4
-          num_res_blocks: 2
-          attn_resolutions: []
-          dropout: 0.0
-        lossconfig:
-          target: torch.nn.Identity
-    cond_stage_config:
-      target: ldm.modules.encoders.modules.FrozenOpenCLIPEmbedder
-      params:
-        freeze: True
-        layer: "penultimate"

vae/config.json CHANGED Viewed

@@ -21,7 +21,6 @@
   "norm_num_groups": 32,
   "out_channels": 3,
   "sample_size": 512,
-  "scaling_factor": 0.18215,
   "up_block_types": [
     "UpDecoderBlock2D",
     "UpDecoderBlock2D",

   "norm_num_groups": 32,
   "out_channels": 3,
   "sample_size": 512,
   "up_block_types": [
     "UpDecoderBlock2D",
     "UpDecoderBlock2D",