{
  "embed_dim": 640,
  "vision_cfg": {
    "image_size": 512,
    "layers": 12,
    "width": 768,
    "patch_size": 4,
    "latent_encoder_name": "madebyollin/sdxl-vae-fp16-fix",
    "latent_factor": 8,
    "latent_n_channels": 4
  },
  "text_cfg": {
    "context_length": 77,
    "vocab_size": 49408,
    "width": 640,
    "heads": 10,
    "layers": 12
  }
}