{ "embed_dim": 768, "vision_cfg": { "image_size": 224, "layers": 12, "width": 768, "patch_size": 16 }, "text_cfg": { "context_length": 280, "vocab_size": 49411, "width": 768, "heads": 12, "layers": 12, "tokenizer_kwargs": { "additional_special_tokens": [ "", "", "" ] } }, "pool_project_cfg": { "pool_proj_type": "attn", "input_dim": 768, "output_dim": 768, "attn_num_heads": 12 }, "special_token_ids": { "": 49406, "": 49407, "": 49408, "": 49409, "": 49410 }, "custom_text": true }