{ "architectures": [ "MaskFormerForInstanceSegmentation" ], "backbone": null, "backbone_config": { "depths": [ 2, 2, 6, 2 ], "drop_path_rate": 0.3, "embed_dim": 96, "encoder_stride": 32, "hidden_size": 768, "image_size": 224, "in_channels": 3, "model_type": "maskformer-swin", "num_heads": [ 3, 6, 12, 24 ], "out_features": [ "stage1", "stage2", "stage3", "stage4" ], "out_indices": [ 1, 2, 3, 4 ], "path_norm": true, "pretrain_img_size": 224, "window_size": 7 }, "backbone_kwargs": null, "ce_weight": 1.0, "cross_entropy_weight": 1.0, "decoder_config": { "max_position_embeddings": 1024, "model_type": "detr", "scale_embedding": false }, "dice_weight": 1.0, "fpn_feature_size": 256, "id2label": { "0": "unlabeled", "1": "Roofs" }, "init_std": 0.02, "init_xavier_std": 1.0, "label2id": { "Roofs": 1, "unlabeled": 0 }, "mask_feature_size": 256, "mask_weight": 20.0, "model_type": "maskformer", "no_object_weight": 0.1, "num_attention_heads": 8, "num_hidden_layers": 6, "num_queries": 100, "output_auxiliary_logits": null, "torch_dtype": "float32", "transformers_version": "4.45.0.dev0", "use_auxiliary_loss": false, "use_pretrained_backbone": false, "use_timm_backbone": false }