|
{ |
|
"_name_or_path": "dandelin/vilt-b32-mlm", |
|
"architectures": [ |
|
"ViltForQuestionAnswering" |
|
], |
|
"attention_probs_dropout_prob": 0.0, |
|
"hidden_act": "gelu", |
|
"hidden_dropout_prob": 0.0, |
|
"hidden_size": 768, |
|
"id2label": { |
|
"0": "mouse", |
|
"1": "british", |
|
"2": "freezer", |
|
"3": "yes", |
|
"4": "nowhere", |
|
"5": "england", |
|
"6": "car", |
|
"7": "uk", |
|
"8": "cows", |
|
"9": "dog", |
|
"10": "room", |
|
"11": "us", |
|
"12": "on sidewalk", |
|
"13": "indoors", |
|
"14": "nothing", |
|
"15": "airport", |
|
"16": "usa", |
|
"17": "park", |
|
"18": "hallway", |
|
"19": "australia", |
|
"20": "windows", |
|
"21": "refrigerator", |
|
"22": "buildings", |
|
"23": "sun", |
|
"24": "living room", |
|
"25": "bus", |
|
"26": "in car", |
|
"27": "home", |
|
"28": "woods", |
|
"29": "inside", |
|
"30": "hotel", |
|
"31": "united states", |
|
"32": "fridge", |
|
"33": "smile", |
|
"34": "ground", |
|
"35": "america" |
|
}, |
|
"image_size": 384, |
|
"initializer_range": 0.02, |
|
"intermediate_size": 3072, |
|
"label2id": { |
|
"airport": 15, |
|
"america": 35, |
|
"australia": 19, |
|
"british": 1, |
|
"buildings": 22, |
|
"bus": 25, |
|
"car": 6, |
|
"cows": 8, |
|
"dog": 9, |
|
"england": 5, |
|
"freezer": 2, |
|
"fridge": 32, |
|
"ground": 34, |
|
"hallway": 18, |
|
"home": 27, |
|
"hotel": 30, |
|
"in car": 26, |
|
"indoors": 13, |
|
"inside": 29, |
|
"living room": 24, |
|
"mouse": 0, |
|
"nothing": 14, |
|
"nowhere": 4, |
|
"on sidewalk": 12, |
|
"park": 17, |
|
"refrigerator": 21, |
|
"room": 10, |
|
"smile": 33, |
|
"sun": 23, |
|
"uk": 7, |
|
"united states": 31, |
|
"us": 11, |
|
"usa": 16, |
|
"windows": 20, |
|
"woods": 28, |
|
"yes": 3 |
|
}, |
|
"layer_norm_eps": 1e-12, |
|
"max_image_length": -1, |
|
"max_position_embeddings": 40, |
|
"modality_type_vocab_size": 2, |
|
"model_type": "vilt", |
|
"num_attention_heads": 12, |
|
"num_channels": 3, |
|
"num_hidden_layers": 12, |
|
"num_images": -1, |
|
"patch_size": 32, |
|
"qkv_bias": true, |
|
"tie_word_embeddings": false, |
|
"torch_dtype": "float32", |
|
"transformers_version": "4.40.2", |
|
"type_vocab_size": 2, |
|
"vocab_size": 30522 |
|
} |
|
|