disk0dancer's picture
End of training
7dfdfa4 verified
{
"_name_or_path": "disk0dancer/ruBert-base-finetuned-pos",
"architectures": [
"BertForTokenClassification"
],
"attention_probs_dropout_prob": 0.1,
"classifier_dropout": null,
"directionality": "bidi",
"hidden_act": "gelu",
"hidden_dropout_prob": 0.1,
"hidden_size": 768,
"id2label": {
"0": "O",
"1": "Not",
"2": "Abbr",
"3": "Adj",
"4": "Adv",
"5": "Adv/action_des\u0441",
"6": "Adv/action_time",
"7": "Adv/measure",
"8": "Adv/place",
"9": "Adv/emph",
"10": "Advt",
"11": "Advt1",
"12": "Aux",
"13": "Bracket",
"14": "Colon",
"15": "Comma",
"16": "Conj.comp",
"17": "Coord",
"18": "Dash",
"19": "Dot",
"20": "Ellipsis",
"21": "Fw",
"22": "Interj.",
"23": "Interrog.word",
"24": "Introduct",
"25": "Mark/excl",
"26": "Mark/quest",
"27": "Measure",
"28": "N",
"29": "Num",
"30": "Num/ordinal",
"31": "Part/dem",
"32": "Part/excl",
"33": "Part/limit",
"34": "Part/imp",
"35": "Part/intens",
"36": "Part/neg",
"37": "Part/quest",
"38": "Part/soft",
"39": "Prep",
"40": "Pron",
"41": "Pron/attr",
"42": "Pron/dem",
"43": "Pron/neg",
"44": "Pron/pos",
"45": "Pron/rel",
"46": "Particip/adj",
"47": "Particip/v",
"48": "Punct",
"49": "Quote",
"50": "Semicolon",
"51": "State",
"52": "Sub",
"53": "Vf",
"54": "Vinf",
"55": "Vm"
},
"initializer_range": 0.02,
"intermediate_size": 3072,
"label2id": {
"Abbr": 2,
"Adj": 3,
"Adv": 4,
"Adv/action_des\u0441": 5,
"Adv/action_time": 6,
"Adv/emph": 9,
"Adv/measure": 7,
"Adv/place": 8,
"Advt": 10,
"Advt1": 11,
"Aux": 12,
"Bracket": 13,
"Colon": 14,
"Comma": 15,
"Conj.comp": 16,
"Coord": 17,
"Dash": 18,
"Dot": 19,
"Ellipsis": 20,
"Fw": 21,
"Interj.": 22,
"Interrog.word": 23,
"Introduct": 24,
"Mark/excl": 25,
"Mark/quest": 26,
"Measure": 27,
"N": 28,
"Not": 1,
"Num": 29,
"Num/ordinal": 30,
"O": 0,
"Part/dem": 31,
"Part/excl": 32,
"Part/imp": 34,
"Part/intens": 35,
"Part/limit": 33,
"Part/neg": 36,
"Part/quest": 37,
"Part/soft": 38,
"Particip/adj": 46,
"Particip/v": 47,
"Prep": 39,
"Pron": 40,
"Pron/attr": 41,
"Pron/dem": 42,
"Pron/neg": 43,
"Pron/pos": 44,
"Pron/rel": 45,
"Punct": 48,
"Quote": 49,
"Semicolon": 50,
"State": 51,
"Sub": 52,
"Vf": 53,
"Vinf": 54,
"Vm": 55
},
"layer_norm_eps": 1e-12,
"max_position_embeddings": 512,
"model_type": "bert",
"num_attention_heads": 12,
"num_hidden_layers": 12,
"pad_token_id": 0,
"pooler_fc_size": 768,
"pooler_num_attention_heads": 12,
"pooler_num_fc_layers": 3,
"pooler_size_per_head": 128,
"pooler_type": "first_token_transform",
"position_embedding_type": "absolute",
"torch_dtype": "float32",
"transformers_version": "4.39.0",
"type_vocab_size": 2,
"use_cache": true,
"vocab_size": 120138
}