{ "architectures": [ "ModernBertForTokenClassification" ], "attention_bias": false, "attention_dropout": 0.0, "auto_map": { "AutoConfig": "configuration_modernbert.ModernBertConfig", "AutoModel": "modeling_modernbert.ModernBertModel", "AutoModelForMaskedLM": "modeling_modernbert.ModernBertForMaskedLM", "AutoModelForSequenceClassification": "modeling_modernbert.ModernBertForSequenceClassification", "AutoModelForTokenClassification": "modeling_modernbert.ModernBertForTokenClassification" }, "bos_token_id": 0, "classifier_activation": "gelu", "classifier_bias": false, "classifier_dropout": 0.0, "classifier_pooling": "mean", "cls_token_id": 0, "custom_pipelines": { "universal-dependencies": { "impl": "ud.UniversalDependenciesPipeline", "pt": "AutoModelForTokenClassification" } }, "decoder_bias": true, "deterministic_flash_attn": false, "embedding_dropout": 0.0, "eos_token_id": 2, "global_attn_every_n_layers": 3, "global_rope_theta": 160000.0, "gradient_checkpointing": false, "hidden_activation": "gelu", "hidden_size": 768, "id2label": { "0": "-|_|dep", "1": "ADJ|_|acl", "2": "ADJ|_|advcl", "3": "ADJ|_|amod", "4": "ADJ|_|ccomp", "5": "ADJ|_|csubj", "6": "ADJ|_|csubj:outer", "7": "ADJ|_|dep", "8": "ADJ|_|nmod", "9": "ADJ|_|nsubj", "10": "ADJ|_|obj", "11": "ADJ|_|obl", "12": "ADJ|_|root", "13": "ADP|_|case", "14": "ADP|_|fixed", "15": "ADV|_|advcl", "16": "ADV|_|advmod", "17": "ADV|_|dep", "18": "ADV|_|obj", "19": "ADV|_|root", "20": "AUX|Polarity=Neg|aux", "21": "AUX|Polarity=Neg|fixed", "22": "AUX|_|aux", "23": "AUX|_|cop", "24": "AUX|_|fixed", "25": "AUX|_|root", "26": "CCONJ|_|cc", "27": "DET|_|det", "28": "INTJ|_|discourse", "29": "INTJ|_|root", "30": "NOUN|Polarity=Neg|obl", "31": "NOUN|Polarity=Neg|root", "32": "NOUN|_|acl", "33": "NOUN|_|advcl", "34": "NOUN|_|ccomp", "35": "NOUN|_|compound", "36": "NOUN|_|csubj", "37": "NOUN|_|csubj:outer", "38": "NOUN|_|nmod", "39": "NOUN|_|nsubj", "40": "NOUN|_|nsubj:outer", "41": "NOUN|_|obj", "42": "NOUN|_|obl", "43": "NOUN|_|root", "44": "NUM|_|advcl", "45": "NUM|_|compound", "46": "NUM|_|nmod", "47": "NUM|_|nsubj", "48": "NUM|_|nsubj:outer", "49": "NUM|_|nummod", "50": "NUM|_|obj", "51": "NUM|_|obl", "52": "NUM|_|root", "53": "PART|_|mark", "54": "PRON|_|acl", "55": "PRON|_|advcl", "56": "PRON|_|nmod", "57": "PRON|_|nsubj", "58": "PRON|_|nsubj:outer", "59": "PRON|_|obj", "60": "PRON|_|obl", "61": "PRON|_|root", "62": "PROPN|_|acl", "63": "PROPN|_|advcl", "64": "PROPN|_|compound", "65": "PROPN|_|nmod", "66": "PROPN|_|nsubj", "67": "PROPN|_|nsubj:outer", "68": "PROPN|_|obj", "69": "PROPN|_|obl", "70": "PROPN|_|root", "71": "PUNCT|_|punct", "72": "SCONJ|_|dep", "73": "SCONJ|_|fixed", "74": "SCONJ|_|mark", "75": "SYM|_|compound", "76": "SYM|_|dep", "77": "SYM|_|nmod", "78": "SYM|_|obl", "79": "VERB|_|acl", "80": "VERB|_|advcl", "81": "VERB|_|ccomp", "82": "VERB|_|compound", "83": "VERB|_|csubj", "84": "VERB|_|csubj:outer", "85": "VERB|_|nmod", "86": "VERB|_|obj", "87": "VERB|_|obl", "88": "VERB|_|root", "89": "X|_|dep", "90": "X|_|goeswith", "91": "X|_|nmod" }, "initializer_cutoff_factor": 2.0, "initializer_range": 0.02, "intermediate_size": 1152, "label2id": { "-|_|dep": 0, "ADJ|_|acl": 1, "ADJ|_|advcl": 2, "ADJ|_|amod": 3, "ADJ|_|ccomp": 4, "ADJ|_|csubj": 5, "ADJ|_|csubj:outer": 6, "ADJ|_|dep": 7, "ADJ|_|nmod": 8, "ADJ|_|nsubj": 9, "ADJ|_|obj": 10, "ADJ|_|obl": 11, "ADJ|_|root": 12, "ADP|_|case": 13, "ADP|_|fixed": 14, "ADV|_|advcl": 15, "ADV|_|advmod": 16, "ADV|_|dep": 17, "ADV|_|obj": 18, "ADV|_|root": 19, "AUX|Polarity=Neg|aux": 20, "AUX|Polarity=Neg|fixed": 21, "AUX|_|aux": 22, "AUX|_|cop": 23, "AUX|_|fixed": 24, "AUX|_|root": 25, "CCONJ|_|cc": 26, "DET|_|det": 27, "INTJ|_|discourse": 28, "INTJ|_|root": 29, "NOUN|Polarity=Neg|obl": 30, "NOUN|Polarity=Neg|root": 31, "NOUN|_|acl": 32, "NOUN|_|advcl": 33, "NOUN|_|ccomp": 34, "NOUN|_|compound": 35, "NOUN|_|csubj": 36, "NOUN|_|csubj:outer": 37, "NOUN|_|nmod": 38, "NOUN|_|nsubj": 39, "NOUN|_|nsubj:outer": 40, "NOUN|_|obj": 41, "NOUN|_|obl": 42, "NOUN|_|root": 43, "NUM|_|advcl": 44, "NUM|_|compound": 45, "NUM|_|nmod": 46, "NUM|_|nsubj": 47, "NUM|_|nsubj:outer": 48, "NUM|_|nummod": 49, "NUM|_|obj": 50, "NUM|_|obl": 51, "NUM|_|root": 52, "PART|_|mark": 53, "PRON|_|acl": 54, "PRON|_|advcl": 55, "PRON|_|nmod": 56, "PRON|_|nsubj": 57, "PRON|_|nsubj:outer": 58, "PRON|_|obj": 59, "PRON|_|obl": 60, "PRON|_|root": 61, "PROPN|_|acl": 62, "PROPN|_|advcl": 63, "PROPN|_|compound": 64, "PROPN|_|nmod": 65, "PROPN|_|nsubj": 66, "PROPN|_|nsubj:outer": 67, "PROPN|_|obj": 68, "PROPN|_|obl": 69, "PROPN|_|root": 70, "PUNCT|_|punct": 71, "SCONJ|_|dep": 72, "SCONJ|_|fixed": 73, "SCONJ|_|mark": 74, "SYM|_|compound": 75, "SYM|_|dep": 76, "SYM|_|nmod": 77, "SYM|_|obl": 78, "VERB|_|acl": 79, "VERB|_|advcl": 80, "VERB|_|ccomp": 81, "VERB|_|compound": 82, "VERB|_|csubj": 83, "VERB|_|csubj:outer": 84, "VERB|_|nmod": 85, "VERB|_|obj": 86, "VERB|_|obl": 87, "VERB|_|root": 88, "X|_|dep": 89, "X|_|goeswith": 90, "X|_|nmod": 91 }, "layer_norm_eps": 1e-05, "local_attention": 128, "local_rope_theta": 10000.0, "max_position_embeddings": 8192, "mlp_bias": false, "mlp_dropout": 0.0, "model_type": "modernbert", "norm_bias": false, "norm_eps": 1e-05, "num_attention_heads": 12, "num_hidden_layers": 22, "pad_token_id": 1, "position_embedding_type": "absolute", "reference_compile": true, "sep_token_id": 2, "sparse_pred_ignore_index": -100, "sparse_prediction": false, "tokenizer_class": "DebertaV2TokenizerFast", "torch_dtype": "float32", "transformers_version": "4.47.1", "vocab_size": 65000 }