{ "activation_function": "gelu_new", "architectures": [ "GPT2ForTokenClassification" ], "attn_pdrop": 0.1, "bos_token_id": 2, "custom_pipelines": { "upos": { "impl": "ud.BellmanFordTokenClassificationPipeline", "pt": "AutoModelForTokenClassification" }, "universal-dependencies": { "impl": "ud.UniversalDependenciesCausalPipeline", "pt": "AutoModelForTokenClassification" } }, "embd_pdrop": 0.1, "eos_token_id": 2, "id2label": { "0": "ADJ", "1": "ADJ|l-acl", "2": "ADJ|l-advcl", "3": "ADJ|l-amod", "4": "ADJ|l-ccomp", "5": "ADJ|l-csubj", "6": "ADJ|l-csubj:outer", "7": "ADJ|l-nmod", "8": "ADJ|l-nsubj", "9": "ADJ|l-obj", "10": "ADJ|l-obl", "11": "ADJ|r-acl", "12": "ADJ|r-amod", "13": "ADJ|r-dep", "14": "ADJ|root", "15": "ADP", "16": "ADP|l-case", "17": "ADP|r-case", "18": "ADP|r-fixed", "19": "ADV", "20": "ADV|l-advcl", "21": "ADV|l-advmod", "22": "ADV|l-obj", "23": "ADV|r-dep", "24": "ADV|root", "25": "AUX", "26": "AUX|Polarity=Neg", "27": "AUX|Polarity=Neg|r-aux", "28": "AUX|Polarity=Neg|r-fixed", "29": "AUX|r-aux", "30": "AUX|r-cop", "31": "AUX|r-fixed", "32": "AUX|root", "33": "B-ADJ", "34": "B-ADP", "35": "B-ADV", "36": "B-AUX", "37": "B-AUX|Polarity=Neg", "38": "B-CCONJ", "39": "B-DET", "40": "B-INTJ", "41": "B-NOUN", "42": "B-NOUN|Polarity=Neg", "43": "B-NUM", "44": "B-PART", "45": "B-PRON", "46": "B-PROPN", "47": "B-PUNCT", "48": "B-SCONJ", "49": "B-SYM", "50": "B-VERB", "51": "B-X", "52": "CCONJ", "53": "CCONJ|l-cc", "54": "CCONJ|r-cc", "55": "DET", "56": "DET|l-det", "57": "I-ADJ", "58": "I-ADP", "59": "I-ADV", "60": "I-AUX", "61": "I-AUX|Polarity=Neg", "62": "I-CCONJ", "63": "I-DET", "64": "I-INTJ", "65": "I-NOUN", "66": "I-NOUN|Polarity=Neg", "67": "I-NUM", "68": "I-PART", "69": "I-PRON", "70": "I-PROPN", "71": "I-PUNCT", "72": "I-SCONJ", "73": "I-SYM", "74": "I-VERB", "75": "I-X", "76": "INTJ", "77": "INTJ|l-discourse", "78": "INTJ|r-discourse", "79": "INTJ|root", "80": "NOUN", "81": "NOUN|Polarity=Neg", "82": "NOUN|Polarity=Neg|l-obl", "83": "NOUN|Polarity=Neg|root", "84": "NOUN|l-acl", "85": "NOUN|l-advcl", "86": "NOUN|l-ccomp", "87": "NOUN|l-compound", "88": "NOUN|l-csubj", "89": "NOUN|l-csubj:outer", "90": "NOUN|l-nmod", "91": "NOUN|l-nsubj", "92": "NOUN|l-nsubj:outer", "93": "NOUN|l-obj", "94": "NOUN|l-obl", "95": "NOUN|r-compound", "96": "NOUN|r-nmod", "97": "NOUN|r-nsubj", "98": "NOUN|root", "99": "NUM", "100": "NUM|l-advcl", "101": "NUM|l-compound", "102": "NUM|l-nmod", "103": "NUM|l-nsubj", "104": "NUM|l-nsubj:outer", "105": "NUM|l-nummod", "106": "NUM|l-obj", "107": "NUM|l-obl", "108": "NUM|r-compound", "109": "NUM|root", "110": "PART", "111": "PART|l-mark", "112": "PART|r-mark", "113": "PRON", "114": "PRON|l-acl", "115": "PRON|l-advcl", "116": "PRON|l-nmod", "117": "PRON|l-nsubj", "118": "PRON|l-nsubj:outer", "119": "PRON|l-obj", "120": "PRON|l-obl", "121": "PRON|root", "122": "PROPN", "123": "PROPN|l-acl", "124": "PROPN|l-advcl", "125": "PROPN|l-compound", "126": "PROPN|l-nmod", "127": "PROPN|l-nsubj", "128": "PROPN|l-nsubj:outer", "129": "PROPN|l-obj", "130": "PROPN|l-obl", "131": "PROPN|r-compound", "132": "PROPN|r-nmod", "133": "PROPN|root", "134": "PUNCT", "135": "PUNCT|l-punct", "136": "PUNCT|r-punct", "137": "SCONJ", "138": "SCONJ|l-dep", "139": "SCONJ|r-fixed", "140": "SCONJ|r-mark", "141": "SYM", "142": "SYM|l-compound", "143": "SYM|l-dep", "144": "SYM|l-nmod", "145": "SYM|l-obl", "146": "SYM|r-compound", "147": "SYM|r-dep", "148": "VERB", "149": "VERB|l-acl", "150": "VERB|l-advcl", "151": "VERB|l-ccomp", "152": "VERB|l-compound", "153": "VERB|l-csubj", "154": "VERB|l-csubj:outer", "155": "VERB|l-nmod", "156": "VERB|l-obj", "157": "VERB|l-obl", "158": "VERB|r-acl", "159": "VERB|r-advcl", "160": "VERB|r-compound", "161": "VERB|root", "162": "X", "163": "X|l-nmod", "164": "X|r-dep" }, "initializer_range": 0.02, "label2id": { "ADJ": 0, "ADJ|l-acl": 1, "ADJ|l-advcl": 2, "ADJ|l-amod": 3, "ADJ|l-ccomp": 4, "ADJ|l-csubj": 5, "ADJ|l-csubj:outer": 6, "ADJ|l-nmod": 7, "ADJ|l-nsubj": 8, "ADJ|l-obj": 9, "ADJ|l-obl": 10, "ADJ|r-acl": 11, "ADJ|r-amod": 12, "ADJ|r-dep": 13, "ADJ|root": 14, "ADP": 15, "ADP|l-case": 16, "ADP|r-case": 17, "ADP|r-fixed": 18, "ADV": 19, "ADV|l-advcl": 20, "ADV|l-advmod": 21, "ADV|l-obj": 22, "ADV|r-dep": 23, "ADV|root": 24, "AUX": 25, "AUX|Polarity=Neg": 26, "AUX|Polarity=Neg|r-aux": 27, "AUX|Polarity=Neg|r-fixed": 28, "AUX|r-aux": 29, "AUX|r-cop": 30, "AUX|r-fixed": 31, "AUX|root": 32, "B-ADJ": 33, "B-ADP": 34, "B-ADV": 35, "B-AUX": 36, "B-AUX|Polarity=Neg": 37, "B-CCONJ": 38, "B-DET": 39, "B-INTJ": 40, "B-NOUN": 41, "B-NOUN|Polarity=Neg": 42, "B-NUM": 43, "B-PART": 44, "B-PRON": 45, "B-PROPN": 46, "B-PUNCT": 47, "B-SCONJ": 48, "B-SYM": 49, "B-VERB": 50, "B-X": 51, "CCONJ": 52, "CCONJ|l-cc": 53, "CCONJ|r-cc": 54, "DET": 55, "DET|l-det": 56, "I-ADJ": 57, "I-ADP": 58, "I-ADV": 59, "I-AUX": 60, "I-AUX|Polarity=Neg": 61, "I-CCONJ": 62, "I-DET": 63, "I-INTJ": 64, "I-NOUN": 65, "I-NOUN|Polarity=Neg": 66, "I-NUM": 67, "I-PART": 68, "I-PRON": 69, "I-PROPN": 70, "I-PUNCT": 71, "I-SCONJ": 72, "I-SYM": 73, "I-VERB": 74, "I-X": 75, "INTJ": 76, "INTJ|l-discourse": 77, "INTJ|r-discourse": 78, "INTJ|root": 79, "NOUN": 80, "NOUN|Polarity=Neg": 81, "NOUN|Polarity=Neg|l-obl": 82, "NOUN|Polarity=Neg|root": 83, "NOUN|l-acl": 84, "NOUN|l-advcl": 85, "NOUN|l-ccomp": 86, "NOUN|l-compound": 87, "NOUN|l-csubj": 88, "NOUN|l-csubj:outer": 89, "NOUN|l-nmod": 90, "NOUN|l-nsubj": 91, "NOUN|l-nsubj:outer": 92, "NOUN|l-obj": 93, "NOUN|l-obl": 94, "NOUN|r-compound": 95, "NOUN|r-nmod": 96, "NOUN|r-nsubj": 97, "NOUN|root": 98, "NUM": 99, "NUM|l-advcl": 100, "NUM|l-compound": 101, "NUM|l-nmod": 102, "NUM|l-nsubj": 103, "NUM|l-nsubj:outer": 104, "NUM|l-nummod": 105, "NUM|l-obj": 106, "NUM|l-obl": 107, "NUM|r-compound": 108, "NUM|root": 109, "PART": 110, "PART|l-mark": 111, "PART|r-mark": 112, "PRON": 113, "PRON|l-acl": 114, "PRON|l-advcl": 115, "PRON|l-nmod": 116, "PRON|l-nsubj": 117, "PRON|l-nsubj:outer": 118, "PRON|l-obj": 119, "PRON|l-obl": 120, "PRON|root": 121, "PROPN": 122, "PROPN|l-acl": 123, "PROPN|l-advcl": 124, "PROPN|l-compound": 125, "PROPN|l-nmod": 126, "PROPN|l-nsubj": 127, "PROPN|l-nsubj:outer": 128, "PROPN|l-obj": 129, "PROPN|l-obl": 130, "PROPN|r-compound": 131, "PROPN|r-nmod": 132, "PROPN|root": 133, "PUNCT": 134, "PUNCT|l-punct": 135, "PUNCT|r-punct": 136, "SCONJ": 137, "SCONJ|l-dep": 138, "SCONJ|r-fixed": 139, "SCONJ|r-mark": 140, "SYM": 141, "SYM|l-compound": 142, "SYM|l-dep": 143, "SYM|l-nmod": 144, "SYM|l-obl": 145, "SYM|r-compound": 146, "SYM|r-dep": 147, "VERB": 148, "VERB|l-acl": 149, "VERB|l-advcl": 150, "VERB|l-ccomp": 151, "VERB|l-compound": 152, "VERB|l-csubj": 153, "VERB|l-csubj:outer": 154, "VERB|l-nmod": 155, "VERB|l-obj": 156, "VERB|l-obl": 157, "VERB|r-acl": 158, "VERB|r-advcl": 159, "VERB|r-compound": 160, "VERB|root": 161, "X": 162, "X|l-nmod": 163, "X|r-dep": 164 }, "layer_norm_epsilon": 1e-05, "model_type": "gpt2", "n_embd": 768, "n_head": 12, "n_inner": null, "n_layer": 12, "n_positions": 1024, "reorder_and_upcast_attn": false, "resid_pdrop": 0.1, "scale_attn_by_inverse_layer_idx": false, "scale_attn_weights": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "summary_type": "cls_index", "summary_use_proj": true, "tokenizer_class": "JumanReformerTokenizerFast", "torch_dtype": "float32", "transformers_version": "4.44.2", "use_cache": true, "vocab_size": 32000 }