longluu committed on
Commit
f90103e
1 Parent(s): 3694aa0

--batch_size 4 --num_train_epochs 15 --learning_rate 1e-5 --weight_decay 0.0

Browse files
Files changed (2) hide show
  1. config.json +115 -1
  2. model.safetensors +1 -1
config.json CHANGED
@@ -1 +1,115 @@
1
- {"_name_or_path": "UFNLP/gatortrons", "architectures": ["MegatronBertForTokenClassification"], "attention_probs_dropout_prob": 0.1, "hidden_act": "gelu", "hidden_dropout_prob": 0.1, "hidden_size": 1024, "id2label": {"0": "['Living Beings', 'Virus']", "1": "['Living Beings', 'Virus']", "2": "['Living Beings', 'Bacterium']", "3": "['Living Beings', 'Bacterium']", "4": "['Anatomy', 'Anatomical Structure']", "5": "['Anatomy', 'Anatomical Structure']", "6": "['Anatomy', 'Body System']", "7": "['Anatomy', 'Body System']", "8": "['Anatomy', 'Body Substance']", "9": "['Anatomy', 'Body Substance']", "10": "['Disorders', 'Finding']", "11": "['Disorders', 'Finding']", "12": "['Disorders', 'Injury or Poisoning']", "13": "['Disorders', 'Injury or Poisoning']", "14": "['Phenomena', 'Biologic Function']", "15": "['Phenomena', 'Biologic Function']", "16": "['Procedures', 'Health Care Activity']", "17": "['Procedures', 'Health Care Activity']", "18": "['Procedures', 'Research Activity']", "19": "['Procedures', 'Research Activity']", "20": "['Devices', 'Medical Device']", "21": "['Devices', 'Medical Device']", "22": "['Concepts & Ideas', 'Spatial Concept']", "23": "['Concepts & Ideas', 'Spatial Concept']", "24": "['Occupations', 'Biomedical Occupation or Discipline']", "25": "['Occupations', 'Biomedical Occupation or Discipline']", "26": "['Organizations', 'Organization']", "27": "['Organizations', 'Organization']", "28": "['Living Beings', 'Professional or Occupational Group']", "29": "['Living Beings', 'Professional or Occupational Group']", "30": "['Living Beings', 'Population Group']", "31": "['Living Beings', 'Population Group']", "32": "['Chemicals & Drugs', 'Chemical']", "33": "['Chemicals & Drugs', 'Chemical']", "34": "['Objects', 'Food']", "35": "['Objects', 'Food']", "36": "['Concepts & Ideas', 'Intellectual Product']", "37": "['Concepts & Ideas', 'Intellectual Product']", "38": "['Physiology', 'Clinical Attribute']", "39": "['Physiology', 'Clinical Attribute']", "40": 
"['Living Beings', 'Eukaryote']", "41": "['Living Beings', 'Eukaryote']", "42": "None"}, "initializer_range": 0.02, "intermediate_size": 4096, "label2id": {"['Living Beings', 'Virus']": 1, "['Living Beings', 'Bacterium']": 3, "['Anatomy', 'Anatomical Structure']": 5, "['Anatomy', 'Body System']": 7, "['Anatomy', 'Body Substance']": 9, "['Disorders', 'Finding']": 11, "['Disorders', 'Injury or Poisoning']": 13, "['Phenomena', 'Biologic Function']": 15, "['Procedures', 'Health Care Activity']": 17, "['Procedures', 'Research Activity']": 19, "['Devices', 'Medical Device']": 21, "['Concepts & Ideas', 'Spatial Concept']": 23, "['Occupations', 'Biomedical Occupation or Discipline']": 25, "['Organizations', 'Organization']": 27, "['Living Beings', 'Professional or Occupational Group']": 29, "['Living Beings', 'Population Group']": 31, "['Chemicals & Drugs', 'Chemical']": 33, "['Objects', 'Food']": 35, "['Concepts & Ideas', 'Intellectual Product']": 37, "['Physiology', 'Clinical Attribute']": 39, "['Living Beings', 'Eukaryote']": 41, "None": 42}, "layer_norm_eps": 1e-12, "max_position_embeddings": 512, "model_type": "megatron-bert", "num_attention_heads": 16, "num_hidden_layers": 24, "pad_token_id": 0, "position_embedding_type": "absolute", "tokenizer_type": "BertWordPieceCase", "torch_dtype": "float32", "transformers_version": "4.37.1", "type_vocab_size": 2, "use_cache": true, "vocab_size": 50176}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "/home/ec2-user/SageMaker/LLM-NER-clinical-text/models/medmentions/gatortrons/checkpoint-5931",
3
+ "architectures": [
4
+ "MegatronBertForTokenClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "hidden_act": "gelu",
8
+ "hidden_dropout_prob": 0.1,
9
+ "hidden_size": 1024,
10
+ "id2label": {
11
+ "0": "LABEL_0",
12
+ "1": "LABEL_1",
13
+ "2": "LABEL_2",
14
+ "3": "LABEL_3",
15
+ "4": "LABEL_4",
16
+ "5": "LABEL_5",
17
+ "6": "LABEL_6",
18
+ "7": "LABEL_7",
19
+ "8": "LABEL_8",
20
+ "9": "LABEL_9",
21
+ "10": "LABEL_10",
22
+ "11": "LABEL_11",
23
+ "12": "LABEL_12",
24
+ "13": "LABEL_13",
25
+ "14": "LABEL_14",
26
+ "15": "LABEL_15",
27
+ "16": "LABEL_16",
28
+ "17": "LABEL_17",
29
+ "18": "LABEL_18",
30
+ "19": "LABEL_19",
31
+ "20": "LABEL_20",
32
+ "21": "LABEL_21",
33
+ "22": "LABEL_22",
34
+ "23": "LABEL_23",
35
+ "24": "LABEL_24",
36
+ "25": "LABEL_25",
37
+ "26": "LABEL_26",
38
+ "27": "LABEL_27",
39
+ "28": "LABEL_28",
40
+ "29": "LABEL_29",
41
+ "30": "LABEL_30",
42
+ "31": "LABEL_31",
43
+ "32": "LABEL_32",
44
+ "33": "LABEL_33",
45
+ "34": "LABEL_34",
46
+ "35": "LABEL_35",
47
+ "36": "LABEL_36",
48
+ "37": "LABEL_37",
49
+ "38": "LABEL_38",
50
+ "39": "LABEL_39",
51
+ "40": "LABEL_40",
52
+ "41": "LABEL_41",
53
+ "42": "LABEL_42"
54
+ },
55
+ "initializer_range": 0.02,
56
+ "intermediate_size": 4096,
57
+ "label2id": {
58
+ "LABEL_0": 0,
59
+ "LABEL_1": 1,
60
+ "LABEL_10": 10,
61
+ "LABEL_11": 11,
62
+ "LABEL_12": 12,
63
+ "LABEL_13": 13,
64
+ "LABEL_14": 14,
65
+ "LABEL_15": 15,
66
+ "LABEL_16": 16,
67
+ "LABEL_17": 17,
68
+ "LABEL_18": 18,
69
+ "LABEL_19": 19,
70
+ "LABEL_2": 2,
71
+ "LABEL_20": 20,
72
+ "LABEL_21": 21,
73
+ "LABEL_22": 22,
74
+ "LABEL_23": 23,
75
+ "LABEL_24": 24,
76
+ "LABEL_25": 25,
77
+ "LABEL_26": 26,
78
+ "LABEL_27": 27,
79
+ "LABEL_28": 28,
80
+ "LABEL_29": 29,
81
+ "LABEL_3": 3,
82
+ "LABEL_30": 30,
83
+ "LABEL_31": 31,
84
+ "LABEL_32": 32,
85
+ "LABEL_33": 33,
86
+ "LABEL_34": 34,
87
+ "LABEL_35": 35,
88
+ "LABEL_36": 36,
89
+ "LABEL_37": 37,
90
+ "LABEL_38": 38,
91
+ "LABEL_39": 39,
92
+ "LABEL_4": 4,
93
+ "LABEL_40": 40,
94
+ "LABEL_41": 41,
95
+ "LABEL_42": 42,
96
+ "LABEL_5": 5,
97
+ "LABEL_6": 6,
98
+ "LABEL_7": 7,
99
+ "LABEL_8": 8,
100
+ "LABEL_9": 9
101
+ },
102
+ "layer_norm_eps": 1e-12,
103
+ "max_position_embeddings": 512,
104
+ "model_type": "megatron-bert",
105
+ "num_attention_heads": 16,
106
+ "num_hidden_layers": 24,
107
+ "pad_token_id": 0,
108
+ "position_embedding_type": "absolute",
109
+ "tokenizer_type": "BertWordPieceCase",
110
+ "torch_dtype": "float32",
111
+ "transformers_version": "4.37.1",
112
+ "type_vocab_size": 2,
113
+ "use_cache": true,
114
+ "vocab_size": 50176
115
+ }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8505fba086bf12124180592993c06e8bcd441a9bb22d367df5efbb72d4ec1c3b
3
  size 1417093764
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9b67a41b4af21362e62ca9506f80da0f3bea7b406a52b27df99ea72d4f17614
3
  size 1417093764