mrovera commited on
Commit
57b1160
1 Parent(s): 714fcd8

model commit

Browse files
config.json ADDED
@@ -0,0 +1,1784 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "dbmdz/bert-base-italian-xxl-uncased",
3
+ "architectures": [
4
+ "BertForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "hidden_act": "gelu",
9
+ "hidden_dropout_prob": 0.1,
10
+ "hidden_size": 768,
11
+ "id2label": {
12
+ "0": "A0040",
13
+ "1": "A0120",
14
+ "2": "A0125",
15
+ "3": "A0130",
16
+ "4": "A0140",
17
+ "5": "A0150",
18
+ "6": "A0160",
19
+ "7": "A0180",
20
+ "8": "A0190",
21
+ "9": "A0210",
22
+ "10": "A0230",
23
+ "11": "A0240",
24
+ "12": "A0245",
25
+ "13": "A0250",
26
+ "14": "A0260",
27
+ "15": "A0280",
28
+ "16": "A0290",
29
+ "17": "A0300",
30
+ "18": "A0310",
31
+ "19": "A0330",
32
+ "20": "A0340",
33
+ "21": "A0345",
34
+ "22": "A0360",
35
+ "23": "A0370",
36
+ "24": "A0380",
37
+ "25": "A0400",
38
+ "26": "A0420",
39
+ "27": "A0430",
40
+ "28": "A0460",
41
+ "29": "A0480",
42
+ "30": "A0490",
43
+ "31": "A0500",
44
+ "32": "A0510",
45
+ "33": "A0540",
46
+ "34": "A0545",
47
+ "35": "A0550",
48
+ "36": "A0570",
49
+ "37": "A0580",
50
+ "38": "A0675",
51
+ "39": "A0680",
52
+ "40": "A0700",
53
+ "41": "A0720",
54
+ "42": "A0730",
55
+ "43": "A0740",
56
+ "44": "A0770",
57
+ "45": "A0780",
58
+ "46": "A0790",
59
+ "47": "A0835",
60
+ "48": "A0850",
61
+ "49": "A0870",
62
+ "50": "A0880",
63
+ "51": "A0890",
64
+ "52": "A0920",
65
+ "53": "A0950",
66
+ "54": "A0960",
67
+ "55": "A0970",
68
+ "56": "A0980",
69
+ "57": "A0990",
70
+ "58": "A1010",
71
+ "59": "A1030",
72
+ "60": "A1040",
73
+ "61": "A1060",
74
+ "62": "A1080",
75
+ "63": "A1100",
76
+ "64": "A1115",
77
+ "65": "A1120",
78
+ "66": "A1140",
79
+ "67": "A1170",
80
+ "68": "A1180",
81
+ "69": "A1190",
82
+ "70": "A1215",
83
+ "71": "A1220",
84
+ "72": "A1260",
85
+ "73": "A1270",
86
+ "74": "A1280",
87
+ "75": "A1290",
88
+ "76": "A1300",
89
+ "77": "A1350",
90
+ "78": "A1380",
91
+ "79": "A1390",
92
+ "80": "A1410",
93
+ "81": "A1420",
94
+ "82": "A1425",
95
+ "83": "A1450",
96
+ "84": "A1470",
97
+ "85": "A1475",
98
+ "86": "A1490",
99
+ "87": "A1510",
100
+ "88": "A1530",
101
+ "89": "A1550",
102
+ "90": "A1590",
103
+ "91": "A1610",
104
+ "92": "A1630",
105
+ "93": "A1640",
106
+ "94": "A1650",
107
+ "95": "A1688",
108
+ "96": "A1689",
109
+ "97": "A1690",
110
+ "98": "A1710",
111
+ "99": "A1740",
112
+ "100": "A1750",
113
+ "101": "A1760",
114
+ "102": "A1780",
115
+ "103": "A1810",
116
+ "104": "A1820",
117
+ "105": "A1830",
118
+ "106": "A1850",
119
+ "107": "A1860",
120
+ "108": "A1870",
121
+ "109": "A1910",
122
+ "110": "A1920",
123
+ "111": "A1930",
124
+ "112": "A1940",
125
+ "113": "A1950",
126
+ "114": "A1970",
127
+ "115": "A1980",
128
+ "116": "A1990",
129
+ "117": "A2010",
130
+ "118": "A2020",
131
+ "119": "A2030",
132
+ "120": "A2040",
133
+ "121": "A2060",
134
+ "122": "A2110",
135
+ "123": "A2180",
136
+ "124": "A2190",
137
+ "125": "A2240",
138
+ "126": "A2300",
139
+ "127": "A2320",
140
+ "128": "A2340",
141
+ "129": "A2341",
142
+ "130": "A2350",
143
+ "131": "A2370",
144
+ "132": "A2380",
145
+ "133": "A2450",
146
+ "134": "A2470",
147
+ "135": "A2490",
148
+ "136": "A2500",
149
+ "137": "A2520",
150
+ "138": "A2530",
151
+ "139": "A2550",
152
+ "140": "A2560",
153
+ "141": "A2580",
154
+ "142": "A2585",
155
+ "143": "A2586",
156
+ "144": "A2590",
157
+ "145": "A2610",
158
+ "146": "A2620",
159
+ "147": "A2640",
160
+ "148": "A2660",
161
+ "149": "A2665",
162
+ "150": "A2670",
163
+ "151": "A2675",
164
+ "152": "A2677",
165
+ "153": "A2730",
166
+ "154": "A2740",
167
+ "155": "A2810",
168
+ "156": "A2820",
169
+ "157": "A2830",
170
+ "158": "A2840",
171
+ "159": "A2880",
172
+ "160": "A2890",
173
+ "161": "A3000",
174
+ "162": "A3020",
175
+ "163": "A3050",
176
+ "164": "A3060",
177
+ "165": "A3080",
178
+ "166": "A3090",
179
+ "167": "A3100",
180
+ "168": "A3125",
181
+ "169": "A3130",
182
+ "170": "A3140",
183
+ "171": "A3160",
184
+ "172": "A3170",
185
+ "173": "A3200",
186
+ "174": "A3225",
187
+ "175": "A3250",
188
+ "176": "A3260",
189
+ "177": "A3263",
190
+ "178": "A3310",
191
+ "179": "A3330",
192
+ "180": "A3360",
193
+ "181": "A3365",
194
+ "182": "A3370",
195
+ "183": "A3380",
196
+ "184": "A3400",
197
+ "185": "A3420",
198
+ "186": "A3430",
199
+ "187": "A3450",
200
+ "188": "A3460",
201
+ "189": "A3470",
202
+ "190": "A3540",
203
+ "191": "A3565",
204
+ "192": "A3570",
205
+ "193": "A3580",
206
+ "194": "A3650",
207
+ "195": "A3670",
208
+ "196": "A3710",
209
+ "197": "A3760",
210
+ "198": "A3785",
211
+ "199": "A3790",
212
+ "200": "A3800",
213
+ "201": "A3810",
214
+ "202": "A3840",
215
+ "203": "A3850",
216
+ "204": "A3860",
217
+ "205": "A3870",
218
+ "206": "A3880",
219
+ "207": "A3890",
220
+ "208": "A3900",
221
+ "209": "A3910",
222
+ "210": "A3915",
223
+ "211": "A3920",
224
+ "212": "A3950",
225
+ "213": "A3980",
226
+ "214": "A3990",
227
+ "215": "A4000",
228
+ "216": "A4010",
229
+ "217": "A4020",
230
+ "218": "A4040",
231
+ "219": "A4050",
232
+ "220": "A4055",
233
+ "221": "A4112",
234
+ "222": "A4120",
235
+ "223": "A4130",
236
+ "224": "A4140",
237
+ "225": "A4160",
238
+ "226": "A4170",
239
+ "227": "A4175",
240
+ "228": "A4180",
241
+ "229": "A4200",
242
+ "230": "A4210",
243
+ "231": "A4250",
244
+ "232": "A4260",
245
+ "233": "A4270",
246
+ "234": "A4274",
247
+ "235": "A4275",
248
+ "236": "A4277",
249
+ "237": "A4280",
250
+ "238": "A4290",
251
+ "239": "A4310",
252
+ "240": "A4320",
253
+ "241": "A4330",
254
+ "242": "A4340",
255
+ "243": "A4380",
256
+ "244": "A4390",
257
+ "245": "A4400",
258
+ "246": "A4420",
259
+ "247": "A4430",
260
+ "248": "A4440",
261
+ "249": "A4460",
262
+ "250": "A4470",
263
+ "251": "A4480",
264
+ "252": "A4490",
265
+ "253": "A4605",
266
+ "254": "A4610",
267
+ "255": "A4630",
268
+ "256": "A4650",
269
+ "257": "A4660",
270
+ "258": "A4661",
271
+ "259": "A4695",
272
+ "260": "A4700",
273
+ "261": "A4710",
274
+ "262": "A4720",
275
+ "263": "A4740",
276
+ "264": "A4760",
277
+ "265": "A4780",
278
+ "266": "A4790",
279
+ "267": "A4810",
280
+ "268": "A4840",
281
+ "269": "A4900",
282
+ "270": "A4960",
283
+ "271": "A4970",
284
+ "272": "A5000",
285
+ "273": "A5010",
286
+ "274": "A5030",
287
+ "275": "A5050",
288
+ "276": "A5070",
289
+ "277": "A5100",
290
+ "278": "A5130",
291
+ "279": "A5150",
292
+ "280": "A5170",
293
+ "281": "A5180",
294
+ "282": "A5210",
295
+ "283": "A5230",
296
+ "284": "A5250",
297
+ "285": "A5260",
298
+ "286": "A5330",
299
+ "287": "A5355",
300
+ "288": "A5360",
301
+ "289": "A5370",
302
+ "290": "A5380",
303
+ "291": "A5400",
304
+ "292": "A5460",
305
+ "293": "A5470",
306
+ "294": "A5480",
307
+ "295": "A5490",
308
+ "296": "A5550",
309
+ "297": "A5630",
310
+ "298": "A5640",
311
+ "299": "A5655",
312
+ "300": "A5660",
313
+ "301": "A5665",
314
+ "302": "A5690",
315
+ "303": "A5700",
316
+ "304": "A5720",
317
+ "305": "A5845",
318
+ "306": "A5860",
319
+ "307": "A5890",
320
+ "308": "A5920",
321
+ "309": "A5940",
322
+ "310": "A5990",
323
+ "311": "A6040",
324
+ "312": "A6050",
325
+ "313": "A6060",
326
+ "314": "A6080",
327
+ "315": "A6100",
328
+ "316": "A6180",
329
+ "317": "A6200",
330
+ "318": "A6210",
331
+ "319": "A6220",
332
+ "320": "A6240",
333
+ "321": "A6250",
334
+ "322": "A6255",
335
+ "323": "A6280",
336
+ "324": "A6290",
337
+ "325": "A6330",
338
+ "326": "A6350",
339
+ "327": "A6390",
340
+ "328": "A6410",
341
+ "329": "A6415",
342
+ "330": "A6430",
343
+ "331": "A6440",
344
+ "332": "A6450",
345
+ "333": "A6470",
346
+ "334": "A6480",
347
+ "335": "A6490",
348
+ "336": "A6500",
349
+ "337": "A6510",
350
+ "338": "A6550",
351
+ "339": "A6560",
352
+ "340": "A6570",
353
+ "341": "A6590",
354
+ "342": "A6640",
355
+ "343": "A6650",
356
+ "344": "A6705",
357
+ "345": "A6720",
358
+ "346": "A6730",
359
+ "347": "A6750",
360
+ "348": "A6760",
361
+ "349": "A6765",
362
+ "350": "A6770",
363
+ "351": "A6780",
364
+ "352": "A6800",
365
+ "353": "A6810",
366
+ "354": "A6820",
367
+ "355": "A6840",
368
+ "356": "A6850",
369
+ "357": "A6900",
370
+ "358": "A6930",
371
+ "359": "A6932",
372
+ "360": "A6935",
373
+ "361": "A6940",
374
+ "362": "A6970",
375
+ "363": "A6990",
376
+ "364": "A7000",
377
+ "365": "A7010",
378
+ "366": "A7030",
379
+ "367": "A7040",
380
+ "368": "A7110",
381
+ "369": "A7115",
382
+ "370": "A7130",
383
+ "371": "A7140",
384
+ "372": "C0A20",
385
+ "373": "C0A60",
386
+ "374": "C0AH8",
387
+ "375": "C0B10",
388
+ "376": "C0B75",
389
+ "377": "C0BC0",
390
+ "378": "C0BI0",
391
+ "379": "C0BZ0",
392
+ "380": "C0C90",
393
+ "381": "C0CE1",
394
+ "382": "C0CH0",
395
+ "383": "C0CQ0",
396
+ "384": "C0CS0",
397
+ "385": "C0CU0",
398
+ "386": "C0CV0",
399
+ "387": "C0DM1",
400
+ "388": "C0DP0",
401
+ "389": "C0DT0",
402
+ "390": "C0DV0",
403
+ "391": "C0ED0",
404
+ "392": "C0EG0",
405
+ "393": "C0FA0",
406
+ "394": "C0FC0",
407
+ "395": "C0FD1",
408
+ "396": "C0FG0",
409
+ "397": "C0FG1",
410
+ "398": "C0FG2",
411
+ "399": "C0FG4",
412
+ "400": "C0FH0",
413
+ "401": "C0FN0",
414
+ "402": "C0FQ0",
415
+ "403": "C0FT0",
416
+ "404": "C0FZ0",
417
+ "405": "C0G61",
418
+ "406": "C0GC1",
419
+ "407": "C0GF0",
420
+ "408": "C0GH0",
421
+ "409": "C0H50",
422
+ "410": "C0HF0",
423
+ "411": "C0HI0",
424
+ "412": "C0HM0",
425
+ "413": "C0HR2",
426
+ "414": "C0HR7",
427
+ "415": "C0HR8",
428
+ "416": "C0HR9",
429
+ "417": "C0HS0",
430
+ "418": "C0HV0",
431
+ "419": "C0I90",
432
+ "420": "C0ID0",
433
+ "421": "C0IN0",
434
+ "422": "C0IO0",
435
+ "423": "C0L30",
436
+ "424": "C0L40",
437
+ "425": "C0LF0",
438
+ "426": "C0LG0",
439
+ "427": "C0LP1",
440
+ "428": "C0LQ0",
441
+ "429": "C0M80",
442
+ "430": "C0M90",
443
+ "431": "C0MH0",
444
+ "432": "C0MN0",
445
+ "433": "C0MV0",
446
+ "434": "C0N60",
447
+ "435": "C0N70",
448
+ "436": "C0NB0",
449
+ "437": "C0NE0",
450
+ "438": "C0NI0",
451
+ "439": "C0NL0",
452
+ "440": "C0NM0",
453
+ "441": "C0NQ0",
454
+ "442": "C0NR0",
455
+ "443": "C0NS0",
456
+ "444": "C0NT0",
457
+ "445": "C0NU0",
458
+ "446": "C0NV0",
459
+ "447": "C0NV1",
460
+ "448": "C0NZ0",
461
+ "449": "C0O30",
462
+ "450": "C0OP0",
463
+ "451": "C0OV1",
464
+ "452": "C0OZ0",
465
+ "453": "C0OZ2",
466
+ "454": "C0P10",
467
+ "455": "C0P20",
468
+ "456": "C0P40",
469
+ "457": "C0PC0",
470
+ "458": "C0PF0",
471
+ "459": "C0PV0",
472
+ "460": "C0PZ0",
473
+ "461": "C0Q10",
474
+ "462": "C0Q20",
475
+ "463": "C0Q50",
476
+ "464": "C0QA0",
477
+ "465": "C0QZ0",
478
+ "466": "C0RB1",
479
+ "467": "C0RD1",
480
+ "468": "C0RE0",
481
+ "469": "C0RG0",
482
+ "470": "C0RH0",
483
+ "471": "C0RH1",
484
+ "472": "C0RL0",
485
+ "473": "C0SA0",
486
+ "474": "C0SL0",
487
+ "475": "C0SN1",
488
+ "476": "C0T20",
489
+ "477": "C0T21",
490
+ "478": "C0T50",
491
+ "479": "C0T80",
492
+ "480": "C0TF0",
493
+ "481": "C0TQ0",
494
+ "482": "C0TS0",
495
+ "483": "C0TU0",
496
+ "484": "C0U10",
497
+ "485": "C0U30",
498
+ "486": "C0UA0",
499
+ "487": "C0UG0",
500
+ "488": "C0UL0",
501
+ "489": "C0UQ0",
502
+ "490": "C0US0",
503
+ "491": "C0V10",
504
+ "492": "C0VA1",
505
+ "493": "C0VB0",
506
+ "494": "C0VF0",
507
+ "495": "C0VG2",
508
+ "496": "C0VI0",
509
+ "497": "C0VI1",
510
+ "498": "C0VL0",
511
+ "499": "C0VM0",
512
+ "500": "C0VO0",
513
+ "501": "C0VQ0",
514
+ "502": "C0VV0",
515
+ "503": "C0VZ0",
516
+ "504": "C0ZG0",
517
+ "505": "C0ZL0",
518
+ "506": "C0ZM0",
519
+ "507": "C0ZP0",
520
+ "508": "C0ZQ0",
521
+ "509": "C0ZV0",
522
+ "510": "C1A11",
523
+ "511": "C1AI0",
524
+ "512": "C1B30",
525
+ "513": "C1BE0",
526
+ "514": "C1C61",
527
+ "515": "C1C90",
528
+ "516": "C1CB0",
529
+ "517": "C1CF0",
530
+ "518": "C1CG0",
531
+ "519": "C1CR0",
532
+ "520": "C1DL0",
533
+ "521": "C1DQ0",
534
+ "522": "C1DT1",
535
+ "523": "C1E30",
536
+ "524": "C1EE0",
537
+ "525": "C1EI0",
538
+ "526": "C1EU0",
539
+ "527": "C1EV0",
540
+ "528": "C1F21",
541
+ "529": "C1F90",
542
+ "530": "C1FC0",
543
+ "531": "C1FD0",
544
+ "532": "C1FE0",
545
+ "533": "C1FT0",
546
+ "534": "C1G60",
547
+ "535": "C1GB0",
548
+ "536": "C1GE0",
549
+ "537": "C1GF0",
550
+ "538": "C1GH0",
551
+ "539": "C1GH1",
552
+ "540": "C1GL0",
553
+ "541": "C1GN2",
554
+ "542": "C1GP0",
555
+ "543": "C1GS0",
556
+ "544": "C1H21",
557
+ "545": "C1H90",
558
+ "546": "C1I60",
559
+ "547": "C1I90",
560
+ "548": "C1I91",
561
+ "549": "C1IZ0",
562
+ "550": "C1L20",
563
+ "551": "C1L40",
564
+ "552": "C1LB2",
565
+ "553": "C1LC0",
566
+ "554": "C1LF0",
567
+ "555": "C1LG0",
568
+ "556": "C1LI0",
569
+ "557": "C1LM1",
570
+ "558": "C1LS0",
571
+ "559": "C1M10",
572
+ "560": "C1M20",
573
+ "561": "C1M30",
574
+ "562": "C1M40",
575
+ "563": "C1M60",
576
+ "564": "C1M61",
577
+ "565": "C1M70",
578
+ "566": "C1M80",
579
+ "567": "C1MA0",
580
+ "568": "C1MA1",
581
+ "569": "C1MC0",
582
+ "570": "C1MP0",
583
+ "571": "C1MZ0",
584
+ "572": "C1NC0",
585
+ "573": "C1NG0",
586
+ "574": "C1O10",
587
+ "575": "C1O20",
588
+ "576": "C1O31",
589
+ "577": "C1O40",
590
+ "578": "C1O80",
591
+ "579": "C1OB0",
592
+ "580": "C1OB1",
593
+ "581": "C1OC0",
594
+ "582": "C1OD1",
595
+ "583": "C1OD2",
596
+ "584": "C1ON0",
597
+ "585": "C1ON2",
598
+ "586": "C1OR1",
599
+ "587": "C1OT0",
600
+ "588": "C1P10",
601
+ "589": "C1P80",
602
+ "590": "C1P90",
603
+ "591": "C1PE0",
604
+ "592": "C1PG0",
605
+ "593": "C1PI0",
606
+ "594": "C1PL0",
607
+ "595": "C1PM0",
608
+ "596": "C1Q21",
609
+ "597": "C1Q31",
610
+ "598": "C1Q40",
611
+ "599": "C1QA0",
612
+ "600": "C1QN0",
613
+ "601": "C1QP0",
614
+ "602": "C1QU0",
615
+ "603": "C1QZ0",
616
+ "604": "C1RB1",
617
+ "605": "C1RC0",
618
+ "606": "C1RD0",
619
+ "607": "C1RG0",
620
+ "608": "C1RN0",
621
+ "609": "C1RV0",
622
+ "610": "C1S10",
623
+ "611": "C1S20",
624
+ "612": "C1SG0",
625
+ "613": "C1SL1",
626
+ "614": "C1SM0",
627
+ "615": "C1SO0",
628
+ "616": "C1SZ0",
629
+ "617": "C1T10",
630
+ "618": "C1T60",
631
+ "619": "C1TC0",
632
+ "620": "C1TE0",
633
+ "621": "C1TF0",
634
+ "622": "C1TG0",
635
+ "623": "C1TL0",
636
+ "624": "C1TQ0",
637
+ "625": "C1TQ1",
638
+ "626": "C1TR0",
639
+ "627": "C1TU0",
640
+ "628": "C1TV0",
641
+ "629": "C1U40",
642
+ "630": "C1UB0",
643
+ "631": "C1UE0",
644
+ "632": "C1UI0",
645
+ "633": "C1V80",
646
+ "634": "C1VL0",
647
+ "635": "C1VP0",
648
+ "636": "C1VT0",
649
+ "637": "C1Z10",
650
+ "638": "C1Z40",
651
+ "639": "C1Z80",
652
+ "640": "C1Z90",
653
+ "641": "C1ZD0",
654
+ "642": "C1ZH0",
655
+ "643": "C1ZQ0",
656
+ "644": "C2A30",
657
+ "645": "C2AA0",
658
+ "646": "C2AE0",
659
+ "647": "C2AE1",
660
+ "648": "C2AG0",
661
+ "649": "C2AH0",
662
+ "650": "C2AN0",
663
+ "651": "C2AQ0",
664
+ "652": "C2AR0",
665
+ "653": "C2AS0",
666
+ "654": "C2AT0",
667
+ "655": "C2B40",
668
+ "656": "C2BA0",
669
+ "657": "C2BC0",
670
+ "658": "C2BL2",
671
+ "659": "C2BS0",
672
+ "660": "C2BU0",
673
+ "661": "C2BZ0",
674
+ "662": "C2C50",
675
+ "663": "C2CA0",
676
+ "664": "C2CM0",
677
+ "665": "C2CS0",
678
+ "666": "C2D90",
679
+ "667": "C2DO0",
680
+ "668": "C2DV0",
681
+ "669": "C2E10",
682
+ "670": "C2EC0",
683
+ "671": "C2F30",
684
+ "672": "C2F40",
685
+ "673": "C2F80",
686
+ "674": "C2FC0",
687
+ "675": "C2FG0",
688
+ "676": "C2FH0",
689
+ "677": "C2FL0",
690
+ "678": "C2FS0",
691
+ "679": "C2G81",
692
+ "680": "C2GC0",
693
+ "681": "C2GE0",
694
+ "682": "C2GI0",
695
+ "683": "C2GN1",
696
+ "684": "C2GR0",
697
+ "685": "C2GU0",
698
+ "686": "C2GZ0",
699
+ "687": "C2H10",
700
+ "688": "C2H30",
701
+ "689": "C2HA0",
702
+ "690": "C2HF0",
703
+ "691": "C2HG0",
704
+ "692": "C2HP0",
705
+ "693": "C2HV0",
706
+ "694": "C2HZ0",
707
+ "695": "C2HZ1",
708
+ "696": "C2ID0",
709
+ "697": "C2IO0",
710
+ "698": "C2IT0",
711
+ "699": "C2L50",
712
+ "700": "C2LF0",
713
+ "701": "C2LL0",
714
+ "702": "C2LL1",
715
+ "703": "C2LR0",
716
+ "704": "C2LS0",
717
+ "705": "C2M20",
718
+ "706": "C2M40",
719
+ "707": "C2M90",
720
+ "708": "C2MB0",
721
+ "709": "C2MD0",
722
+ "710": "C2MG0",
723
+ "711": "C2ML0",
724
+ "712": "C2MO0",
725
+ "713": "C2N50",
726
+ "714": "C2N60",
727
+ "715": "C2NE1",
728
+ "716": "C2NF0",
729
+ "717": "C2NP0",
730
+ "718": "C2NQ0",
731
+ "719": "C2O60",
732
+ "720": "C2OA0",
733
+ "721": "C2P90",
734
+ "722": "C2P91",
735
+ "723": "C2PA0",
736
+ "724": "C2PH0",
737
+ "725": "C2PM0",
738
+ "726": "C2Q90",
739
+ "727": "C2QN0",
740
+ "728": "C2QN2",
741
+ "729": "C2QZ1",
742
+ "730": "C2R60",
743
+ "731": "C2R70",
744
+ "732": "C2R90",
745
+ "733": "C2RA0",
746
+ "734": "C2RS0",
747
+ "735": "C2S30",
748
+ "736": "C2S80",
749
+ "737": "C2SR0",
750
+ "738": "C2SU0",
751
+ "739": "C2T10",
752
+ "740": "C2T30",
753
+ "741": "C2T60",
754
+ "742": "C2T80",
755
+ "743": "C2TA0",
756
+ "744": "C2TD0",
757
+ "745": "C2TF0",
758
+ "746": "C2TI0",
759
+ "747": "C2TT0",
760
+ "748": "C2U20",
761
+ "749": "C2U30",
762
+ "750": "C2U40",
763
+ "751": "C2U51",
764
+ "752": "C2U60",
765
+ "753": "C2U71",
766
+ "754": "C2U81",
767
+ "755": "C2U82",
768
+ "756": "C2U90",
769
+ "757": "C2UC0",
770
+ "758": "C2UE0",
771
+ "759": "C2UF0",
772
+ "760": "C2UR0",
773
+ "761": "C2UU0",
774
+ "762": "C2VI0",
775
+ "763": "C2VQ0",
776
+ "764": "C2VS0",
777
+ "765": "C2VT0",
778
+ "766": "C2Z70",
779
+ "767": "C2ZA0",
780
+ "768": "C2ZF0",
781
+ "769": "C2ZN2",
782
+ "770": "C2ZV0",
783
+ "771": "C3A41",
784
+ "772": "C3AC0",
785
+ "773": "C3AL2",
786
+ "774": "C3B70",
787
+ "775": "C3C80",
788
+ "776": "C3D20",
789
+ "777": "C3D60",
790
+ "778": "C3DB0",
791
+ "779": "C3DF0",
792
+ "780": "C3DG0",
793
+ "781": "C3DM0",
794
+ "782": "C3DP0",
795
+ "783": "C3DT0",
796
+ "784": "C3E30",
797
+ "785": "C3E50",
798
+ "786": "C3EG1",
799
+ "787": "C3EH0",
800
+ "788": "C3ES0",
801
+ "789": "C3EU0",
802
+ "790": "C3EZ0",
803
+ "791": "C3FM0",
804
+ "792": "C3FO1",
805
+ "793": "C3FP0",
806
+ "794": "C3FT0",
807
+ "795": "C3FU1",
808
+ "796": "C3G80",
809
+ "797": "C3GO0",
810
+ "798": "C3GP0",
811
+ "799": "C3GP1",
812
+ "800": "C3GQ0",
813
+ "801": "C3GT0",
814
+ "802": "C3H30",
815
+ "803": "C3H41",
816
+ "804": "C3H81",
817
+ "805": "C3HA0",
818
+ "806": "C3HC1",
819
+ "807": "C3HN0",
820
+ "808": "C3IB0",
821
+ "809": "C3IC0",
822
+ "810": "CHR28",
823
+ "811": "R0AC0",
824
+ "812": "R0AD0",
825
+ "813": "R0BF0",
826
+ "814": "R0BG0",
827
+ "815": "R0BM0",
828
+ "816": "R0BR0",
829
+ "817": "R0FH0",
830
+ "818": "R0LE0",
831
+ "819": "R0M51",
832
+ "820": "R0N50",
833
+ "821": "R0N90",
834
+ "822": "R0OE0",
835
+ "823": "R0P10",
836
+ "824": "R0RT1",
837
+ "825": "R0S30",
838
+ "826": "R0S70",
839
+ "827": "R0SB0",
840
+ "828": "R0SG0",
841
+ "829": "R0TA0",
842
+ "830": "R0ZT0",
843
+ "831": "R1IT0",
844
+ "832": "R1SC0",
845
+ "833": "RL002",
846
+ "834": "RL003",
847
+ "835": "S025",
848
+ "836": "S035",
849
+ "837": "S040",
850
+ "838": "S045",
851
+ "839": "S050",
852
+ "840": "S052",
853
+ "841": "S055",
854
+ "842": "S060",
855
+ "843": "S065",
856
+ "844": "S070",
857
+ "845": "S072",
858
+ "846": "S075",
859
+ "847": "S080",
860
+ "848": "S082",
861
+ "849": "S085",
862
+ "850": "S090",
863
+ "851": "S095",
864
+ "852": "S100",
865
+ "853": "S101",
866
+ "854": "S115",
867
+ "855": "S120",
868
+ "856": "S125",
869
+ "857": "S130",
870
+ "858": "S135",
871
+ "859": "S140",
872
+ "860": "S141",
873
+ "861": "S145",
874
+ "862": "S210",
875
+ "863": "S215",
876
+ "864": "S225",
877
+ "865": "S235",
878
+ "866": "S310",
879
+ "867": "S315",
880
+ "868": "S320",
881
+ "869": "S325",
882
+ "870": "S330",
883
+ "871": "S345",
884
+ "872": "S360",
885
+ "873": "S365",
886
+ "874": "S370",
887
+ "875": "S380",
888
+ "876": "S395"
889
+ },
890
+ "initializer_range": 0.02,
891
+ "intermediate_size": 3072,
892
+ "label2id": {
893
+ "A0040": 0,
894
+ "A0120": 1,
895
+ "A0125": 2,
896
+ "A0130": 3,
897
+ "A0140": 4,
898
+ "A0150": 5,
899
+ "A0160": 6,
900
+ "A0180": 7,
901
+ "A0190": 8,
902
+ "A0210": 9,
903
+ "A0230": 10,
904
+ "A0240": 11,
905
+ "A0245": 12,
906
+ "A0250": 13,
907
+ "A0260": 14,
908
+ "A0280": 15,
909
+ "A0290": 16,
910
+ "A0300": 17,
911
+ "A0310": 18,
912
+ "A0330": 19,
913
+ "A0340": 20,
914
+ "A0345": 21,
915
+ "A0360": 22,
916
+ "A0370": 23,
917
+ "A0380": 24,
918
+ "A0400": 25,
919
+ "A0420": 26,
920
+ "A0430": 27,
921
+ "A0460": 28,
922
+ "A0480": 29,
923
+ "A0490": 30,
924
+ "A0500": 31,
925
+ "A0510": 32,
926
+ "A0540": 33,
927
+ "A0545": 34,
928
+ "A0550": 35,
929
+ "A0570": 36,
930
+ "A0580": 37,
931
+ "A0675": 38,
932
+ "A0680": 39,
933
+ "A0700": 40,
934
+ "A0720": 41,
935
+ "A0730": 42,
936
+ "A0740": 43,
937
+ "A0770": 44,
938
+ "A0780": 45,
939
+ "A0790": 46,
940
+ "A0835": 47,
941
+ "A0850": 48,
942
+ "A0870": 49,
943
+ "A0880": 50,
944
+ "A0890": 51,
945
+ "A0920": 52,
946
+ "A0950": 53,
947
+ "A0960": 54,
948
+ "A0970": 55,
949
+ "A0980": 56,
950
+ "A0990": 57,
951
+ "A1010": 58,
952
+ "A1030": 59,
953
+ "A1040": 60,
954
+ "A1060": 61,
955
+ "A1080": 62,
956
+ "A1100": 63,
957
+ "A1115": 64,
958
+ "A1120": 65,
959
+ "A1140": 66,
960
+ "A1170": 67,
961
+ "A1180": 68,
962
+ "A1190": 69,
963
+ "A1215": 70,
964
+ "A1220": 71,
965
+ "A1260": 72,
966
+ "A1270": 73,
967
+ "A1280": 74,
968
+ "A1290": 75,
969
+ "A1300": 76,
970
+ "A1350": 77,
971
+ "A1380": 78,
972
+ "A1390": 79,
973
+ "A1410": 80,
974
+ "A1420": 81,
975
+ "A1425": 82,
976
+ "A1450": 83,
977
+ "A1470": 84,
978
+ "A1475": 85,
979
+ "A1490": 86,
980
+ "A1510": 87,
981
+ "A1530": 88,
982
+ "A1550": 89,
983
+ "A1590": 90,
984
+ "A1610": 91,
985
+ "A1630": 92,
986
+ "A1640": 93,
987
+ "A1650": 94,
988
+ "A1688": 95,
989
+ "A1689": 96,
990
+ "A1690": 97,
991
+ "A1710": 98,
992
+ "A1740": 99,
993
+ "A1750": 100,
994
+ "A1760": 101,
995
+ "A1780": 102,
996
+ "A1810": 103,
997
+ "A1820": 104,
998
+ "A1830": 105,
999
+ "A1850": 106,
1000
+ "A1860": 107,
1001
+ "A1870": 108,
1002
+ "A1910": 109,
1003
+ "A1920": 110,
1004
+ "A1930": 111,
1005
+ "A1940": 112,
1006
+ "A1950": 113,
1007
+ "A1970": 114,
1008
+ "A1980": 115,
1009
+ "A1990": 116,
1010
+ "A2010": 117,
1011
+ "A2020": 118,
1012
+ "A2030": 119,
1013
+ "A2040": 120,
1014
+ "A2060": 121,
1015
+ "A2110": 122,
1016
+ "A2180": 123,
1017
+ "A2190": 124,
1018
+ "A2240": 125,
1019
+ "A2300": 126,
1020
+ "A2320": 127,
1021
+ "A2340": 128,
1022
+ "A2341": 129,
1023
+ "A2350": 130,
1024
+ "A2370": 131,
1025
+ "A2380": 132,
1026
+ "A2450": 133,
1027
+ "A2470": 134,
1028
+ "A2490": 135,
1029
+ "A2500": 136,
1030
+ "A2520": 137,
1031
+ "A2530": 138,
1032
+ "A2550": 139,
1033
+ "A2560": 140,
1034
+ "A2580": 141,
1035
+ "A2585": 142,
1036
+ "A2586": 143,
1037
+ "A2590": 144,
1038
+ "A2610": 145,
1039
+ "A2620": 146,
1040
+ "A2640": 147,
1041
+ "A2660": 148,
1042
+ "A2665": 149,
1043
+ "A2670": 150,
1044
+ "A2675": 151,
1045
+ "A2677": 152,
1046
+ "A2730": 153,
1047
+ "A2740": 154,
1048
+ "A2810": 155,
1049
+ "A2820": 156,
1050
+ "A2830": 157,
1051
+ "A2840": 158,
1052
+ "A2880": 159,
1053
+ "A2890": 160,
1054
+ "A3000": 161,
1055
+ "A3020": 162,
1056
+ "A3050": 163,
1057
+ "A3060": 164,
1058
+ "A3080": 165,
1059
+ "A3090": 166,
1060
+ "A3100": 167,
1061
+ "A3125": 168,
1062
+ "A3130": 169,
1063
+ "A3140": 170,
1064
+ "A3160": 171,
1065
+ "A3170": 172,
1066
+ "A3200": 173,
1067
+ "A3225": 174,
1068
+ "A3250": 175,
1069
+ "A3260": 176,
1070
+ "A3263": 177,
1071
+ "A3310": 178,
1072
+ "A3330": 179,
1073
+ "A3360": 180,
1074
+ "A3365": 181,
1075
+ "A3370": 182,
1076
+ "A3380": 183,
1077
+ "A3400": 184,
1078
+ "A3420": 185,
1079
+ "A3430": 186,
1080
+ "A3450": 187,
1081
+ "A3460": 188,
1082
+ "A3470": 189,
1083
+ "A3540": 190,
1084
+ "A3565": 191,
1085
+ "A3570": 192,
1086
+ "A3580": 193,
1087
+ "A3650": 194,
1088
+ "A3670": 195,
1089
+ "A3710": 196,
1090
+ "A3760": 197,
1091
+ "A3785": 198,
1092
+ "A3790": 199,
1093
+ "A3800": 200,
1094
+ "A3810": 201,
1095
+ "A3840": 202,
1096
+ "A3850": 203,
1097
+ "A3860": 204,
1098
+ "A3870": 205,
1099
+ "A3880": 206,
1100
+ "A3890": 207,
1101
+ "A3900": 208,
1102
+ "A3910": 209,
1103
+ "A3915": 210,
1104
+ "A3920": 211,
1105
+ "A3950": 212,
1106
+ "A3980": 213,
1107
+ "A3990": 214,
1108
+ "A4000": 215,
1109
+ "A4010": 216,
1110
+ "A4020": 217,
1111
+ "A4040": 218,
1112
+ "A4050": 219,
1113
+ "A4055": 220,
1114
+ "A4112": 221,
1115
+ "A4120": 222,
1116
+ "A4130": 223,
1117
+ "A4140": 224,
1118
+ "A4160": 225,
1119
+ "A4170": 226,
1120
+ "A4175": 227,
1121
+ "A4180": 228,
1122
+ "A4200": 229,
1123
+ "A4210": 230,
1124
+ "A4250": 231,
1125
+ "A4260": 232,
1126
+ "A4270": 233,
1127
+ "A4274": 234,
1128
+ "A4275": 235,
1129
+ "A4277": 236,
1130
+ "A4280": 237,
1131
+ "A4290": 238,
1132
+ "A4310": 239,
1133
+ "A4320": 240,
1134
+ "A4330": 241,
1135
+ "A4340": 242,
1136
+ "A4380": 243,
1137
+ "A4390": 244,
1138
+ "A4400": 245,
1139
+ "A4420": 246,
1140
+ "A4430": 247,
1141
+ "A4440": 248,
1142
+ "A4460": 249,
1143
+ "A4470": 250,
1144
+ "A4480": 251,
1145
+ "A4490": 252,
1146
+ "A4605": 253,
1147
+ "A4610": 254,
1148
+ "A4630": 255,
1149
+ "A4650": 256,
1150
+ "A4660": 257,
1151
+ "A4661": 258,
1152
+ "A4695": 259,
1153
+ "A4700": 260,
1154
+ "A4710": 261,
1155
+ "A4720": 262,
1156
+ "A4740": 263,
1157
+ "A4760": 264,
1158
+ "A4780": 265,
1159
+ "A4790": 266,
1160
+ "A4810": 267,
1161
+ "A4840": 268,
1162
+ "A4900": 269,
1163
+ "A4960": 270,
1164
+ "A4970": 271,
1165
+ "A5000": 272,
1166
+ "A5010": 273,
1167
+ "A5030": 274,
1168
+ "A5050": 275,
1169
+ "A5070": 276,
1170
+ "A5100": 277,
1171
+ "A5130": 278,
1172
+ "A5150": 279,
1173
+ "A5170": 280,
1174
+ "A5180": 281,
1175
+ "A5210": 282,
1176
+ "A5230": 283,
1177
+ "A5250": 284,
1178
+ "A5260": 285,
1179
+ "A5330": 286,
1180
+ "A5355": 287,
1181
+ "A5360": 288,
1182
+ "A5370": 289,
1183
+ "A5380": 290,
1184
+ "A5400": 291,
1185
+ "A5460": 292,
1186
+ "A5470": 293,
1187
+ "A5480": 294,
1188
+ "A5490": 295,
1189
+ "A5550": 296,
1190
+ "A5630": 297,
1191
+ "A5640": 298,
1192
+ "A5655": 299,
1193
+ "A5660": 300,
1194
+ "A5665": 301,
1195
+ "A5690": 302,
1196
+ "A5700": 303,
1197
+ "A5720": 304,
1198
+ "A5845": 305,
1199
+ "A5860": 306,
1200
+ "A5890": 307,
1201
+ "A5920": 308,
1202
+ "A5940": 309,
1203
+ "A5990": 310,
1204
+ "A6040": 311,
1205
+ "A6050": 312,
1206
+ "A6060": 313,
1207
+ "A6080": 314,
1208
+ "A6100": 315,
1209
+ "A6180": 316,
1210
+ "A6200": 317,
1211
+ "A6210": 318,
1212
+ "A6220": 319,
1213
+ "A6240": 320,
1214
+ "A6250": 321,
1215
+ "A6255": 322,
1216
+ "A6280": 323,
1217
+ "A6290": 324,
1218
+ "A6330": 325,
1219
+ "A6350": 326,
1220
+ "A6390": 327,
1221
+ "A6410": 328,
1222
+ "A6415": 329,
1223
+ "A6430": 330,
1224
+ "A6440": 331,
1225
+ "A6450": 332,
1226
+ "A6470": 333,
1227
+ "A6480": 334,
1228
+ "A6490": 335,
1229
+ "A6500": 336,
1230
+ "A6510": 337,
1231
+ "A6550": 338,
1232
+ "A6560": 339,
1233
+ "A6570": 340,
1234
+ "A6590": 341,
1235
+ "A6640": 342,
1236
+ "A6650": 343,
1237
+ "A6705": 344,
1238
+ "A6720": 345,
1239
+ "A6730": 346,
1240
+ "A6750": 347,
1241
+ "A6760": 348,
1242
+ "A6765": 349,
1243
+ "A6770": 350,
1244
+ "A6780": 351,
1245
+ "A6800": 352,
1246
+ "A6810": 353,
1247
+ "A6820": 354,
1248
+ "A6840": 355,
1249
+ "A6850": 356,
1250
+ "A6900": 357,
1251
+ "A6930": 358,
1252
+ "A6932": 359,
1253
+ "A6935": 360,
1254
+ "A6940": 361,
1255
+ "A6970": 362,
1256
+ "A6990": 363,
1257
+ "A7000": 364,
1258
+ "A7010": 365,
1259
+ "A7030": 366,
1260
+ "A7040": 367,
1261
+ "A7110": 368,
1262
+ "A7115": 369,
1263
+ "A7130": 370,
1264
+ "A7140": 371,
1265
+ "C0A20": 372,
1266
+ "C0A60": 373,
1267
+ "C0AH8": 374,
1268
+ "C0B10": 375,
1269
+ "C0B75": 376,
1270
+ "C0BC0": 377,
1271
+ "C0BI0": 378,
1272
+ "C0BZ0": 379,
1273
+ "C0C90": 380,
1274
+ "C0CE1": 381,
1275
+ "C0CH0": 382,
1276
+ "C0CQ0": 383,
1277
+ "C0CS0": 384,
1278
+ "C0CU0": 385,
1279
+ "C0CV0": 386,
1280
+ "C0DM1": 387,
1281
+ "C0DP0": 388,
1282
+ "C0DT0": 389,
1283
+ "C0DV0": 390,
1284
+ "C0ED0": 391,
1285
+ "C0EG0": 392,
1286
+ "C0FA0": 393,
1287
+ "C0FC0": 394,
1288
+ "C0FD1": 395,
1289
+ "C0FG0": 396,
1290
+ "C0FG1": 397,
1291
+ "C0FG2": 398,
1292
+ "C0FG4": 399,
1293
+ "C0FH0": 400,
1294
+ "C0FN0": 401,
1295
+ "C0FQ0": 402,
1296
+ "C0FT0": 403,
1297
+ "C0FZ0": 404,
1298
+ "C0G61": 405,
1299
+ "C0GC1": 406,
1300
+ "C0GF0": 407,
1301
+ "C0GH0": 408,
1302
+ "C0H50": 409,
1303
+ "C0HF0": 410,
1304
+ "C0HI0": 411,
1305
+ "C0HM0": 412,
1306
+ "C0HR2": 413,
1307
+ "C0HR7": 414,
1308
+ "C0HR8": 415,
1309
+ "C0HR9": 416,
1310
+ "C0HS0": 417,
1311
+ "C0HV0": 418,
1312
+ "C0I90": 419,
1313
+ "C0ID0": 420,
1314
+ "C0IN0": 421,
1315
+ "C0IO0": 422,
1316
+ "C0L30": 423,
1317
+ "C0L40": 424,
1318
+ "C0LF0": 425,
1319
+ "C0LG0": 426,
1320
+ "C0LP1": 427,
1321
+ "C0LQ0": 428,
1322
+ "C0M80": 429,
1323
+ "C0M90": 430,
1324
+ "C0MH0": 431,
1325
+ "C0MN0": 432,
1326
+ "C0MV0": 433,
1327
+ "C0N60": 434,
1328
+ "C0N70": 435,
1329
+ "C0NB0": 436,
1330
+ "C0NE0": 437,
1331
+ "C0NI0": 438,
1332
+ "C0NL0": 439,
1333
+ "C0NM0": 440,
1334
+ "C0NQ0": 441,
1335
+ "C0NR0": 442,
1336
+ "C0NS0": 443,
1337
+ "C0NT0": 444,
1338
+ "C0NU0": 445,
1339
+ "C0NV0": 446,
1340
+ "C0NV1": 447,
1341
+ "C0NZ0": 448,
1342
+ "C0O30": 449,
1343
+ "C0OP0": 450,
1344
+ "C0OV1": 451,
1345
+ "C0OZ0": 452,
1346
+ "C0OZ2": 453,
1347
+ "C0P10": 454,
1348
+ "C0P20": 455,
1349
+ "C0P40": 456,
1350
+ "C0PC0": 457,
1351
+ "C0PF0": 458,
1352
+ "C0PV0": 459,
1353
+ "C0PZ0": 460,
1354
+ "C0Q10": 461,
1355
+ "C0Q20": 462,
1356
+ "C0Q50": 463,
1357
+ "C0QA0": 464,
1358
+ "C0QZ0": 465,
1359
+ "C0RB1": 466,
1360
+ "C0RD1": 467,
1361
+ "C0RE0": 468,
1362
+ "C0RG0": 469,
1363
+ "C0RH0": 470,
1364
+ "C0RH1": 471,
1365
+ "C0RL0": 472,
1366
+ "C0SA0": 473,
1367
+ "C0SL0": 474,
1368
+ "C0SN1": 475,
1369
+ "C0T20": 476,
1370
+ "C0T21": 477,
1371
+ "C0T50": 478,
1372
+ "C0T80": 479,
1373
+ "C0TF0": 480,
1374
+ "C0TQ0": 481,
1375
+ "C0TS0": 482,
1376
+ "C0TU0": 483,
1377
+ "C0U10": 484,
1378
+ "C0U30": 485,
1379
+ "C0UA0": 486,
1380
+ "C0UG0": 487,
1381
+ "C0UL0": 488,
1382
+ "C0UQ0": 489,
1383
+ "C0US0": 490,
1384
+ "C0V10": 491,
1385
+ "C0VA1": 492,
1386
+ "C0VB0": 493,
1387
+ "C0VF0": 494,
1388
+ "C0VG2": 495,
1389
+ "C0VI0": 496,
1390
+ "C0VI1": 497,
1391
+ "C0VL0": 498,
1392
+ "C0VM0": 499,
1393
+ "C0VO0": 500,
1394
+ "C0VQ0": 501,
1395
+ "C0VV0": 502,
1396
+ "C0VZ0": 503,
1397
+ "C0ZG0": 504,
1398
+ "C0ZL0": 505,
1399
+ "C0ZM0": 506,
1400
+ "C0ZP0": 507,
1401
+ "C0ZQ0": 508,
1402
+ "C0ZV0": 509,
1403
+ "C1A11": 510,
1404
+ "C1AI0": 511,
1405
+ "C1B30": 512,
1406
+ "C1BE0": 513,
1407
+ "C1C61": 514,
1408
+ "C1C90": 515,
1409
+ "C1CB0": 516,
1410
+ "C1CF0": 517,
1411
+ "C1CG0": 518,
1412
+ "C1CR0": 519,
1413
+ "C1DL0": 520,
1414
+ "C1DQ0": 521,
1415
+ "C1DT1": 522,
1416
+ "C1E30": 523,
1417
+ "C1EE0": 524,
1418
+ "C1EI0": 525,
1419
+ "C1EU0": 526,
1420
+ "C1EV0": 527,
1421
+ "C1F21": 528,
1422
+ "C1F90": 529,
1423
+ "C1FC0": 530,
1424
+ "C1FD0": 531,
1425
+ "C1FE0": 532,
1426
+ "C1FT0": 533,
1427
+ "C1G60": 534,
1428
+ "C1GB0": 535,
1429
+ "C1GE0": 536,
1430
+ "C1GF0": 537,
1431
+ "C1GH0": 538,
1432
+ "C1GH1": 539,
1433
+ "C1GL0": 540,
1434
+ "C1GN2": 541,
1435
+ "C1GP0": 542,
1436
+ "C1GS0": 543,
1437
+ "C1H21": 544,
1438
+ "C1H90": 545,
1439
+ "C1I60": 546,
1440
+ "C1I90": 547,
1441
+ "C1I91": 548,
1442
+ "C1IZ0": 549,
1443
+ "C1L20": 550,
1444
+ "C1L40": 551,
1445
+ "C1LB2": 552,
1446
+ "C1LC0": 553,
1447
+ "C1LF0": 554,
1448
+ "C1LG0": 555,
1449
+ "C1LI0": 556,
1450
+ "C1LM1": 557,
1451
+ "C1LS0": 558,
1452
+ "C1M10": 559,
1453
+ "C1M20": 560,
1454
+ "C1M30": 561,
1455
+ "C1M40": 562,
1456
+ "C1M60": 563,
1457
+ "C1M61": 564,
1458
+ "C1M70": 565,
1459
+ "C1M80": 566,
1460
+ "C1MA0": 567,
1461
+ "C1MA1": 568,
1462
+ "C1MC0": 569,
1463
+ "C1MP0": 570,
1464
+ "C1MZ0": 571,
1465
+ "C1NC0": 572,
1466
+ "C1NG0": 573,
1467
+ "C1O10": 574,
1468
+ "C1O20": 575,
1469
+ "C1O31": 576,
1470
+ "C1O40": 577,
1471
+ "C1O80": 578,
1472
+ "C1OB0": 579,
1473
+ "C1OB1": 580,
1474
+ "C1OC0": 581,
1475
+ "C1OD1": 582,
1476
+ "C1OD2": 583,
1477
+ "C1ON0": 584,
1478
+ "C1ON2": 585,
1479
+ "C1OR1": 586,
1480
+ "C1OT0": 587,
1481
+ "C1P10": 588,
1482
+ "C1P80": 589,
1483
+ "C1P90": 590,
1484
+ "C1PE0": 591,
1485
+ "C1PG0": 592,
1486
+ "C1PI0": 593,
1487
+ "C1PL0": 594,
1488
+ "C1PM0": 595,
1489
+ "C1Q21": 596,
1490
+ "C1Q31": 597,
1491
+ "C1Q40": 598,
1492
+ "C1QA0": 599,
1493
+ "C1QN0": 600,
1494
+ "C1QP0": 601,
1495
+ "C1QU0": 602,
1496
+ "C1QZ0": 603,
1497
+ "C1RB1": 604,
1498
+ "C1RC0": 605,
1499
+ "C1RD0": 606,
1500
+ "C1RG0": 607,
1501
+ "C1RN0": 608,
1502
+ "C1RV0": 609,
1503
+ "C1S10": 610,
1504
+ "C1S20": 611,
1505
+ "C1SG0": 612,
1506
+ "C1SL1": 613,
1507
+ "C1SM0": 614,
1508
+ "C1SO0": 615,
1509
+ "C1SZ0": 616,
1510
+ "C1T10": 617,
1511
+ "C1T60": 618,
1512
+ "C1TC0": 619,
1513
+ "C1TE0": 620,
1514
+ "C1TF0": 621,
1515
+ "C1TG0": 622,
1516
+ "C1TL0": 623,
1517
+ "C1TQ0": 624,
1518
+ "C1TQ1": 625,
1519
+ "C1TR0": 626,
1520
+ "C1TU0": 627,
1521
+ "C1TV0": 628,
1522
+ "C1U40": 629,
1523
+ "C1UB0": 630,
1524
+ "C1UE0": 631,
1525
+ "C1UI0": 632,
1526
+ "C1V80": 633,
1527
+ "C1VL0": 634,
1528
+ "C1VP0": 635,
1529
+ "C1VT0": 636,
1530
+ "C1Z10": 637,
1531
+ "C1Z40": 638,
1532
+ "C1Z80": 639,
1533
+ "C1Z90": 640,
1534
+ "C1ZD0": 641,
1535
+ "C1ZH0": 642,
1536
+ "C1ZQ0": 643,
1537
+ "C2A30": 644,
1538
+ "C2AA0": 645,
1539
+ "C2AE0": 646,
1540
+ "C2AE1": 647,
1541
+ "C2AG0": 648,
1542
+ "C2AH0": 649,
1543
+ "C2AN0": 650,
1544
+ "C2AQ0": 651,
1545
+ "C2AR0": 652,
1546
+ "C2AS0": 653,
1547
+ "C2AT0": 654,
1548
+ "C2B40": 655,
1549
+ "C2BA0": 656,
1550
+ "C2BC0": 657,
1551
+ "C2BL2": 658,
1552
+ "C2BS0": 659,
1553
+ "C2BU0": 660,
1554
+ "C2BZ0": 661,
1555
+ "C2C50": 662,
1556
+ "C2CA0": 663,
1557
+ "C2CM0": 664,
1558
+ "C2CS0": 665,
1559
+ "C2D90": 666,
1560
+ "C2DO0": 667,
1561
+ "C2DV0": 668,
1562
+ "C2E10": 669,
1563
+ "C2EC0": 670,
1564
+ "C2F30": 671,
1565
+ "C2F40": 672,
1566
+ "C2F80": 673,
1567
+ "C2FC0": 674,
1568
+ "C2FG0": 675,
1569
+ "C2FH0": 676,
1570
+ "C2FL0": 677,
1571
+ "C2FS0": 678,
1572
+ "C2G81": 679,
1573
+ "C2GC0": 680,
1574
+ "C2GE0": 681,
1575
+ "C2GI0": 682,
1576
+ "C2GN1": 683,
1577
+ "C2GR0": 684,
1578
+ "C2GU0": 685,
1579
+ "C2GZ0": 686,
1580
+ "C2H10": 687,
1581
+ "C2H30": 688,
1582
+ "C2HA0": 689,
1583
+ "C2HF0": 690,
1584
+ "C2HG0": 691,
1585
+ "C2HP0": 692,
1586
+ "C2HV0": 693,
1587
+ "C2HZ0": 694,
1588
+ "C2HZ1": 695,
1589
+ "C2ID0": 696,
1590
+ "C2IO0": 697,
1591
+ "C2IT0": 698,
1592
+ "C2L50": 699,
1593
+ "C2LF0": 700,
1594
+ "C2LL0": 701,
1595
+ "C2LL1": 702,
1596
+ "C2LR0": 703,
1597
+ "C2LS0": 704,
1598
+ "C2M20": 705,
1599
+ "C2M40": 706,
1600
+ "C2M90": 707,
1601
+ "C2MB0": 708,
1602
+ "C2MD0": 709,
1603
+ "C2MG0": 710,
1604
+ "C2ML0": 711,
1605
+ "C2MO0": 712,
1606
+ "C2N50": 713,
1607
+ "C2N60": 714,
1608
+ "C2NE1": 715,
1609
+ "C2NF0": 716,
1610
+ "C2NP0": 717,
1611
+ "C2NQ0": 718,
1612
+ "C2O60": 719,
1613
+ "C2OA0": 720,
1614
+ "C2P90": 721,
1615
+ "C2P91": 722,
1616
+ "C2PA0": 723,
1617
+ "C2PH0": 724,
1618
+ "C2PM0": 725,
1619
+ "C2Q90": 726,
1620
+ "C2QN0": 727,
1621
+ "C2QN2": 728,
1622
+ "C2QZ1": 729,
1623
+ "C2R60": 730,
1624
+ "C2R70": 731,
1625
+ "C2R90": 732,
1626
+ "C2RA0": 733,
1627
+ "C2RS0": 734,
1628
+ "C2S30": 735,
1629
+ "C2S80": 736,
1630
+ "C2SR0": 737,
1631
+ "C2SU0": 738,
1632
+ "C2T10": 739,
1633
+ "C2T30": 740,
1634
+ "C2T60": 741,
1635
+ "C2T80": 742,
1636
+ "C2TA0": 743,
1637
+ "C2TD0": 744,
1638
+ "C2TF0": 745,
1639
+ "C2TI0": 746,
1640
+ "C2TT0": 747,
1641
+ "C2U20": 748,
1642
+ "C2U30": 749,
1643
+ "C2U40": 750,
1644
+ "C2U51": 751,
1645
+ "C2U60": 752,
1646
+ "C2U71": 753,
1647
+ "C2U81": 754,
1648
+ "C2U82": 755,
1649
+ "C2U90": 756,
1650
+ "C2UC0": 757,
1651
+ "C2UE0": 758,
1652
+ "C2UF0": 759,
1653
+ "C2UR0": 760,
1654
+ "C2UU0": 761,
1655
+ "C2VI0": 762,
1656
+ "C2VQ0": 763,
1657
+ "C2VS0": 764,
1658
+ "C2VT0": 765,
1659
+ "C2Z70": 766,
1660
+ "C2ZA0": 767,
1661
+ "C2ZF0": 768,
1662
+ "C2ZN2": 769,
1663
+ "C2ZV0": 770,
1664
+ "C3A41": 771,
1665
+ "C3AC0": 772,
1666
+ "C3AL2": 773,
1667
+ "C3B70": 774,
1668
+ "C3C80": 775,
1669
+ "C3D20": 776,
1670
+ "C3D60": 777,
1671
+ "C3DB0": 778,
1672
+ "C3DF0": 779,
1673
+ "C3DG0": 780,
1674
+ "C3DM0": 781,
1675
+ "C3DP0": 782,
1676
+ "C3DT0": 783,
1677
+ "C3E30": 784,
1678
+ "C3E50": 785,
1679
+ "C3EG1": 786,
1680
+ "C3EH0": 787,
1681
+ "C3ES0": 788,
1682
+ "C3EU0": 789,
1683
+ "C3EZ0": 790,
1684
+ "C3FM0": 791,
1685
+ "C3FO1": 792,
1686
+ "C3FP0": 793,
1687
+ "C3FT0": 794,
1688
+ "C3FU1": 795,
1689
+ "C3G80": 796,
1690
+ "C3GO0": 797,
1691
+ "C3GP0": 798,
1692
+ "C3GP1": 799,
1693
+ "C3GQ0": 800,
1694
+ "C3GT0": 801,
1695
+ "C3H30": 802,
1696
+ "C3H41": 803,
1697
+ "C3H81": 804,
1698
+ "C3HA0": 805,
1699
+ "C3HC1": 806,
1700
+ "C3HN0": 807,
1701
+ "C3IB0": 808,
1702
+ "C3IC0": 809,
1703
+ "CHR28": 810,
1704
+ "R0AC0": 811,
1705
+ "R0AD0": 812,
1706
+ "R0BF0": 813,
1707
+ "R0BG0": 814,
1708
+ "R0BM0": 815,
1709
+ "R0BR0": 816,
1710
+ "R0FH0": 817,
1711
+ "R0LE0": 818,
1712
+ "R0M51": 819,
1713
+ "R0N50": 820,
1714
+ "R0N90": 821,
1715
+ "R0OE0": 822,
1716
+ "R0P10": 823,
1717
+ "R0RT1": 824,
1718
+ "R0S30": 825,
1719
+ "R0S70": 826,
1720
+ "R0SB0": 827,
1721
+ "R0SG0": 828,
1722
+ "R0TA0": 829,
1723
+ "R0ZT0": 830,
1724
+ "R1IT0": 831,
1725
+ "R1SC0": 832,
1726
+ "RL002": 833,
1727
+ "RL003": 834,
1728
+ "S025": 835,
1729
+ "S035": 836,
1730
+ "S040": 837,
1731
+ "S045": 838,
1732
+ "S050": 839,
1733
+ "S052": 840,
1734
+ "S055": 841,
1735
+ "S060": 842,
1736
+ "S065": 843,
1737
+ "S070": 844,
1738
+ "S072": 845,
1739
+ "S075": 846,
1740
+ "S080": 847,
1741
+ "S082": 848,
1742
+ "S085": 849,
1743
+ "S090": 850,
1744
+ "S095": 851,
1745
+ "S100": 852,
1746
+ "S101": 853,
1747
+ "S115": 854,
1748
+ "S120": 855,
1749
+ "S125": 856,
1750
+ "S130": 857,
1751
+ "S135": 858,
1752
+ "S140": 859,
1753
+ "S141": 860,
1754
+ "S145": 861,
1755
+ "S210": 862,
1756
+ "S215": 863,
1757
+ "S225": 864,
1758
+ "S235": 865,
1759
+ "S310": 866,
1760
+ "S315": 867,
1761
+ "S320": 868,
1762
+ "S325": 869,
1763
+ "S330": 870,
1764
+ "S345": 871,
1765
+ "S360": 872,
1766
+ "S365": 873,
1767
+ "S370": 874,
1768
+ "S380": 875,
1769
+ "S395": 876
1770
+ },
1771
+ "layer_norm_eps": 1e-12,
1772
+ "max_position_embeddings": 512,
1773
+ "model_type": "bert",
1774
+ "num_attention_heads": 12,
1775
+ "num_hidden_layers": 12,
1776
+ "pad_token_id": 0,
1777
+ "position_embedding_type": "absolute",
1778
+ "problem_type": "multi_label_classification",
1779
+ "torch_dtype": "float32",
1780
+ "transformers_version": "4.26.0",
1781
+ "type_vocab_size": 2,
1782
+ "use_cache": true,
1783
+ "vocab_size": 32102
1784
+ }
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f84c92e44f1ce49fec1f7a096671c64793107ac58e59d38d1faf0db25c04565d
3
+ size 891078981
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e40bc59b808d3dcbbc1cec3fa0336217303296fae82b2f7b5b789e6c113fb5f7
3
+ size 445553141
rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6236289b139e8623447deec63baeea4b354ddd3df967c98c84e350585de338a
3
+ size 14575
scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:875f6351c1c12ffbbb98d07d1de8a415aebb94934ff05990faebaa1b60936c2b
3
+ size 627
special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "do_basic_tokenize": true,
4
+ "do_lower_case": true,
5
+ "mask_token": "[MASK]",
6
+ "max_len": 512,
7
+ "model_max_length": 512,
8
+ "name_or_path": "dbmdz/bert-base-italian-xxl-uncased",
9
+ "never_split": null,
10
+ "pad_token": "[PAD]",
11
+ "sep_token": "[SEP]",
12
+ "special_tokens_map_file": null,
13
+ "strip_accents": null,
14
+ "tokenize_chinese_chars": true,
15
+ "tokenizer_class": "BertTokenizer",
16
+ "unk_token": "[UNK]"
17
+ }
trainer_state.json ADDED
@@ -0,0 +1,1519 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.8538806684223458,
3
+ "best_model_checkpoint": "output/ipzs-sg-bert_xxl-bs-16/checkpoint-114021",
4
+ "epoch": 9.0,
5
+ "global_step": 114021,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.04,
12
+ "learning_rate": 3.505111768884679e-05,
13
+ "loss": 0.0964,
14
+ "step": 500
15
+ },
16
+ {
17
+ "epoch": 0.08,
18
+ "learning_rate": 3.491223537769359e-05,
19
+ "loss": 0.0133,
20
+ "step": 1000
21
+ },
22
+ {
23
+ "epoch": 0.12,
24
+ "learning_rate": 3.4773353066540374e-05,
25
+ "loss": 0.0109,
26
+ "step": 1500
27
+ },
28
+ {
29
+ "epoch": 0.16,
30
+ "learning_rate": 3.463447075538717e-05,
31
+ "loss": 0.0102,
32
+ "step": 2000
33
+ },
34
+ {
35
+ "epoch": 0.2,
36
+ "learning_rate": 3.4495588444233954e-05,
37
+ "loss": 0.0099,
38
+ "step": 2500
39
+ },
40
+ {
41
+ "epoch": 0.24,
42
+ "learning_rate": 3.435670613308075e-05,
43
+ "loss": 0.0098,
44
+ "step": 3000
45
+ },
46
+ {
47
+ "epoch": 0.28,
48
+ "learning_rate": 3.421782382192754e-05,
49
+ "loss": 0.0096,
50
+ "step": 3500
51
+ },
52
+ {
53
+ "epoch": 0.32,
54
+ "learning_rate": 3.407894151077433e-05,
55
+ "loss": 0.0088,
56
+ "step": 4000
57
+ },
58
+ {
59
+ "epoch": 0.36,
60
+ "learning_rate": 3.394005919962113e-05,
61
+ "loss": 0.0074,
62
+ "step": 4500
63
+ },
64
+ {
65
+ "epoch": 0.39,
66
+ "learning_rate": 3.3801176888467914e-05,
67
+ "loss": 0.0064,
68
+ "step": 5000
69
+ },
70
+ {
71
+ "epoch": 0.43,
72
+ "learning_rate": 3.36622945773147e-05,
73
+ "loss": 0.0057,
74
+ "step": 5500
75
+ },
76
+ {
77
+ "epoch": 0.47,
78
+ "learning_rate": 3.35234122661615e-05,
79
+ "loss": 0.005,
80
+ "step": 6000
81
+ },
82
+ {
83
+ "epoch": 0.51,
84
+ "learning_rate": 3.338452995500829e-05,
85
+ "loss": 0.0048,
86
+ "step": 6500
87
+ },
88
+ {
89
+ "epoch": 0.55,
90
+ "learning_rate": 3.324564764385508e-05,
91
+ "loss": 0.0042,
92
+ "step": 7000
93
+ },
94
+ {
95
+ "epoch": 0.59,
96
+ "learning_rate": 3.310676533270187e-05,
97
+ "loss": 0.0039,
98
+ "step": 7500
99
+ },
100
+ {
101
+ "epoch": 0.63,
102
+ "learning_rate": 3.296788302154867e-05,
103
+ "loss": 0.0038,
104
+ "step": 8000
105
+ },
106
+ {
107
+ "epoch": 0.67,
108
+ "learning_rate": 3.2829000710395454e-05,
109
+ "loss": 0.0036,
110
+ "step": 8500
111
+ },
112
+ {
113
+ "epoch": 0.71,
114
+ "learning_rate": 3.269011839924224e-05,
115
+ "loss": 0.0036,
116
+ "step": 9000
117
+ },
118
+ {
119
+ "epoch": 0.75,
120
+ "learning_rate": 3.255123608808904e-05,
121
+ "loss": 0.0033,
122
+ "step": 9500
123
+ },
124
+ {
125
+ "epoch": 0.79,
126
+ "learning_rate": 3.241235377693583e-05,
127
+ "loss": 0.0033,
128
+ "step": 10000
129
+ },
130
+ {
131
+ "epoch": 0.83,
132
+ "learning_rate": 3.227347146578262e-05,
133
+ "loss": 0.0031,
134
+ "step": 10500
135
+ },
136
+ {
137
+ "epoch": 0.87,
138
+ "learning_rate": 3.2134589154629414e-05,
139
+ "loss": 0.003,
140
+ "step": 11000
141
+ },
142
+ {
143
+ "epoch": 0.91,
144
+ "learning_rate": 3.19957068434762e-05,
145
+ "loss": 0.0029,
146
+ "step": 11500
147
+ },
148
+ {
149
+ "epoch": 0.95,
150
+ "learning_rate": 3.1856824532322994e-05,
151
+ "loss": 0.0029,
152
+ "step": 12000
153
+ },
154
+ {
155
+ "epoch": 0.99,
156
+ "learning_rate": 3.171794222116978e-05,
157
+ "loss": 0.0028,
158
+ "step": 12500
159
+ },
160
+ {
161
+ "epoch": 1.0,
162
+ "eval_accuracy": 0.6213869893484506,
163
+ "eval_f1": 0.7871180162568165,
164
+ "eval_f1_macro": 0.09915671829069983,
165
+ "eval_f1_weighted": 0.7187367346051451,
166
+ "eval_loss": 0.00270162639208138,
167
+ "eval_p": 0.8552003089493689,
168
+ "eval_r": 0.7290764165655865,
169
+ "eval_roc_auc": 0.8644347845537721,
170
+ "eval_runtime": 154.8297,
171
+ "eval_samples_per_second": 508.133,
172
+ "eval_steps_per_second": 31.764,
173
+ "step": 12669
174
+ },
175
+ {
176
+ "epoch": 1.03,
177
+ "learning_rate": 3.157905991001658e-05,
178
+ "loss": 0.0027,
179
+ "step": 13000
180
+ },
181
+ {
182
+ "epoch": 1.07,
183
+ "learning_rate": 3.144017759886337e-05,
184
+ "loss": 0.0026,
185
+ "step": 13500
186
+ },
187
+ {
188
+ "epoch": 1.11,
189
+ "learning_rate": 3.1301295287710154e-05,
190
+ "loss": 0.0026,
191
+ "step": 14000
192
+ },
193
+ {
194
+ "epoch": 1.14,
195
+ "learning_rate": 3.1162412976556954e-05,
196
+ "loss": 0.0026,
197
+ "step": 14500
198
+ },
199
+ {
200
+ "epoch": 1.18,
201
+ "learning_rate": 3.102353066540374e-05,
202
+ "loss": 0.0025,
203
+ "step": 15000
204
+ },
205
+ {
206
+ "epoch": 1.22,
207
+ "learning_rate": 3.0884648354250534e-05,
208
+ "loss": 0.0025,
209
+ "step": 15500
210
+ },
211
+ {
212
+ "epoch": 1.26,
213
+ "learning_rate": 3.074576604309732e-05,
214
+ "loss": 0.0025,
215
+ "step": 16000
216
+ },
217
+ {
218
+ "epoch": 1.3,
219
+ "learning_rate": 3.0606883731944114e-05,
220
+ "loss": 0.0025,
221
+ "step": 16500
222
+ },
223
+ {
224
+ "epoch": 1.34,
225
+ "learning_rate": 3.0468001420790908e-05,
226
+ "loss": 0.0024,
227
+ "step": 17000
228
+ },
229
+ {
230
+ "epoch": 1.38,
231
+ "learning_rate": 3.0329119109637698e-05,
232
+ "loss": 0.0023,
233
+ "step": 17500
234
+ },
235
+ {
236
+ "epoch": 1.42,
237
+ "learning_rate": 3.019023679848449e-05,
238
+ "loss": 0.0023,
239
+ "step": 18000
240
+ },
241
+ {
242
+ "epoch": 1.46,
243
+ "learning_rate": 3.005135448733128e-05,
244
+ "loss": 0.0022,
245
+ "step": 18500
246
+ },
247
+ {
248
+ "epoch": 1.5,
249
+ "learning_rate": 2.991247217617807e-05,
250
+ "loss": 0.0024,
251
+ "step": 19000
252
+ },
253
+ {
254
+ "epoch": 1.54,
255
+ "learning_rate": 2.9773589865024864e-05,
256
+ "loss": 0.0023,
257
+ "step": 19500
258
+ },
259
+ {
260
+ "epoch": 1.58,
261
+ "learning_rate": 2.9634707553871654e-05,
262
+ "loss": 0.0023,
263
+ "step": 20000
264
+ },
265
+ {
266
+ "epoch": 1.62,
267
+ "learning_rate": 2.9495825242718448e-05,
268
+ "loss": 0.0022,
269
+ "step": 20500
270
+ },
271
+ {
272
+ "epoch": 1.66,
273
+ "learning_rate": 2.9356942931565238e-05,
274
+ "loss": 0.0022,
275
+ "step": 21000
276
+ },
277
+ {
278
+ "epoch": 1.7,
279
+ "learning_rate": 2.921806062041203e-05,
280
+ "loss": 0.0022,
281
+ "step": 21500
282
+ },
283
+ {
284
+ "epoch": 1.74,
285
+ "learning_rate": 2.907917830925882e-05,
286
+ "loss": 0.0021,
287
+ "step": 22000
288
+ },
289
+ {
290
+ "epoch": 1.78,
291
+ "learning_rate": 2.894029599810561e-05,
292
+ "loss": 0.0021,
293
+ "step": 22500
294
+ },
295
+ {
296
+ "epoch": 1.82,
297
+ "learning_rate": 2.8801413686952405e-05,
298
+ "loss": 0.0021,
299
+ "step": 23000
300
+ },
301
+ {
302
+ "epoch": 1.85,
303
+ "learning_rate": 2.8662531375799195e-05,
304
+ "loss": 0.0021,
305
+ "step": 23500
306
+ },
307
+ {
308
+ "epoch": 1.89,
309
+ "learning_rate": 2.8523649064645988e-05,
310
+ "loss": 0.0021,
311
+ "step": 24000
312
+ },
313
+ {
314
+ "epoch": 1.93,
315
+ "learning_rate": 2.8384766753492778e-05,
316
+ "loss": 0.0021,
317
+ "step": 24500
318
+ },
319
+ {
320
+ "epoch": 1.97,
321
+ "learning_rate": 2.8245884442339568e-05,
322
+ "loss": 0.0021,
323
+ "step": 25000
324
+ },
325
+ {
326
+ "epoch": 2.0,
327
+ "eval_accuracy": 0.6822711442153697,
328
+ "eval_f1": 0.8278927653585252,
329
+ "eval_f1_macro": 0.17721735370294905,
330
+ "eval_f1_weighted": 0.7911965688289363,
331
+ "eval_loss": 0.002050888491794467,
332
+ "eval_p": 0.8518841031375748,
333
+ "eval_r": 0.8052157338416219,
334
+ "eval_roc_auc": 0.9024905715784995,
335
+ "eval_runtime": 150.3062,
336
+ "eval_samples_per_second": 523.425,
337
+ "eval_steps_per_second": 32.72,
338
+ "step": 25338
339
+ },
340
+ {
341
+ "epoch": 2.01,
342
+ "learning_rate": 2.810700213118636e-05,
343
+ "loss": 0.002,
344
+ "step": 25500
345
+ },
346
+ {
347
+ "epoch": 2.05,
348
+ "learning_rate": 2.796811982003315e-05,
349
+ "loss": 0.002,
350
+ "step": 26000
351
+ },
352
+ {
353
+ "epoch": 2.09,
354
+ "learning_rate": 2.7829237508879945e-05,
355
+ "loss": 0.0019,
356
+ "step": 26500
357
+ },
358
+ {
359
+ "epoch": 2.13,
360
+ "learning_rate": 2.7690355197726735e-05,
361
+ "loss": 0.0019,
362
+ "step": 27000
363
+ },
364
+ {
365
+ "epoch": 2.17,
366
+ "learning_rate": 2.7551472886573525e-05,
367
+ "loss": 0.0018,
368
+ "step": 27500
369
+ },
370
+ {
371
+ "epoch": 2.21,
372
+ "learning_rate": 2.7412590575420318e-05,
373
+ "loss": 0.0019,
374
+ "step": 28000
375
+ },
376
+ {
377
+ "epoch": 2.25,
378
+ "learning_rate": 2.7273708264267108e-05,
379
+ "loss": 0.0019,
380
+ "step": 28500
381
+ },
382
+ {
383
+ "epoch": 2.29,
384
+ "learning_rate": 2.71348259531139e-05,
385
+ "loss": 0.0018,
386
+ "step": 29000
387
+ },
388
+ {
389
+ "epoch": 2.33,
390
+ "learning_rate": 2.699594364196069e-05,
391
+ "loss": 0.0019,
392
+ "step": 29500
393
+ },
394
+ {
395
+ "epoch": 2.37,
396
+ "learning_rate": 2.685706133080748e-05,
397
+ "loss": 0.0018,
398
+ "step": 30000
399
+ },
400
+ {
401
+ "epoch": 2.41,
402
+ "learning_rate": 2.6718179019654275e-05,
403
+ "loss": 0.0017,
404
+ "step": 30500
405
+ },
406
+ {
407
+ "epoch": 2.45,
408
+ "learning_rate": 2.6579296708501065e-05,
409
+ "loss": 0.0018,
410
+ "step": 31000
411
+ },
412
+ {
413
+ "epoch": 2.49,
414
+ "learning_rate": 2.644041439734786e-05,
415
+ "loss": 0.0018,
416
+ "step": 31500
417
+ },
418
+ {
419
+ "epoch": 2.53,
420
+ "learning_rate": 2.630153208619465e-05,
421
+ "loss": 0.0018,
422
+ "step": 32000
423
+ },
424
+ {
425
+ "epoch": 2.57,
426
+ "learning_rate": 2.616264977504144e-05,
427
+ "loss": 0.0018,
428
+ "step": 32500
429
+ },
430
+ {
431
+ "epoch": 2.6,
432
+ "learning_rate": 2.6023767463888232e-05,
433
+ "loss": 0.0018,
434
+ "step": 33000
435
+ },
436
+ {
437
+ "epoch": 2.64,
438
+ "learning_rate": 2.5884885152735022e-05,
439
+ "loss": 0.0017,
440
+ "step": 33500
441
+ },
442
+ {
443
+ "epoch": 2.68,
444
+ "learning_rate": 2.5746002841581815e-05,
445
+ "loss": 0.0017,
446
+ "step": 34000
447
+ },
448
+ {
449
+ "epoch": 2.72,
450
+ "learning_rate": 2.5607120530428605e-05,
451
+ "loss": 0.0017,
452
+ "step": 34500
453
+ },
454
+ {
455
+ "epoch": 2.76,
456
+ "learning_rate": 2.5468238219275395e-05,
457
+ "loss": 0.0017,
458
+ "step": 35000
459
+ },
460
+ {
461
+ "epoch": 2.8,
462
+ "learning_rate": 2.532935590812219e-05,
463
+ "loss": 0.0018,
464
+ "step": 35500
465
+ },
466
+ {
467
+ "epoch": 2.84,
468
+ "learning_rate": 2.519047359696898e-05,
469
+ "loss": 0.0018,
470
+ "step": 36000
471
+ },
472
+ {
473
+ "epoch": 2.88,
474
+ "learning_rate": 2.5051591285815772e-05,
475
+ "loss": 0.0017,
476
+ "step": 36500
477
+ },
478
+ {
479
+ "epoch": 2.92,
480
+ "learning_rate": 2.4912708974662562e-05,
481
+ "loss": 0.0018,
482
+ "step": 37000
483
+ },
484
+ {
485
+ "epoch": 2.96,
486
+ "learning_rate": 2.4773826663509355e-05,
487
+ "loss": 0.0018,
488
+ "step": 37500
489
+ },
490
+ {
491
+ "epoch": 3.0,
492
+ "learning_rate": 2.4634944352356145e-05,
493
+ "loss": 0.0018,
494
+ "step": 38000
495
+ },
496
+ {
497
+ "epoch": 3.0,
498
+ "eval_accuracy": 0.6974095635152655,
499
+ "eval_f1": 0.8369747009165567,
500
+ "eval_f1_macro": 0.21887278841705338,
501
+ "eval_f1_weighted": 0.8081134454474668,
502
+ "eval_loss": 0.001851799781434238,
503
+ "eval_p": 0.8528991177184794,
504
+ "eval_r": 0.8216340322301161,
505
+ "eval_roc_auc": 0.910698290784354,
506
+ "eval_runtime": 150.2603,
507
+ "eval_samples_per_second": 523.585,
508
+ "eval_steps_per_second": 32.73,
509
+ "step": 38007
510
+ },
511
+ {
512
+ "epoch": 3.04,
513
+ "learning_rate": 2.4496062041202935e-05,
514
+ "loss": 0.0016,
515
+ "step": 38500
516
+ },
517
+ {
518
+ "epoch": 3.08,
519
+ "learning_rate": 2.435717973004973e-05,
520
+ "loss": 0.0015,
521
+ "step": 39000
522
+ },
523
+ {
524
+ "epoch": 3.12,
525
+ "learning_rate": 2.421829741889652e-05,
526
+ "loss": 0.0016,
527
+ "step": 39500
528
+ },
529
+ {
530
+ "epoch": 3.16,
531
+ "learning_rate": 2.4079415107743312e-05,
532
+ "loss": 0.0016,
533
+ "step": 40000
534
+ },
535
+ {
536
+ "epoch": 3.2,
537
+ "learning_rate": 2.3940532796590102e-05,
538
+ "loss": 0.0015,
539
+ "step": 40500
540
+ },
541
+ {
542
+ "epoch": 3.24,
543
+ "learning_rate": 2.3801650485436892e-05,
544
+ "loss": 0.0016,
545
+ "step": 41000
546
+ },
547
+ {
548
+ "epoch": 3.28,
549
+ "learning_rate": 2.3662768174283686e-05,
550
+ "loss": 0.0015,
551
+ "step": 41500
552
+ },
553
+ {
554
+ "epoch": 3.32,
555
+ "learning_rate": 2.3523885863130476e-05,
556
+ "loss": 0.0015,
557
+ "step": 42000
558
+ },
559
+ {
560
+ "epoch": 3.35,
561
+ "learning_rate": 2.338500355197727e-05,
562
+ "loss": 0.0015,
563
+ "step": 42500
564
+ },
565
+ {
566
+ "epoch": 3.39,
567
+ "learning_rate": 2.324612124082406e-05,
568
+ "loss": 0.0016,
569
+ "step": 43000
570
+ },
571
+ {
572
+ "epoch": 3.43,
573
+ "learning_rate": 2.310723892967085e-05,
574
+ "loss": 0.0016,
575
+ "step": 43500
576
+ },
577
+ {
578
+ "epoch": 3.47,
579
+ "learning_rate": 2.2968356618517642e-05,
580
+ "loss": 0.0016,
581
+ "step": 44000
582
+ },
583
+ {
584
+ "epoch": 3.51,
585
+ "learning_rate": 2.2829474307364432e-05,
586
+ "loss": 0.0015,
587
+ "step": 44500
588
+ },
589
+ {
590
+ "epoch": 3.55,
591
+ "learning_rate": 2.2690591996211226e-05,
592
+ "loss": 0.0015,
593
+ "step": 45000
594
+ },
595
+ {
596
+ "epoch": 3.59,
597
+ "learning_rate": 2.2551709685058016e-05,
598
+ "loss": 0.0016,
599
+ "step": 45500
600
+ },
601
+ {
602
+ "epoch": 3.63,
603
+ "learning_rate": 2.2412827373904806e-05,
604
+ "loss": 0.0015,
605
+ "step": 46000
606
+ },
607
+ {
608
+ "epoch": 3.67,
609
+ "learning_rate": 2.22739450627516e-05,
610
+ "loss": 0.0015,
611
+ "step": 46500
612
+ },
613
+ {
614
+ "epoch": 3.71,
615
+ "learning_rate": 2.213506275159839e-05,
616
+ "loss": 0.0015,
617
+ "step": 47000
618
+ },
619
+ {
620
+ "epoch": 3.75,
621
+ "learning_rate": 2.1996180440445182e-05,
622
+ "loss": 0.0015,
623
+ "step": 47500
624
+ },
625
+ {
626
+ "epoch": 3.79,
627
+ "learning_rate": 2.1857298129291972e-05,
628
+ "loss": 0.0015,
629
+ "step": 48000
630
+ },
631
+ {
632
+ "epoch": 3.83,
633
+ "learning_rate": 2.1718415818138762e-05,
634
+ "loss": 0.0015,
635
+ "step": 48500
636
+ },
637
+ {
638
+ "epoch": 3.87,
639
+ "learning_rate": 2.1579533506985556e-05,
640
+ "loss": 0.0015,
641
+ "step": 49000
642
+ },
643
+ {
644
+ "epoch": 3.91,
645
+ "learning_rate": 2.1440651195832346e-05,
646
+ "loss": 0.0015,
647
+ "step": 49500
648
+ },
649
+ {
650
+ "epoch": 3.95,
651
+ "learning_rate": 2.130176888467914e-05,
652
+ "loss": 0.0015,
653
+ "step": 50000
654
+ },
655
+ {
656
+ "epoch": 3.99,
657
+ "learning_rate": 2.116288657352593e-05,
658
+ "loss": 0.0015,
659
+ "step": 50500
660
+ },
661
+ {
662
+ "epoch": 4.0,
663
+ "eval_accuracy": 0.710870173119455,
664
+ "eval_f1": 0.8427627441351563,
665
+ "eval_f1_macro": 0.276326750740236,
666
+ "eval_f1_weighted": 0.8243063205078164,
667
+ "eval_loss": 0.0018125491915270686,
668
+ "eval_p": 0.8380480784058393,
669
+ "eval_r": 0.8475307572344482,
670
+ "eval_roc_auc": 0.923628157802133,
671
+ "eval_runtime": 150.1179,
672
+ "eval_samples_per_second": 524.082,
673
+ "eval_steps_per_second": 32.761,
674
+ "step": 50676
675
+ },
676
+ {
677
+ "epoch": 4.03,
678
+ "learning_rate": 2.1024004262372723e-05,
679
+ "loss": 0.0014,
680
+ "step": 51000
681
+ },
682
+ {
683
+ "epoch": 4.07,
684
+ "learning_rate": 2.0885121951219513e-05,
685
+ "loss": 0.0014,
686
+ "step": 51500
687
+ },
688
+ {
689
+ "epoch": 4.1,
690
+ "learning_rate": 2.0746239640066303e-05,
691
+ "loss": 0.0013,
692
+ "step": 52000
693
+ },
694
+ {
695
+ "epoch": 4.14,
696
+ "learning_rate": 2.0607357328913096e-05,
697
+ "loss": 0.0013,
698
+ "step": 52500
699
+ },
700
+ {
701
+ "epoch": 4.18,
702
+ "learning_rate": 2.0468475017759886e-05,
703
+ "loss": 0.0013,
704
+ "step": 53000
705
+ },
706
+ {
707
+ "epoch": 4.22,
708
+ "learning_rate": 2.032959270660668e-05,
709
+ "loss": 0.0013,
710
+ "step": 53500
711
+ },
712
+ {
713
+ "epoch": 4.26,
714
+ "learning_rate": 2.019071039545347e-05,
715
+ "loss": 0.0013,
716
+ "step": 54000
717
+ },
718
+ {
719
+ "epoch": 4.3,
720
+ "learning_rate": 2.005182808430026e-05,
721
+ "loss": 0.0013,
722
+ "step": 54500
723
+ },
724
+ {
725
+ "epoch": 4.34,
726
+ "learning_rate": 1.9912945773147053e-05,
727
+ "loss": 0.0013,
728
+ "step": 55000
729
+ },
730
+ {
731
+ "epoch": 4.38,
732
+ "learning_rate": 1.9774063461993843e-05,
733
+ "loss": 0.0013,
734
+ "step": 55500
735
+ },
736
+ {
737
+ "epoch": 4.42,
738
+ "learning_rate": 1.9635181150840636e-05,
739
+ "loss": 0.0014,
740
+ "step": 56000
741
+ },
742
+ {
743
+ "epoch": 4.46,
744
+ "learning_rate": 1.9496298839687426e-05,
745
+ "loss": 0.0013,
746
+ "step": 56500
747
+ },
748
+ {
749
+ "epoch": 4.5,
750
+ "learning_rate": 1.9357416528534216e-05,
751
+ "loss": 0.0014,
752
+ "step": 57000
753
+ },
754
+ {
755
+ "epoch": 4.54,
756
+ "learning_rate": 1.921853421738101e-05,
757
+ "loss": 0.0014,
758
+ "step": 57500
759
+ },
760
+ {
761
+ "epoch": 4.58,
762
+ "learning_rate": 1.90796519062278e-05,
763
+ "loss": 0.0013,
764
+ "step": 58000
765
+ },
766
+ {
767
+ "epoch": 4.62,
768
+ "learning_rate": 1.8940769595074593e-05,
769
+ "loss": 0.0013,
770
+ "step": 58500
771
+ },
772
+ {
773
+ "epoch": 4.66,
774
+ "learning_rate": 1.8801887283921383e-05,
775
+ "loss": 0.0013,
776
+ "step": 59000
777
+ },
778
+ {
779
+ "epoch": 4.7,
780
+ "learning_rate": 1.8663004972768173e-05,
781
+ "loss": 0.0013,
782
+ "step": 59500
783
+ },
784
+ {
785
+ "epoch": 4.74,
786
+ "learning_rate": 1.8524122661614966e-05,
787
+ "loss": 0.0014,
788
+ "step": 60000
789
+ },
790
+ {
791
+ "epoch": 4.78,
792
+ "learning_rate": 1.8385240350461756e-05,
793
+ "loss": 0.0013,
794
+ "step": 60500
795
+ },
796
+ {
797
+ "epoch": 4.81,
798
+ "learning_rate": 1.824635803930855e-05,
799
+ "loss": 0.0014,
800
+ "step": 61000
801
+ },
802
+ {
803
+ "epoch": 4.85,
804
+ "learning_rate": 1.810747572815534e-05,
805
+ "loss": 0.0013,
806
+ "step": 61500
807
+ },
808
+ {
809
+ "epoch": 4.89,
810
+ "learning_rate": 1.796859341700213e-05,
811
+ "loss": 0.0014,
812
+ "step": 62000
813
+ },
814
+ {
815
+ "epoch": 4.93,
816
+ "learning_rate": 1.7829711105848923e-05,
817
+ "loss": 0.0013,
818
+ "step": 62500
819
+ },
820
+ {
821
+ "epoch": 4.97,
822
+ "learning_rate": 1.7690828794695713e-05,
823
+ "loss": 0.0013,
824
+ "step": 63000
825
+ },
826
+ {
827
+ "epoch": 5.0,
828
+ "eval_accuracy": 0.71883976917406,
829
+ "eval_f1": 0.8474025833437978,
830
+ "eval_f1_macro": 0.28796797014277603,
831
+ "eval_f1_weighted": 0.8288548463559504,
832
+ "eval_loss": 0.0016964372480288148,
833
+ "eval_p": 0.8470321413422668,
834
+ "eval_r": 0.8477733495061515,
835
+ "eval_roc_auc": 0.9237584040683807,
836
+ "eval_runtime": 151.5541,
837
+ "eval_samples_per_second": 519.115,
838
+ "eval_steps_per_second": 32.45,
839
+ "step": 63345
840
+ },
841
+ {
842
+ "epoch": 5.01,
843
+ "learning_rate": 1.7551946483542503e-05,
844
+ "loss": 0.0013,
845
+ "step": 63500
846
+ },
847
+ {
848
+ "epoch": 5.05,
849
+ "learning_rate": 1.7413064172389297e-05,
850
+ "loss": 0.0012,
851
+ "step": 64000
852
+ },
853
+ {
854
+ "epoch": 5.09,
855
+ "learning_rate": 1.7274181861236087e-05,
856
+ "loss": 0.0012,
857
+ "step": 64500
858
+ },
859
+ {
860
+ "epoch": 5.13,
861
+ "learning_rate": 1.713529955008288e-05,
862
+ "loss": 0.0011,
863
+ "step": 65000
864
+ },
865
+ {
866
+ "epoch": 5.17,
867
+ "learning_rate": 1.699641723892967e-05,
868
+ "loss": 0.0012,
869
+ "step": 65500
870
+ },
871
+ {
872
+ "epoch": 5.21,
873
+ "learning_rate": 1.685753492777646e-05,
874
+ "loss": 0.0012,
875
+ "step": 66000
876
+ },
877
+ {
878
+ "epoch": 5.25,
879
+ "learning_rate": 1.6718652616623253e-05,
880
+ "loss": 0.0012,
881
+ "step": 66500
882
+ },
883
+ {
884
+ "epoch": 5.29,
885
+ "learning_rate": 1.6579770305470043e-05,
886
+ "loss": 0.0012,
887
+ "step": 67000
888
+ },
889
+ {
890
+ "epoch": 5.33,
891
+ "learning_rate": 1.6440887994316837e-05,
892
+ "loss": 0.0012,
893
+ "step": 67500
894
+ },
895
+ {
896
+ "epoch": 5.37,
897
+ "learning_rate": 1.6302005683163627e-05,
898
+ "loss": 0.0012,
899
+ "step": 68000
900
+ },
901
+ {
902
+ "epoch": 5.41,
903
+ "learning_rate": 1.616312337201042e-05,
904
+ "loss": 0.0012,
905
+ "step": 68500
906
+ },
907
+ {
908
+ "epoch": 5.45,
909
+ "learning_rate": 1.602424106085721e-05,
910
+ "loss": 0.0012,
911
+ "step": 69000
912
+ },
913
+ {
914
+ "epoch": 5.49,
915
+ "learning_rate": 1.5885358749704e-05,
916
+ "loss": 0.0012,
917
+ "step": 69500
918
+ },
919
+ {
920
+ "epoch": 5.53,
921
+ "learning_rate": 1.5746476438550794e-05,
922
+ "loss": 0.0011,
923
+ "step": 70000
924
+ },
925
+ {
926
+ "epoch": 5.56,
927
+ "learning_rate": 1.5607594127397584e-05,
928
+ "loss": 0.0012,
929
+ "step": 70500
930
+ },
931
+ {
932
+ "epoch": 5.6,
933
+ "learning_rate": 1.5468711816244377e-05,
934
+ "loss": 0.0012,
935
+ "step": 71000
936
+ },
937
+ {
938
+ "epoch": 5.64,
939
+ "learning_rate": 1.5329829505091167e-05,
940
+ "loss": 0.0012,
941
+ "step": 71500
942
+ },
943
+ {
944
+ "epoch": 5.68,
945
+ "learning_rate": 1.5190947193937959e-05,
946
+ "loss": 0.0012,
947
+ "step": 72000
948
+ },
949
+ {
950
+ "epoch": 5.72,
951
+ "learning_rate": 1.505206488278475e-05,
952
+ "loss": 0.0012,
953
+ "step": 72500
954
+ },
955
+ {
956
+ "epoch": 5.76,
957
+ "learning_rate": 1.4913182571631542e-05,
958
+ "loss": 0.0012,
959
+ "step": 73000
960
+ },
961
+ {
962
+ "epoch": 5.8,
963
+ "learning_rate": 1.4774300260478334e-05,
964
+ "loss": 0.0012,
965
+ "step": 73500
966
+ },
967
+ {
968
+ "epoch": 5.84,
969
+ "learning_rate": 1.4635417949325124e-05,
970
+ "loss": 0.0012,
971
+ "step": 74000
972
+ },
973
+ {
974
+ "epoch": 5.88,
975
+ "learning_rate": 1.4496535638171915e-05,
976
+ "loss": 0.0012,
977
+ "step": 74500
978
+ },
979
+ {
980
+ "epoch": 5.92,
981
+ "learning_rate": 1.4357653327018707e-05,
982
+ "loss": 0.0012,
983
+ "step": 75000
984
+ },
985
+ {
986
+ "epoch": 5.96,
987
+ "learning_rate": 1.4218771015865499e-05,
988
+ "loss": 0.0011,
989
+ "step": 75500
990
+ },
991
+ {
992
+ "epoch": 6.0,
993
+ "learning_rate": 1.407988870471229e-05,
994
+ "loss": 0.0012,
995
+ "step": 76000
996
+ },
997
+ {
998
+ "epoch": 6.0,
999
+ "eval_accuracy": 0.7229326079772225,
1000
+ "eval_f1": 0.8492761531099651,
1001
+ "eval_f1_macro": 0.3068715201994391,
1002
+ "eval_f1_weighted": 0.8317541964664328,
1003
+ "eval_loss": 0.0016757699195295572,
1004
+ "eval_p": 0.8489857055039438,
1005
+ "eval_r": 0.8495667995148155,
1006
+ "eval_roc_auc": 0.9246567913434838,
1007
+ "eval_runtime": 151.532,
1008
+ "eval_samples_per_second": 519.191,
1009
+ "eval_steps_per_second": 32.455,
1010
+ "step": 76014
1011
+ },
1012
+ {
1013
+ "epoch": 6.04,
1014
+ "learning_rate": 1.3941006393559082e-05,
1015
+ "loss": 0.001,
1016
+ "step": 76500
1017
+ },
1018
+ {
1019
+ "epoch": 6.08,
1020
+ "learning_rate": 1.3802124082405872e-05,
1021
+ "loss": 0.001,
1022
+ "step": 77000
1023
+ },
1024
+ {
1025
+ "epoch": 6.12,
1026
+ "learning_rate": 1.3663241771252664e-05,
1027
+ "loss": 0.001,
1028
+ "step": 77500
1029
+ },
1030
+ {
1031
+ "epoch": 6.16,
1032
+ "learning_rate": 1.3524359460099456e-05,
1033
+ "loss": 0.001,
1034
+ "step": 78000
1035
+ },
1036
+ {
1037
+ "epoch": 6.2,
1038
+ "learning_rate": 1.3385477148946247e-05,
1039
+ "loss": 0.0011,
1040
+ "step": 78500
1041
+ },
1042
+ {
1043
+ "epoch": 6.24,
1044
+ "learning_rate": 1.3246594837793039e-05,
1045
+ "loss": 0.0011,
1046
+ "step": 79000
1047
+ },
1048
+ {
1049
+ "epoch": 6.28,
1050
+ "learning_rate": 1.3107712526639829e-05,
1051
+ "loss": 0.0011,
1052
+ "step": 79500
1053
+ },
1054
+ {
1055
+ "epoch": 6.31,
1056
+ "learning_rate": 1.296883021548662e-05,
1057
+ "loss": 0.001,
1058
+ "step": 80000
1059
+ },
1060
+ {
1061
+ "epoch": 6.35,
1062
+ "learning_rate": 1.2829947904333412e-05,
1063
+ "loss": 0.0011,
1064
+ "step": 80500
1065
+ },
1066
+ {
1067
+ "epoch": 6.39,
1068
+ "learning_rate": 1.2691065593180204e-05,
1069
+ "loss": 0.001,
1070
+ "step": 81000
1071
+ },
1072
+ {
1073
+ "epoch": 6.43,
1074
+ "learning_rate": 1.2552183282026996e-05,
1075
+ "loss": 0.001,
1076
+ "step": 81500
1077
+ },
1078
+ {
1079
+ "epoch": 6.47,
1080
+ "learning_rate": 1.2413300970873786e-05,
1081
+ "loss": 0.0011,
1082
+ "step": 82000
1083
+ },
1084
+ {
1085
+ "epoch": 6.51,
1086
+ "learning_rate": 1.2274418659720577e-05,
1087
+ "loss": 0.001,
1088
+ "step": 82500
1089
+ },
1090
+ {
1091
+ "epoch": 6.55,
1092
+ "learning_rate": 1.213553634856737e-05,
1093
+ "loss": 0.0011,
1094
+ "step": 83000
1095
+ },
1096
+ {
1097
+ "epoch": 6.59,
1098
+ "learning_rate": 1.1996654037414161e-05,
1099
+ "loss": 0.001,
1100
+ "step": 83500
1101
+ },
1102
+ {
1103
+ "epoch": 6.63,
1104
+ "learning_rate": 1.1857771726260953e-05,
1105
+ "loss": 0.001,
1106
+ "step": 84000
1107
+ },
1108
+ {
1109
+ "epoch": 6.67,
1110
+ "learning_rate": 1.1718889415107744e-05,
1111
+ "loss": 0.001,
1112
+ "step": 84500
1113
+ },
1114
+ {
1115
+ "epoch": 6.71,
1116
+ "learning_rate": 1.1580007103954534e-05,
1117
+ "loss": 0.0011,
1118
+ "step": 85000
1119
+ },
1120
+ {
1121
+ "epoch": 6.75,
1122
+ "learning_rate": 1.1441124792801326e-05,
1123
+ "loss": 0.0011,
1124
+ "step": 85500
1125
+ },
1126
+ {
1127
+ "epoch": 6.79,
1128
+ "learning_rate": 1.1302242481648118e-05,
1129
+ "loss": 0.001,
1130
+ "step": 86000
1131
+ },
1132
+ {
1133
+ "epoch": 6.83,
1134
+ "learning_rate": 1.116336017049491e-05,
1135
+ "loss": 0.001,
1136
+ "step": 86500
1137
+ },
1138
+ {
1139
+ "epoch": 6.87,
1140
+ "learning_rate": 1.1024477859341701e-05,
1141
+ "loss": 0.0011,
1142
+ "step": 87000
1143
+ },
1144
+ {
1145
+ "epoch": 6.91,
1146
+ "learning_rate": 1.0885595548188491e-05,
1147
+ "loss": 0.001,
1148
+ "step": 87500
1149
+ },
1150
+ {
1151
+ "epoch": 6.95,
1152
+ "learning_rate": 1.0746713237035283e-05,
1153
+ "loss": 0.0011,
1154
+ "step": 88000
1155
+ },
1156
+ {
1157
+ "epoch": 6.99,
1158
+ "learning_rate": 1.0607830925882074e-05,
1159
+ "loss": 0.001,
1160
+ "step": 88500
1161
+ },
1162
+ {
1163
+ "epoch": 7.0,
1164
+ "eval_accuracy": 0.7276609807560313,
1165
+ "eval_f1": 0.851625034501794,
1166
+ "eval_f1_macro": 0.33216946866780483,
1167
+ "eval_f1_weighted": 0.8360047793004518,
1168
+ "eval_loss": 0.0016766807530075312,
1169
+ "eval_p": 0.8478514752859547,
1170
+ "eval_r": 0.8554323340842142,
1171
+ "eval_roc_auc": 0.9275875551926686,
1172
+ "eval_runtime": 149.9874,
1173
+ "eval_samples_per_second": 524.538,
1174
+ "eval_steps_per_second": 32.789,
1175
+ "step": 88683
1176
+ },
1177
+ {
1178
+ "epoch": 7.03,
1179
+ "learning_rate": 1.0468948614728866e-05,
1180
+ "loss": 0.001,
1181
+ "step": 89000
1182
+ },
1183
+ {
1184
+ "epoch": 7.06,
1185
+ "learning_rate": 1.0330066303575658e-05,
1186
+ "loss": 0.0009,
1187
+ "step": 89500
1188
+ },
1189
+ {
1190
+ "epoch": 7.1,
1191
+ "learning_rate": 1.019118399242245e-05,
1192
+ "loss": 0.0009,
1193
+ "step": 90000
1194
+ },
1195
+ {
1196
+ "epoch": 7.14,
1197
+ "learning_rate": 1.005230168126924e-05,
1198
+ "loss": 0.0009,
1199
+ "step": 90500
1200
+ },
1201
+ {
1202
+ "epoch": 7.18,
1203
+ "learning_rate": 9.913419370116031e-06,
1204
+ "loss": 0.0009,
1205
+ "step": 91000
1206
+ },
1207
+ {
1208
+ "epoch": 7.22,
1209
+ "learning_rate": 9.774537058962823e-06,
1210
+ "loss": 0.0009,
1211
+ "step": 91500
1212
+ },
1213
+ {
1214
+ "epoch": 7.26,
1215
+ "learning_rate": 9.635654747809615e-06,
1216
+ "loss": 0.0009,
1217
+ "step": 92000
1218
+ },
1219
+ {
1220
+ "epoch": 7.3,
1221
+ "learning_rate": 9.496772436656406e-06,
1222
+ "loss": 0.0009,
1223
+ "step": 92500
1224
+ },
1225
+ {
1226
+ "epoch": 7.34,
1227
+ "learning_rate": 9.357890125503196e-06,
1228
+ "loss": 0.0009,
1229
+ "step": 93000
1230
+ },
1231
+ {
1232
+ "epoch": 7.38,
1233
+ "learning_rate": 9.219007814349988e-06,
1234
+ "loss": 0.0009,
1235
+ "step": 93500
1236
+ },
1237
+ {
1238
+ "epoch": 7.42,
1239
+ "learning_rate": 9.08012550319678e-06,
1240
+ "loss": 0.0009,
1241
+ "step": 94000
1242
+ },
1243
+ {
1244
+ "epoch": 7.46,
1245
+ "learning_rate": 8.941243192043571e-06,
1246
+ "loss": 0.0009,
1247
+ "step": 94500
1248
+ },
1249
+ {
1250
+ "epoch": 7.5,
1251
+ "learning_rate": 8.802360880890363e-06,
1252
+ "loss": 0.0009,
1253
+ "step": 95000
1254
+ },
1255
+ {
1256
+ "epoch": 7.54,
1257
+ "learning_rate": 8.663478569737153e-06,
1258
+ "loss": 0.0009,
1259
+ "step": 95500
1260
+ },
1261
+ {
1262
+ "epoch": 7.58,
1263
+ "learning_rate": 8.524596258583945e-06,
1264
+ "loss": 0.0009,
1265
+ "step": 96000
1266
+ },
1267
+ {
1268
+ "epoch": 7.62,
1269
+ "learning_rate": 8.385713947430736e-06,
1270
+ "loss": 0.0009,
1271
+ "step": 96500
1272
+ },
1273
+ {
1274
+ "epoch": 7.66,
1275
+ "learning_rate": 8.246831636277528e-06,
1276
+ "loss": 0.0009,
1277
+ "step": 97000
1278
+ },
1279
+ {
1280
+ "epoch": 7.7,
1281
+ "learning_rate": 8.107949325124318e-06,
1282
+ "loss": 0.0009,
1283
+ "step": 97500
1284
+ },
1285
+ {
1286
+ "epoch": 7.74,
1287
+ "learning_rate": 7.96906701397111e-06,
1288
+ "loss": 0.0009,
1289
+ "step": 98000
1290
+ },
1291
+ {
1292
+ "epoch": 7.77,
1293
+ "learning_rate": 7.830184702817902e-06,
1294
+ "loss": 0.0009,
1295
+ "step": 98500
1296
+ },
1297
+ {
1298
+ "epoch": 7.81,
1299
+ "learning_rate": 7.691302391664693e-06,
1300
+ "loss": 0.001,
1301
+ "step": 99000
1302
+ },
1303
+ {
1304
+ "epoch": 7.85,
1305
+ "learning_rate": 7.552420080511485e-06,
1306
+ "loss": 0.001,
1307
+ "step": 99500
1308
+ },
1309
+ {
1310
+ "epoch": 7.89,
1311
+ "learning_rate": 7.413537769358277e-06,
1312
+ "loss": 0.0009,
1313
+ "step": 100000
1314
+ },
1315
+ {
1316
+ "epoch": 7.93,
1317
+ "learning_rate": 7.2746554582050675e-06,
1318
+ "loss": 0.001,
1319
+ "step": 100500
1320
+ },
1321
+ {
1322
+ "epoch": 7.97,
1323
+ "learning_rate": 7.135773147051859e-06,
1324
+ "loss": 0.0009,
1325
+ "step": 101000
1326
+ },
1327
+ {
1328
+ "epoch": 8.0,
1329
+ "eval_accuracy": 0.7294913186058927,
1330
+ "eval_f1": 0.8529003679860734,
1331
+ "eval_f1_macro": 0.34351140192299934,
1332
+ "eval_f1_weighted": 0.8387988374835376,
1333
+ "eval_loss": 0.001688135787844658,
1334
+ "eval_p": 0.8483892536904006,
1335
+ "eval_r": 0.8574597123548778,
1336
+ "eval_roc_auc": 0.928601476610379,
1337
+ "eval_runtime": 152.9938,
1338
+ "eval_samples_per_second": 514.23,
1339
+ "eval_steps_per_second": 32.145,
1340
+ "step": 101352
1341
+ },
1342
+ {
1343
+ "epoch": 8.01,
1344
+ "learning_rate": 6.99689083589865e-06,
1345
+ "loss": 0.0009,
1346
+ "step": 101500
1347
+ },
1348
+ {
1349
+ "epoch": 8.05,
1350
+ "learning_rate": 6.858008524745442e-06,
1351
+ "loss": 0.0008,
1352
+ "step": 102000
1353
+ },
1354
+ {
1355
+ "epoch": 8.09,
1356
+ "learning_rate": 6.7191262135922334e-06,
1357
+ "loss": 0.0008,
1358
+ "step": 102500
1359
+ },
1360
+ {
1361
+ "epoch": 8.13,
1362
+ "learning_rate": 6.580243902439024e-06,
1363
+ "loss": 0.0008,
1364
+ "step": 103000
1365
+ },
1366
+ {
1367
+ "epoch": 8.17,
1368
+ "learning_rate": 6.441361591285816e-06,
1369
+ "loss": 0.0008,
1370
+ "step": 103500
1371
+ },
1372
+ {
1373
+ "epoch": 8.21,
1374
+ "learning_rate": 6.302479280132608e-06,
1375
+ "loss": 0.0009,
1376
+ "step": 104000
1377
+ },
1378
+ {
1379
+ "epoch": 8.25,
1380
+ "learning_rate": 6.1635969689793985e-06,
1381
+ "loss": 0.0008,
1382
+ "step": 104500
1383
+ },
1384
+ {
1385
+ "epoch": 8.29,
1386
+ "learning_rate": 6.02471465782619e-06,
1387
+ "loss": 0.0009,
1388
+ "step": 105000
1389
+ },
1390
+ {
1391
+ "epoch": 8.33,
1392
+ "learning_rate": 5.885832346672981e-06,
1393
+ "loss": 0.0008,
1394
+ "step": 105500
1395
+ },
1396
+ {
1397
+ "epoch": 8.37,
1398
+ "learning_rate": 5.746950035519773e-06,
1399
+ "loss": 0.0008,
1400
+ "step": 106000
1401
+ },
1402
+ {
1403
+ "epoch": 8.41,
1404
+ "learning_rate": 5.6080677243665645e-06,
1405
+ "loss": 0.0008,
1406
+ "step": 106500
1407
+ },
1408
+ {
1409
+ "epoch": 8.45,
1410
+ "learning_rate": 5.469185413213355e-06,
1411
+ "loss": 0.0008,
1412
+ "step": 107000
1413
+ },
1414
+ {
1415
+ "epoch": 8.49,
1416
+ "learning_rate": 5.330303102060147e-06,
1417
+ "loss": 0.0008,
1418
+ "step": 107500
1419
+ },
1420
+ {
1421
+ "epoch": 8.52,
1422
+ "learning_rate": 5.191420790906939e-06,
1423
+ "loss": 0.0009,
1424
+ "step": 108000
1425
+ },
1426
+ {
1427
+ "epoch": 8.56,
1428
+ "learning_rate": 5.0525384797537296e-06,
1429
+ "loss": 0.0008,
1430
+ "step": 108500
1431
+ },
1432
+ {
1433
+ "epoch": 8.6,
1434
+ "learning_rate": 4.913656168600521e-06,
1435
+ "loss": 0.0009,
1436
+ "step": 109000
1437
+ },
1438
+ {
1439
+ "epoch": 8.64,
1440
+ "learning_rate": 4.774773857447313e-06,
1441
+ "loss": 0.0008,
1442
+ "step": 109500
1443
+ },
1444
+ {
1445
+ "epoch": 8.68,
1446
+ "learning_rate": 4.635891546294104e-06,
1447
+ "loss": 0.0008,
1448
+ "step": 110000
1449
+ },
1450
+ {
1451
+ "epoch": 8.72,
1452
+ "learning_rate": 4.4970092351408955e-06,
1453
+ "loss": 0.0009,
1454
+ "step": 110500
1455
+ },
1456
+ {
1457
+ "epoch": 8.76,
1458
+ "learning_rate": 4.358126923987686e-06,
1459
+ "loss": 0.0008,
1460
+ "step": 111000
1461
+ },
1462
+ {
1463
+ "epoch": 8.8,
1464
+ "learning_rate": 4.219244612834478e-06,
1465
+ "loss": 0.0008,
1466
+ "step": 111500
1467
+ },
1468
+ {
1469
+ "epoch": 8.84,
1470
+ "learning_rate": 4.080362301681269e-06,
1471
+ "loss": 0.0008,
1472
+ "step": 112000
1473
+ },
1474
+ {
1475
+ "epoch": 8.88,
1476
+ "learning_rate": 3.941479990528061e-06,
1477
+ "loss": 0.0009,
1478
+ "step": 112500
1479
+ },
1480
+ {
1481
+ "epoch": 8.92,
1482
+ "learning_rate": 3.8025976793748523e-06,
1483
+ "loss": 0.0008,
1484
+ "step": 113000
1485
+ },
1486
+ {
1487
+ "epoch": 8.96,
1488
+ "learning_rate": 3.6637153682216436e-06,
1489
+ "loss": 0.0008,
1490
+ "step": 113500
1491
+ },
1492
+ {
1493
+ "epoch": 9.0,
1494
+ "learning_rate": 3.524833057068435e-06,
1495
+ "loss": 0.0008,
1496
+ "step": 114000
1497
+ },
1498
+ {
1499
+ "epoch": 9.0,
1500
+ "eval_accuracy": 0.7333426544983095,
1501
+ "eval_f1": 0.8538806684223458,
1502
+ "eval_f1_macro": 0.35458058741266574,
1503
+ "eval_f1_weighted": 0.8401736902228668,
1504
+ "eval_loss": 0.0016993152676150203,
1505
+ "eval_p": 0.8495998764892057,
1506
+ "eval_r": 0.8582048171893952,
1507
+ "eval_roc_auc": 0.9289751251101112,
1508
+ "eval_runtime": 150.295,
1509
+ "eval_samples_per_second": 523.464,
1510
+ "eval_steps_per_second": 32.722,
1511
+ "step": 114021
1512
+ }
1513
+ ],
1514
+ "max_steps": 126690,
1515
+ "num_train_epochs": 10,
1516
+ "total_flos": 7.245026294480845e+16,
1517
+ "trial_name": null,
1518
+ "trial_params": null
1519
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c93473c0679568cf568885f24db7e785c048da7a9bf0fba7588d39ac5f510d81
3
+ size 3515
vocab.txt ADDED
The diff for this file is too large to render. See raw diff