Training in progress, step 3000
Browse files- model-00001-of-00004.safetensors +1 -1
- model-00002-of-00004.safetensors +1 -1
- model-00003-of-00004.safetensors +1 -1
- model-00004-of-00004.safetensors +1 -1
- trainer_log.jsonl +44 -251
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4968243304
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eac7d4684539d4de7f0ba5e3718aea87d753d7bafc12ebbf20744247582eb595
|
3 |
size 4968243304
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4991495816
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83a2c2a4249d28ff583187476e71f5d834b7ab30713f394adfdb8bbcec75a143
|
3 |
size 4991495816
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751040
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6c0dec75ba811ec9363d24a2bb779b5cd58539443a0025bdf4c58f21ea8ca96
|
3 |
size 4932751040
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1691924384
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f5136383581c715398ae05a1473c435634a9141735c2b6b69f98027fe05e850
|
3 |
size 1691924384
|
trainer_log.jsonl
CHANGED
@@ -1,251 +1,44 @@
|
|
1 |
-
{"current_steps":
|
2 |
-
{"current_steps":
|
3 |
-
{"current_steps":
|
4 |
-
{"current_steps":
|
5 |
-
{"current_steps":
|
6 |
-
{"current_steps":
|
7 |
-
{"current_steps":
|
8 |
-
{"current_steps":
|
9 |
-
{"current_steps":
|
10 |
-
{"current_steps":
|
11 |
-
{"current_steps":
|
12 |
-
{"current_steps":
|
13 |
-
{"current_steps":
|
14 |
-
{"current_steps":
|
15 |
-
{"current_steps":
|
16 |
-
{"current_steps":
|
17 |
-
{"current_steps":
|
18 |
-
{"current_steps":
|
19 |
-
{"current_steps":
|
20 |
-
{"current_steps":
|
21 |
-
{"current_steps":
|
22 |
-
{"current_steps":
|
23 |
-
{"current_steps":
|
24 |
-
{"current_steps":
|
25 |
-
{"current_steps":
|
26 |
-
{"current_steps":
|
27 |
-
{"current_steps":
|
28 |
-
{"current_steps":
|
29 |
-
{"current_steps":
|
30 |
-
{"current_steps":
|
31 |
-
{"current_steps":
|
32 |
-
{"current_steps":
|
33 |
-
{"current_steps":
|
34 |
-
{"current_steps":
|
35 |
-
{"current_steps":
|
36 |
-
{"current_steps":
|
37 |
-
{"current_steps":
|
38 |
-
{"current_steps":
|
39 |
-
{"current_steps":
|
40 |
-
{"current_steps":
|
41 |
-
{"current_steps":
|
42 |
-
{"current_steps":
|
43 |
-
{"current_steps":
|
44 |
-
{"current_steps":
|
45 |
-
{"current_steps": 450, "total_steps": 7042, "loss": 0.4571, "lr": 1.2765957446808513e-05, "epoch": 0.12780460096563476, "percentage": 6.39, "elapsed_time": "1:20:51", "remaining_time": "19:44:26"}
|
46 |
-
{"current_steps": 460, "total_steps": 7042, "loss": 0.4549, "lr": 1.3049645390070925e-05, "epoch": 0.13064470320931554, "percentage": 6.53, "elapsed_time": "1:22:37", "remaining_time": "19:42:15"}
|
47 |
-
{"current_steps": 470, "total_steps": 7042, "loss": 0.4579, "lr": 1.3333333333333333e-05, "epoch": 0.13348480545299632, "percentage": 6.67, "elapsed_time": "1:24:27", "remaining_time": "19:41:03"}
|
48 |
-
{"current_steps": 480, "total_steps": 7042, "loss": 0.4492, "lr": 1.3617021276595745e-05, "epoch": 0.13632490769667707, "percentage": 6.82, "elapsed_time": "1:26:18", "remaining_time": "19:39:49"}
|
49 |
-
{"current_steps": 490, "total_steps": 7042, "loss": 0.4657, "lr": 1.3900709219858157e-05, "epoch": 0.13916500994035785, "percentage": 6.96, "elapsed_time": "1:28:06", "remaining_time": "19:38:06"}
|
50 |
-
{"current_steps": 500, "total_steps": 7042, "loss": 0.4507, "lr": 1.418439716312057e-05, "epoch": 0.14200511218403863, "percentage": 7.1, "elapsed_time": "1:29:51", "remaining_time": "19:35:43"}
|
51 |
-
{"current_steps": 510, "total_steps": 7042, "loss": 0.4612, "lr": 1.4468085106382981e-05, "epoch": 0.1448452144277194, "percentage": 7.24, "elapsed_time": "1:32:58", "remaining_time": "19:50:53"}
|
52 |
-
{"current_steps": 520, "total_steps": 7042, "loss": 0.4562, "lr": 1.475177304964539e-05, "epoch": 0.14768531667140017, "percentage": 7.38, "elapsed_time": "1:34:56", "remaining_time": "19:50:44"}
|
53 |
-
{"current_steps": 530, "total_steps": 7042, "loss": 0.4454, "lr": 1.5035460992907802e-05, "epoch": 0.15052541891508095, "percentage": 7.53, "elapsed_time": "1:36:45", "remaining_time": "19:48:49"}
|
54 |
-
{"current_steps": 540, "total_steps": 7042, "loss": 0.4603, "lr": 1.5319148936170214e-05, "epoch": 0.1533655211587617, "percentage": 7.67, "elapsed_time": "1:38:35", "remaining_time": "19:47:06"}
|
55 |
-
{"current_steps": 550, "total_steps": 7042, "loss": 0.45, "lr": 1.5602836879432626e-05, "epoch": 0.15620562340244248, "percentage": 7.81, "elapsed_time": "1:40:25", "remaining_time": "19:45:26"}
|
56 |
-
{"current_steps": 560, "total_steps": 7042, "loss": 0.457, "lr": 1.5886524822695038e-05, "epoch": 0.15904572564612326, "percentage": 7.95, "elapsed_time": "1:42:14", "remaining_time": "19:43:25"}
|
57 |
-
{"current_steps": 570, "total_steps": 7042, "loss": 0.439, "lr": 1.6170212765957446e-05, "epoch": 0.16188582788980405, "percentage": 8.09, "elapsed_time": "1:44:00", "remaining_time": "19:40:59"}
|
58 |
-
{"current_steps": 580, "total_steps": 7042, "loss": 0.4554, "lr": 1.645390070921986e-05, "epoch": 0.1647259301334848, "percentage": 8.24, "elapsed_time": "1:45:50", "remaining_time": "19:39:09"}
|
59 |
-
{"current_steps": 590, "total_steps": 7042, "loss": 0.4473, "lr": 1.673758865248227e-05, "epoch": 0.16756603237716558, "percentage": 8.38, "elapsed_time": "1:47:39", "remaining_time": "19:37:22"}
|
60 |
-
{"current_steps": 600, "total_steps": 7042, "loss": 0.4502, "lr": 1.7021276595744682e-05, "epoch": 0.17040613462084636, "percentage": 8.52, "elapsed_time": "1:49:29", "remaining_time": "19:35:32"}
|
61 |
-
{"current_steps": 610, "total_steps": 7042, "loss": 0.4437, "lr": 1.7304964539007094e-05, "epoch": 0.17324623686452711, "percentage": 8.66, "elapsed_time": "1:51:17", "remaining_time": "19:33:28"}
|
62 |
-
{"current_steps": 620, "total_steps": 7042, "loss": 0.4475, "lr": 1.7588652482269506e-05, "epoch": 0.1760863391082079, "percentage": 8.8, "elapsed_time": "1:53:04", "remaining_time": "19:31:12"}
|
63 |
-
{"current_steps": 630, "total_steps": 7042, "loss": 0.4324, "lr": 1.7872340425531915e-05, "epoch": 0.17892644135188868, "percentage": 8.95, "elapsed_time": "1:54:53", "remaining_time": "19:29:21"}
|
64 |
-
{"current_steps": 640, "total_steps": 7042, "loss": 0.4463, "lr": 1.8156028368794327e-05, "epoch": 0.18176654359556943, "percentage": 9.09, "elapsed_time": "1:56:43", "remaining_time": "19:27:32"}
|
65 |
-
{"current_steps": 650, "total_steps": 7042, "loss": 0.4406, "lr": 1.843971631205674e-05, "epoch": 0.1846066458392502, "percentage": 9.23, "elapsed_time": "1:58:29", "remaining_time": "19:25:09"}
|
66 |
-
{"current_steps": 660, "total_steps": 7042, "loss": 0.4453, "lr": 1.872340425531915e-05, "epoch": 0.187446748082931, "percentage": 9.37, "elapsed_time": "2:00:19", "remaining_time": "19:23:28"}
|
67 |
-
{"current_steps": 670, "total_steps": 7042, "loss": 0.4324, "lr": 1.9007092198581563e-05, "epoch": 0.19028685032661175, "percentage": 9.51, "elapsed_time": "2:02:06", "remaining_time": "19:21:17"}
|
68 |
-
{"current_steps": 680, "total_steps": 7042, "loss": 0.4373, "lr": 1.929078014184397e-05, "epoch": 0.19312695257029253, "percentage": 9.66, "elapsed_time": "2:03:51", "remaining_time": "19:18:46"}
|
69 |
-
{"current_steps": 690, "total_steps": 7042, "loss": 0.434, "lr": 1.9574468085106384e-05, "epoch": 0.1959670548139733, "percentage": 9.8, "elapsed_time": "2:05:40", "remaining_time": "19:16:57"}
|
70 |
-
{"current_steps": 700, "total_steps": 7042, "loss": 0.4473, "lr": 1.9858156028368796e-05, "epoch": 0.1988071570576541, "percentage": 9.94, "elapsed_time": "2:07:27", "remaining_time": "19:14:49"}
|
71 |
-
{"current_steps": 710, "total_steps": 7042, "loss": 0.4317, "lr": 1.999996927852086e-05, "epoch": 0.20164725930133484, "percentage": 10.08, "elapsed_time": "2:09:18", "remaining_time": "19:13:09"}
|
72 |
-
{"current_steps": 720, "total_steps": 7042, "loss": 0.4447, "lr": 1.9999723507820288e-05, "epoch": 0.20448736154501562, "percentage": 10.22, "elapsed_time": "2:11:06", "remaining_time": "19:11:08"}
|
73 |
-
{"current_steps": 730, "total_steps": 7042, "loss": 0.4423, "lr": 1.999923197245949e-05, "epoch": 0.2073274637886964, "percentage": 10.37, "elapsed_time": "2:12:54", "remaining_time": "19:09:09"}
|
74 |
-
{"current_steps": 740, "total_steps": 7042, "loss": 0.4236, "lr": 1.9998494684519e-05, "epoch": 0.21016756603237716, "percentage": 10.51, "elapsed_time": "2:14:45", "remaining_time": "19:07:35"}
|
75 |
-
{"current_steps": 750, "total_steps": 7042, "loss": 0.4329, "lr": 1.9997511662119248e-05, "epoch": 0.21300766827605794, "percentage": 10.65, "elapsed_time": "2:16:32", "remaining_time": "19:05:27"}
|
76 |
-
{"current_steps": 760, "total_steps": 7042, "loss": 0.4345, "lr": 1.999628292942012e-05, "epoch": 0.21584777051973872, "percentage": 10.79, "elapsed_time": "2:18:21", "remaining_time": "19:03:39"}
|
77 |
-
{"current_steps": 770, "total_steps": 7042, "loss": 0.4358, "lr": 1.9994808516620362e-05, "epoch": 0.21868787276341947, "percentage": 10.93, "elapsed_time": "2:20:07", "remaining_time": "19:01:24"}
|
78 |
-
{"current_steps": 780, "total_steps": 7042, "loss": 0.4482, "lr": 1.999308845995683e-05, "epoch": 0.22152797500710025, "percentage": 11.08, "elapsed_time": "2:21:56", "remaining_time": "18:59:31"}
|
79 |
-
{"current_steps": 790, "total_steps": 7042, "loss": 0.4352, "lr": 1.9991122801703606e-05, "epoch": 0.22436807725078103, "percentage": 11.22, "elapsed_time": "2:23:43", "remaining_time": "18:57:23"}
|
80 |
-
{"current_steps": 800, "total_steps": 7042, "loss": 0.4265, "lr": 1.998891159017096e-05, "epoch": 0.2272081794944618, "percentage": 11.36, "elapsed_time": "2:25:32", "remaining_time": "18:55:33"}
|
81 |
-
{"current_steps": 810, "total_steps": 7042, "loss": 0.4247, "lr": 1.9986454879704157e-05, "epoch": 0.23004828173814257, "percentage": 11.5, "elapsed_time": "2:27:20", "remaining_time": "18:53:39"}
|
82 |
-
{"current_steps": 820, "total_steps": 7042, "loss": 0.4394, "lr": 1.9983752730682132e-05, "epoch": 0.23288838398182335, "percentage": 11.64, "elapsed_time": "2:29:08", "remaining_time": "18:51:40"}
|
83 |
-
{"current_steps": 830, "total_steps": 7042, "loss": 0.4182, "lr": 1.9980805209515995e-05, "epoch": 0.23572848622550413, "percentage": 11.79, "elapsed_time": "2:30:59", "remaining_time": "18:50:01"}
|
84 |
-
{"current_steps": 840, "total_steps": 7042, "loss": 0.4288, "lr": 1.99776123886474e-05, "epoch": 0.23856858846918488, "percentage": 11.93, "elapsed_time": "2:32:47", "remaining_time": "18:48:05"}
|
85 |
-
{"current_steps": 850, "total_steps": 7042, "loss": 0.4343, "lr": 1.9974174346546767e-05, "epoch": 0.24140869071286566, "percentage": 12.07, "elapsed_time": "2:34:34", "remaining_time": "18:45:59"}
|
86 |
-
{"current_steps": 860, "total_steps": 7042, "loss": 0.4126, "lr": 1.9970491167711365e-05, "epoch": 0.24424879295654645, "percentage": 12.21, "elapsed_time": "2:36:25", "remaining_time": "18:44:25"}
|
87 |
-
{"current_steps": 870, "total_steps": 7042, "loss": 0.429, "lr": 1.996656294266321e-05, "epoch": 0.2470888952002272, "percentage": 12.35, "elapsed_time": "2:38:13", "remaining_time": "18:42:30"}
|
88 |
-
{"current_steps": 880, "total_steps": 7042, "loss": 0.4263, "lr": 1.9962389767946867e-05, "epoch": 0.24992899744390798, "percentage": 12.5, "elapsed_time": "2:40:01", "remaining_time": "18:40:35"}
|
89 |
-
{"current_steps": 890, "total_steps": 7042, "loss": 0.4261, "lr": 1.9957971746127052e-05, "epoch": 0.25276909968758876, "percentage": 12.64, "elapsed_time": "2:41:46", "remaining_time": "18:38:14"}
|
90 |
-
{"current_steps": 900, "total_steps": 7042, "loss": 0.4211, "lr": 1.9953308985786132e-05, "epoch": 0.2556092019312695, "percentage": 12.78, "elapsed_time": "2:43:34", "remaining_time": "18:36:19"}
|
91 |
-
{"current_steps": 910, "total_steps": 7042, "loss": 0.4383, "lr": 1.994840160152145e-05, "epoch": 0.2584493041749503, "percentage": 12.92, "elapsed_time": "2:45:20", "remaining_time": "18:34:05"}
|
92 |
-
{"current_steps": 920, "total_steps": 7042, "loss": 0.421, "lr": 1.99432497139425e-05, "epoch": 0.2612894064186311, "percentage": 13.06, "elapsed_time": "2:47:09", "remaining_time": "18:32:20"}
|
93 |
-
{"current_steps": 930, "total_steps": 7042, "loss": 0.417, "lr": 1.9937853449667975e-05, "epoch": 0.26412950866231183, "percentage": 13.21, "elapsed_time": "2:48:57", "remaining_time": "18:30:25"}
|
94 |
-
{"current_steps": 940, "total_steps": 7042, "loss": 0.4301, "lr": 1.9932212941322647e-05, "epoch": 0.26696961090599264, "percentage": 13.35, "elapsed_time": "2:50:47", "remaining_time": "18:28:43"}
|
95 |
-
{"current_steps": 950, "total_steps": 7042, "loss": 0.4311, "lr": 1.9926328327534108e-05, "epoch": 0.2698097131496734, "percentage": 13.49, "elapsed_time": "2:52:35", "remaining_time": "18:26:48"}
|
96 |
-
{"current_steps": 960, "total_steps": 7042, "loss": 0.4187, "lr": 1.992019975292937e-05, "epoch": 0.27264981539335414, "percentage": 13.63, "elapsed_time": "2:54:23", "remaining_time": "18:24:50"}
|
97 |
-
{"current_steps": 970, "total_steps": 7042, "loss": 0.4245, "lr": 1.9913827368131303e-05, "epoch": 0.27548991763703495, "percentage": 13.77, "elapsed_time": "2:56:11", "remaining_time": "18:22:53"}
|
98 |
-
{"current_steps": 980, "total_steps": 7042, "loss": 0.4335, "lr": 1.990721132975494e-05, "epoch": 0.2783300198807157, "percentage": 13.92, "elapsed_time": "2:57:59", "remaining_time": "18:20:57"}
|
99 |
-
{"current_steps": 990, "total_steps": 7042, "loss": 0.4241, "lr": 1.990035180040361e-05, "epoch": 0.28117012212439646, "percentage": 14.06, "elapsed_time": "2:59:47", "remaining_time": "18:19:02"}
|
100 |
-
{"current_steps": 1000, "total_steps": 7042, "loss": 0.4122, "lr": 1.989324894866497e-05, "epoch": 0.28401022436807727, "percentage": 14.2, "elapsed_time": "3:01:33", "remaining_time": "18:16:56"}
|
101 |
-
{"current_steps": 1010, "total_steps": 7042, "loss": 0.4299, "lr": 1.9885902949106842e-05, "epoch": 0.286850326611758, "percentage": 14.34, "elapsed_time": "3:04:29", "remaining_time": "18:21:51"}
|
102 |
-
{"current_steps": 1020, "total_steps": 7042, "loss": 0.4171, "lr": 1.9878313982272926e-05, "epoch": 0.2896904288554388, "percentage": 14.48, "elapsed_time": "3:06:18", "remaining_time": "18:19:56"}
|
103 |
-
{"current_steps": 1030, "total_steps": 7042, "loss": 0.4138, "lr": 1.9870482234678362e-05, "epoch": 0.2925305310991196, "percentage": 14.63, "elapsed_time": "3:08:08", "remaining_time": "18:18:09"}
|
104 |
-
{"current_steps": 1040, "total_steps": 7042, "loss": 0.4166, "lr": 1.986240789880515e-05, "epoch": 0.29537063334280034, "percentage": 14.77, "elapsed_time": "3:09:58", "remaining_time": "18:16:23"}
|
105 |
-
{"current_steps": 1050, "total_steps": 7042, "loss": 0.4168, "lr": 1.9854091173097423e-05, "epoch": 0.2982107355864811, "percentage": 14.91, "elapsed_time": "3:11:46", "remaining_time": "18:14:24"}
|
106 |
-
{"current_steps": 1060, "total_steps": 7042, "loss": 0.4127, "lr": 1.9845532261956556e-05, "epoch": 0.3010508378301619, "percentage": 15.05, "elapsed_time": "3:13:33", "remaining_time": "18:12:18"}
|
107 |
-
{"current_steps": 1070, "total_steps": 7042, "loss": 0.4252, "lr": 1.9836731375736152e-05, "epoch": 0.30389094007384265, "percentage": 15.19, "elapsed_time": "3:15:23", "remaining_time": "18:10:31"}
|
108 |
-
{"current_steps": 1080, "total_steps": 7042, "loss": 0.418, "lr": 1.982768873073688e-05, "epoch": 0.3067310423175234, "percentage": 15.34, "elapsed_time": "3:17:10", "remaining_time": "18:08:29"}
|
109 |
-
{"current_steps": 1090, "total_steps": 7042, "loss": 0.4139, "lr": 1.9818404549201134e-05, "epoch": 0.3095711445612042, "percentage": 15.48, "elapsed_time": "3:18:58", "remaining_time": "18:06:31"}
|
110 |
-
{"current_steps": 1100, "total_steps": 7042, "loss": 0.4105, "lr": 1.98088790593076e-05, "epoch": 0.31241124680488497, "percentage": 15.62, "elapsed_time": "3:20:45", "remaining_time": "18:04:27"}
|
111 |
-
{"current_steps": 1110, "total_steps": 7042, "loss": 0.42, "lr": 1.979911249516563e-05, "epoch": 0.3152513490485657, "percentage": 15.76, "elapsed_time": "3:22:32", "remaining_time": "18:02:24"}
|
112 |
-
{"current_steps": 1120, "total_steps": 7042, "loss": 0.4141, "lr": 1.9789105096809486e-05, "epoch": 0.31809145129224653, "percentage": 15.9, "elapsed_time": "3:24:21", "remaining_time": "18:00:32"}
|
113 |
-
{"current_steps": 1130, "total_steps": 7042, "loss": 0.4119, "lr": 1.977885711019246e-05, "epoch": 0.3209315535359273, "percentage": 16.05, "elapsed_time": "3:26:09", "remaining_time": "17:58:35"}
|
114 |
-
{"current_steps": 1140, "total_steps": 7042, "loss": 0.4172, "lr": 1.976836878718081e-05, "epoch": 0.3237716557796081, "percentage": 16.19, "elapsed_time": "3:27:57", "remaining_time": "17:56:38"}
|
115 |
-
{"current_steps": 1150, "total_steps": 7042, "loss": 0.4189, "lr": 1.975764038554758e-05, "epoch": 0.32661175802328885, "percentage": 16.33, "elapsed_time": "3:29:46", "remaining_time": "17:54:46"}
|
116 |
-
{"current_steps": 1160, "total_steps": 7042, "loss": 0.4225, "lr": 1.9746672168966253e-05, "epoch": 0.3294518602669696, "percentage": 16.47, "elapsed_time": "3:31:35", "remaining_time": "17:52:54"}
|
117 |
-
{"current_steps": 1170, "total_steps": 7042, "loss": 0.4248, "lr": 1.973546440700429e-05, "epoch": 0.3322919625106504, "percentage": 16.61, "elapsed_time": "3:33:22", "remaining_time": "17:50:52"}
|
118 |
-
{"current_steps": 1180, "total_steps": 7042, "loss": 0.4157, "lr": 1.9724017375116482e-05, "epoch": 0.33513206475433116, "percentage": 16.76, "elapsed_time": "3:35:11", "remaining_time": "17:49:01"}
|
119 |
-
{"current_steps": 1190, "total_steps": 7042, "loss": 0.4154, "lr": 1.97123313546382e-05, "epoch": 0.3379721669980119, "percentage": 16.9, "elapsed_time": "3:37:00", "remaining_time": "17:47:09"}
|
120 |
-
{"current_steps": 1200, "total_steps": 7042, "loss": 0.4087, "lr": 1.9700406632778476e-05, "epoch": 0.3408122692416927, "percentage": 17.04, "elapsed_time": "3:38:49", "remaining_time": "17:45:18"}
|
121 |
-
{"current_steps": 1210, "total_steps": 7042, "loss": 0.4284, "lr": 1.968824350261293e-05, "epoch": 0.3436523714853735, "percentage": 17.18, "elapsed_time": "3:40:38", "remaining_time": "17:43:29"}
|
122 |
-
{"current_steps": 1220, "total_steps": 7042, "loss": 0.416, "lr": 1.9675842263076582e-05, "epoch": 0.34649247372905423, "percentage": 17.32, "elapsed_time": "3:42:26", "remaining_time": "17:41:31"}
|
123 |
-
{"current_steps": 1230, "total_steps": 7042, "loss": 0.4066, "lr": 1.96632032189565e-05, "epoch": 0.34933257597273504, "percentage": 17.47, "elapsed_time": "3:44:13", "remaining_time": "17:39:29"}
|
124 |
-
{"current_steps": 1240, "total_steps": 7042, "loss": 0.4228, "lr": 1.9650326680884312e-05, "epoch": 0.3521726782164158, "percentage": 17.61, "elapsed_time": "3:46:03", "remaining_time": "17:37:45"}
|
125 |
-
{"current_steps": 1250, "total_steps": 7042, "loss": 0.4133, "lr": 1.9637212965328574e-05, "epoch": 0.35501278046009654, "percentage": 17.75, "elapsed_time": "3:47:54", "remaining_time": "17:36:04"}
|
126 |
-
{"current_steps": 1260, "total_steps": 7042, "loss": 0.4022, "lr": 1.9623862394586978e-05, "epoch": 0.35785288270377735, "percentage": 17.89, "elapsed_time": "3:49:44", "remaining_time": "17:34:15"}
|
127 |
-
{"current_steps": 1270, "total_steps": 7042, "loss": 0.4126, "lr": 1.9610275296778443e-05, "epoch": 0.3606929849474581, "percentage": 18.03, "elapsed_time": "3:51:35", "remaining_time": "17:32:31"}
|
128 |
-
{"current_steps": 1280, "total_steps": 7042, "loss": 0.4192, "lr": 1.959645200583505e-05, "epoch": 0.36353308719113886, "percentage": 18.18, "elapsed_time": "3:53:21", "remaining_time": "17:30:29"}
|
129 |
-
{"current_steps": 1290, "total_steps": 7042, "loss": 0.408, "lr": 1.9582392861493835e-05, "epoch": 0.36637318943481967, "percentage": 18.32, "elapsed_time": "3:55:10", "remaining_time": "17:28:37"}
|
130 |
-
{"current_steps": 1300, "total_steps": 7042, "loss": 0.4184, "lr": 1.9568098209288436e-05, "epoch": 0.3692132916785004, "percentage": 18.46, "elapsed_time": "3:56:58", "remaining_time": "17:26:40"}
|
131 |
-
{"current_steps": 1310, "total_steps": 7042, "loss": 0.4104, "lr": 1.9553568400540594e-05, "epoch": 0.3720533939221812, "percentage": 18.6, "elapsed_time": "3:58:45", "remaining_time": "17:24:41"}
|
132 |
-
{"current_steps": 1320, "total_steps": 7042, "loss": 0.4061, "lr": 1.953880379235154e-05, "epoch": 0.374893496165862, "percentage": 18.74, "elapsed_time": "4:00:31", "remaining_time": "17:22:39"}
|
133 |
-
{"current_steps": 1330, "total_steps": 7042, "loss": 0.4091, "lr": 1.95238047475932e-05, "epoch": 0.37773359840954274, "percentage": 18.89, "elapsed_time": "4:02:19", "remaining_time": "17:20:41"}
|
134 |
-
{"current_steps": 1340, "total_steps": 7042, "loss": 0.4007, "lr": 1.950857163489927e-05, "epoch": 0.3805737006532235, "percentage": 19.03, "elapsed_time": "4:04:05", "remaining_time": "17:18:38"}
|
135 |
-
{"current_steps": 1350, "total_steps": 7042, "loss": 0.4073, "lr": 1.9493104828656187e-05, "epoch": 0.3834138028969043, "percentage": 19.17, "elapsed_time": "4:05:51", "remaining_time": "17:16:38"}
|
136 |
-
{"current_steps": 1360, "total_steps": 7042, "loss": 0.4054, "lr": 1.9477404708993904e-05, "epoch": 0.38625390514058505, "percentage": 19.31, "elapsed_time": "4:07:41", "remaining_time": "17:14:51"}
|
137 |
-
{"current_steps": 1370, "total_steps": 7042, "loss": 0.3906, "lr": 1.9461471661776536e-05, "epoch": 0.38909400738426586, "percentage": 19.45, "elapsed_time": "4:09:32", "remaining_time": "17:13:09"}
|
138 |
-
{"current_steps": 1380, "total_steps": 7042, "loss": 0.403, "lr": 1.944530607859291e-05, "epoch": 0.3919341096279466, "percentage": 19.6, "elapsed_time": "4:11:23", "remaining_time": "17:11:27"}
|
139 |
-
{"current_steps": 1390, "total_steps": 7042, "loss": 0.403, "lr": 1.9428908356746914e-05, "epoch": 0.39477421187162737, "percentage": 19.74, "elapsed_time": "4:13:11", "remaining_time": "17:09:31"}
|
140 |
-
{"current_steps": 1400, "total_steps": 7042, "loss": 0.404, "lr": 1.9412278899247748e-05, "epoch": 0.3976143141153082, "percentage": 19.88, "elapsed_time": "4:14:58", "remaining_time": "17:07:32"}
|
141 |
-
{"current_steps": 1410, "total_steps": 7042, "loss": 0.4076, "lr": 1.9395418114800005e-05, "epoch": 0.40045441635898893, "percentage": 20.02, "elapsed_time": "4:16:48", "remaining_time": "17:05:45"}
|
142 |
-
{"current_steps": 1420, "total_steps": 7042, "loss": 0.3932, "lr": 1.9378326417793646e-05, "epoch": 0.4032945186026697, "percentage": 20.16, "elapsed_time": "4:18:34", "remaining_time": "17:03:43"}
|
143 |
-
{"current_steps": 1430, "total_steps": 7042, "loss": 0.4122, "lr": 1.9361004228293788e-05, "epoch": 0.4061346208463505, "percentage": 20.31, "elapsed_time": "4:20:21", "remaining_time": "17:01:45"}
|
144 |
-
{"current_steps": 1440, "total_steps": 7042, "loss": 0.4025, "lr": 1.9343451972030407e-05, "epoch": 0.40897472309003124, "percentage": 20.45, "elapsed_time": "4:22:09", "remaining_time": "16:59:50"}
|
145 |
-
{"current_steps": 1450, "total_steps": 7042, "loss": 0.3931, "lr": 1.9325670080387863e-05, "epoch": 0.411814825333712, "percentage": 20.59, "elapsed_time": "4:23:57", "remaining_time": "16:57:56"}
|
146 |
-
{"current_steps": 1460, "total_steps": 7042, "loss": 0.4094, "lr": 1.9307658990394293e-05, "epoch": 0.4146549275773928, "percentage": 20.73, "elapsed_time": "4:25:43", "remaining_time": "16:55:56"}
|
147 |
-
{"current_steps": 1470, "total_steps": 7042, "loss": 0.404, "lr": 1.9289419144710874e-05, "epoch": 0.41749502982107356, "percentage": 20.87, "elapsed_time": "4:27:29", "remaining_time": "16:53:54"}
|
148 |
-
{"current_steps": 1480, "total_steps": 7042, "loss": 0.3982, "lr": 1.9270950991620955e-05, "epoch": 0.4203351320647543, "percentage": 21.02, "elapsed_time": "4:29:18", "remaining_time": "16:52:05"}
|
149 |
-
{"current_steps": 1490, "total_steps": 7042, "loss": 0.4128, "lr": 1.925225498501902e-05, "epoch": 0.4231752343084351, "percentage": 21.16, "elapsed_time": "4:31:06", "remaining_time": "16:50:10"}
|
150 |
-
{"current_steps": 1500, "total_steps": 7042, "loss": 0.3999, "lr": 1.9233331584399542e-05, "epoch": 0.4260153365521159, "percentage": 21.3, "elapsed_time": "4:32:54", "remaining_time": "16:48:17"}
|
151 |
-
{"current_steps": 1510, "total_steps": 7042, "loss": 0.4019, "lr": 1.9214181254845696e-05, "epoch": 0.42885543879579663, "percentage": 21.44, "elapsed_time": "4:35:48", "remaining_time": "16:50:28"}
|
152 |
-
{"current_steps": 1520, "total_steps": 7042, "loss": 0.3951, "lr": 1.9194804467017916e-05, "epoch": 0.43169554103947744, "percentage": 21.58, "elapsed_time": "4:37:38", "remaining_time": "16:48:38"}
|
153 |
-
{"current_steps": 1530, "total_steps": 7042, "loss": 0.3928, "lr": 1.917520169714234e-05, "epoch": 0.4345356432831582, "percentage": 21.73, "elapsed_time": "4:39:25", "remaining_time": "16:46:41"}
|
154 |
-
{"current_steps": 1540, "total_steps": 7042, "loss": 0.4027, "lr": 1.9155373426999096e-05, "epoch": 0.43737574552683894, "percentage": 21.87, "elapsed_time": "4:41:13", "remaining_time": "16:44:44"}
|
155 |
-
{"current_steps": 1550, "total_steps": 7042, "loss": 0.3993, "lr": 1.9135320143910465e-05, "epoch": 0.44021584777051975, "percentage": 22.01, "elapsed_time": "4:43:03", "remaining_time": "16:42:55"}
|
156 |
-
{"current_steps": 1560, "total_steps": 7042, "loss": 0.3906, "lr": 1.9115042340728904e-05, "epoch": 0.4430559500142005, "percentage": 22.15, "elapsed_time": "4:44:49", "remaining_time": "16:40:53"}
|
157 |
-
{"current_steps": 1570, "total_steps": 7042, "loss": 0.4004, "lr": 1.9094540515824933e-05, "epoch": 0.44589605225788126, "percentage": 22.29, "elapsed_time": "4:46:36", "remaining_time": "16:38:55"}
|
158 |
-
{"current_steps": 1580, "total_steps": 7042, "loss": 0.4003, "lr": 1.9073815173074887e-05, "epoch": 0.44873615450156207, "percentage": 22.44, "elapsed_time": "4:48:25", "remaining_time": "16:37:03"}
|
159 |
-
{"current_steps": 1590, "total_steps": 7042, "loss": 0.4169, "lr": 1.9052866821848536e-05, "epoch": 0.4515762567452428, "percentage": 22.58, "elapsed_time": "4:50:13", "remaining_time": "16:35:09"}
|
160 |
-
{"current_steps": 1600, "total_steps": 7042, "loss": 0.3976, "lr": 1.903169597699655e-05, "epoch": 0.4544163589889236, "percentage": 22.72, "elapsed_time": "4:52:00", "remaining_time": "16:33:12"}
|
161 |
-
{"current_steps": 1610, "total_steps": 7042, "loss": 0.406, "lr": 1.901030315883787e-05, "epoch": 0.4572564612326044, "percentage": 22.86, "elapsed_time": "4:53:53", "remaining_time": "16:31:33"}
|
162 |
-
{"current_steps": 1620, "total_steps": 7042, "loss": 0.3924, "lr": 1.89886888931469e-05, "epoch": 0.46009656347628514, "percentage": 23.0, "elapsed_time": "4:55:40", "remaining_time": "16:29:36"}
|
163 |
-
{"current_steps": 1630, "total_steps": 7042, "loss": 0.4077, "lr": 1.896685371114059e-05, "epoch": 0.46293666571996595, "percentage": 23.15, "elapsed_time": "4:57:29", "remaining_time": "16:27:43"}
|
164 |
-
{"current_steps": 1640, "total_steps": 7042, "loss": 0.4037, "lr": 1.8944798149465394e-05, "epoch": 0.4657767679636467, "percentage": 23.29, "elapsed_time": "4:59:18", "remaining_time": "16:25:53"}
|
165 |
-
{"current_steps": 1650, "total_steps": 7042, "loss": 0.4018, "lr": 1.892252275018406e-05, "epoch": 0.46861687020732745, "percentage": 23.43, "elapsed_time": "5:01:08", "remaining_time": "16:24:04"}
|
166 |
-
{"current_steps": 1660, "total_steps": 7042, "loss": 0.4015, "lr": 1.8900028060762317e-05, "epoch": 0.47145697245100826, "percentage": 23.57, "elapsed_time": "5:02:57", "remaining_time": "16:22:14"}
|
167 |
-
{"current_steps": 1670, "total_steps": 7042, "loss": 0.4089, "lr": 1.8877314634055418e-05, "epoch": 0.474297074694689, "percentage": 23.71, "elapsed_time": "5:04:45", "remaining_time": "16:20:19"}
|
168 |
-
{"current_steps": 1680, "total_steps": 7042, "loss": 0.3982, "lr": 1.8854383028294563e-05, "epoch": 0.47713717693836977, "percentage": 23.86, "elapsed_time": "5:06:34", "remaining_time": "16:18:28"}
|
169 |
-
{"current_steps": 1690, "total_steps": 7042, "loss": 0.3968, "lr": 1.8831233807073162e-05, "epoch": 0.4799772791820506, "percentage": 24.0, "elapsed_time": "5:08:22", "remaining_time": "16:16:34"}
|
170 |
-
{"current_steps": 1700, "total_steps": 7042, "loss": 0.3944, "lr": 1.8807867539333e-05, "epoch": 0.48281738142573133, "percentage": 24.14, "elapsed_time": "5:10:13", "remaining_time": "16:14:51"}
|
171 |
-
{"current_steps": 1710, "total_steps": 7042, "loss": 0.4025, "lr": 1.878428479935023e-05, "epoch": 0.4856574836694121, "percentage": 24.28, "elapsed_time": "5:12:00", "remaining_time": "16:12:52"}
|
172 |
-
{"current_steps": 1720, "total_steps": 7042, "loss": 0.4095, "lr": 1.876048616672129e-05, "epoch": 0.4884975859130929, "percentage": 24.42, "elapsed_time": "5:13:53", "remaining_time": "16:11:12"}
|
173 |
-
{"current_steps": 1730, "total_steps": 7042, "loss": 0.3907, "lr": 1.8736472226348643e-05, "epoch": 0.49133768815677364, "percentage": 24.57, "elapsed_time": "5:15:39", "remaining_time": "16:09:13"}
|
174 |
-
{"current_steps": 1740, "total_steps": 7042, "loss": 0.4054, "lr": 1.871224356842639e-05, "epoch": 0.4941777904004544, "percentage": 24.71, "elapsed_time": "5:17:27", "remaining_time": "16:07:20"}
|
175 |
-
{"current_steps": 1750, "total_steps": 7042, "loss": 0.3976, "lr": 1.868780078842579e-05, "epoch": 0.4970178926441352, "percentage": 24.85, "elapsed_time": "5:19:16", "remaining_time": "16:05:29"}
|
176 |
-
{"current_steps": 1760, "total_steps": 7042, "loss": 0.386, "lr": 1.86631444870806e-05, "epoch": 0.49985799488781596, "percentage": 24.99, "elapsed_time": "5:21:04", "remaining_time": "16:03:36"}
|
177 |
-
{"current_steps": 1770, "total_steps": 7042, "loss": 0.4006, "lr": 1.863827527037233e-05, "epoch": 0.5026980971314967, "percentage": 25.13, "elapsed_time": "5:22:54", "remaining_time": "16:01:48"}
|
178 |
-
{"current_steps": 1780, "total_steps": 7042, "loss": 0.3967, "lr": 1.8613193749515336e-05, "epoch": 0.5055381993751775, "percentage": 25.28, "elapsed_time": "5:24:45", "remaining_time": "16:00:02"}
|
179 |
-
{"current_steps": 1790, "total_steps": 7042, "loss": 0.4044, "lr": 1.858790054094181e-05, "epoch": 0.5083783016188583, "percentage": 25.42, "elapsed_time": "5:26:36", "remaining_time": "15:58:18"}
|
180 |
-
{"current_steps": 1800, "total_steps": 7042, "loss": 0.4004, "lr": 1.856239626628662e-05, "epoch": 0.511218403862539, "percentage": 25.56, "elapsed_time": "5:28:23", "remaining_time": "15:56:20"}
|
181 |
-
{"current_steps": 1810, "total_steps": 7042, "loss": 0.4036, "lr": 1.8536681552372035e-05, "epoch": 0.5140585061062198, "percentage": 25.7, "elapsed_time": "5:30:12", "remaining_time": "15:54:30"}
|
182 |
-
{"current_steps": 1820, "total_steps": 7042, "loss": 0.388, "lr": 1.8510757031192325e-05, "epoch": 0.5168986083499006, "percentage": 25.84, "elapsed_time": "5:32:00", "remaining_time": "15:52:37"}
|
183 |
-
{"current_steps": 1830, "total_steps": 7042, "loss": 0.4062, "lr": 1.848462333989822e-05, "epoch": 0.5197387105935813, "percentage": 25.99, "elapsed_time": "5:33:50", "remaining_time": "15:50:48"}
|
184 |
-
{"current_steps": 1840, "total_steps": 7042, "loss": 0.3988, "lr": 1.845828112078125e-05, "epoch": 0.5225788128372622, "percentage": 26.13, "elapsed_time": "5:35:42", "remaining_time": "15:49:06"}
|
185 |
-
{"current_steps": 1850, "total_steps": 7042, "loss": 0.3911, "lr": 1.843173102125798e-05, "epoch": 0.525418915080943, "percentage": 26.27, "elapsed_time": "5:37:30", "remaining_time": "15:47:11"}
|
186 |
-
{"current_steps": 1860, "total_steps": 7042, "loss": 0.3863, "lr": 1.8404973693854056e-05, "epoch": 0.5282590173246237, "percentage": 26.41, "elapsed_time": "5:39:20", "remaining_time": "15:45:23"}
|
187 |
-
{"current_steps": 1870, "total_steps": 7042, "loss": 0.4025, "lr": 1.837800979618822e-05, "epoch": 0.5310991195683045, "percentage": 26.55, "elapsed_time": "5:41:07", "remaining_time": "15:43:28"}
|
188 |
-
{"current_steps": 1880, "total_steps": 7042, "loss": 0.3911, "lr": 1.8350839990956104e-05, "epoch": 0.5339392218119853, "percentage": 26.7, "elapsed_time": "5:42:57", "remaining_time": "15:41:41"}
|
189 |
-
{"current_steps": 1890, "total_steps": 7042, "loss": 0.3998, "lr": 1.8323464945913967e-05, "epoch": 0.536779324055666, "percentage": 26.84, "elapsed_time": "5:44:48", "remaining_time": "15:39:55"}
|
190 |
-
{"current_steps": 1900, "total_steps": 7042, "loss": 0.3942, "lr": 1.829588533386228e-05, "epoch": 0.5396194262993468, "percentage": 26.98, "elapsed_time": "5:46:34", "remaining_time": "15:37:55"}
|
191 |
-
{"current_steps": 1910, "total_steps": 7042, "loss": 0.394, "lr": 1.8268101832629177e-05, "epoch": 0.5424595285430276, "percentage": 27.12, "elapsed_time": "5:48:24", "remaining_time": "15:36:07"}
|
192 |
-
{"current_steps": 1920, "total_steps": 7042, "loss": 0.3976, "lr": 1.8240115125053816e-05, "epoch": 0.5452996307867083, "percentage": 27.26, "elapsed_time": "5:50:13", "remaining_time": "15:34:16"}
|
193 |
-
{"current_steps": 1930, "total_steps": 7042, "loss": 0.3837, "lr": 1.821192589896958e-05, "epoch": 0.5481397330303891, "percentage": 27.41, "elapsed_time": "5:52:02", "remaining_time": "15:32:27"}
|
194 |
-
{"current_steps": 1940, "total_steps": 7042, "loss": 0.3884, "lr": 1.8183534847187184e-05, "epoch": 0.5509798352740699, "percentage": 27.55, "elapsed_time": "5:53:50", "remaining_time": "15:30:34"}
|
195 |
-
{"current_steps": 1950, "total_steps": 7042, "loss": 0.3965, "lr": 1.815494266747764e-05, "epoch": 0.5538199375177506, "percentage": 27.69, "elapsed_time": "5:55:38", "remaining_time": "15:28:39"}
|
196 |
-
{"current_steps": 1960, "total_steps": 7042, "loss": 0.3952, "lr": 1.8126150062555107e-05, "epoch": 0.5566600397614314, "percentage": 27.83, "elapsed_time": "5:57:22", "remaining_time": "15:26:37"}
|
197 |
-
{"current_steps": 1970, "total_steps": 7042, "loss": 0.4067, "lr": 1.809715774005963e-05, "epoch": 0.5595001420051122, "percentage": 27.98, "elapsed_time": "5:59:13", "remaining_time": "15:24:51"}
|
198 |
-
{"current_steps": 1980, "total_steps": 7042, "loss": 0.3957, "lr": 1.806796641253974e-05, "epoch": 0.5623402442487929, "percentage": 28.12, "elapsed_time": "6:00:59", "remaining_time": "15:22:55"}
|
199 |
-
{"current_steps": 1990, "total_steps": 7042, "loss": 0.4092, "lr": 1.8038576797434945e-05, "epoch": 0.5651803464924737, "percentage": 28.26, "elapsed_time": "6:02:49", "remaining_time": "15:21:07"}
|
200 |
-
{"current_steps": 2000, "total_steps": 7042, "loss": 0.3916, "lr": 1.8008989617058088e-05, "epoch": 0.5680204487361545, "percentage": 28.4, "elapsed_time": "6:04:37", "remaining_time": "15:19:13"}
|
201 |
-
{"current_steps": 2010, "total_steps": 7042, "loss": 0.3908, "lr": 1.797920559857761e-05, "epoch": 0.5708605509798352, "percentage": 28.54, "elapsed_time": "6:07:31", "remaining_time": "15:20:05"}
|
202 |
-
{"current_steps": 2020, "total_steps": 7042, "loss": 0.4008, "lr": 1.794922547399967e-05, "epoch": 0.573700653223516, "percentage": 28.69, "elapsed_time": "6:09:18", "remaining_time": "15:18:09"}
|
203 |
-
{"current_steps": 2030, "total_steps": 7042, "loss": 0.3922, "lr": 1.7919049980150155e-05, "epoch": 0.5765407554671969, "percentage": 28.83, "elapsed_time": "6:11:05", "remaining_time": "15:16:13"}
|
204 |
-
{"current_steps": 2040, "total_steps": 7042, "loss": 0.3874, "lr": 1.7888679858656566e-05, "epoch": 0.5793808577108776, "percentage": 28.97, "elapsed_time": "6:12:53", "remaining_time": "15:14:18"}
|
205 |
-
{"current_steps": 2050, "total_steps": 7042, "loss": 0.3915, "lr": 1.7858115855929797e-05, "epoch": 0.5822209599545584, "percentage": 29.11, "elapsed_time": "6:14:43", "remaining_time": "15:12:29"}
|
206 |
-
{"current_steps": 2060, "total_steps": 7042, "loss": 0.3911, "lr": 1.7827358723145803e-05, "epoch": 0.5850610621982392, "percentage": 29.25, "elapsed_time": "6:16:32", "remaining_time": "15:10:38"}
|
207 |
-
{"current_steps": 2070, "total_steps": 7042, "loss": 0.3854, "lr": 1.77964092162271e-05, "epoch": 0.5879011644419199, "percentage": 29.4, "elapsed_time": "6:18:18", "remaining_time": "15:08:41"}
|
208 |
-
{"current_steps": 2080, "total_steps": 7042, "loss": 0.3956, "lr": 1.7765268095824234e-05, "epoch": 0.5907412666856007, "percentage": 29.54, "elapsed_time": "6:20:08", "remaining_time": "15:06:50"}
|
209 |
-
{"current_steps": 2090, "total_steps": 7042, "loss": 0.3844, "lr": 1.7733936127297053e-05, "epoch": 0.5935813689292815, "percentage": 29.68, "elapsed_time": "6:21:57", "remaining_time": "15:05:00"}
|
210 |
-
{"current_steps": 2100, "total_steps": 7042, "loss": 0.3837, "lr": 1.7702414080695907e-05, "epoch": 0.5964214711729622, "percentage": 29.82, "elapsed_time": "6:23:47", "remaining_time": "15:03:10"}
|
211 |
-
{"current_steps": 2110, "total_steps": 7042, "loss": 0.3788, "lr": 1.7670702730742722e-05, "epoch": 0.599261573416643, "percentage": 29.96, "elapsed_time": "6:25:34", "remaining_time": "15:01:14"}
|
212 |
-
{"current_steps": 2120, "total_steps": 7042, "loss": 0.3848, "lr": 1.763880285681196e-05, "epoch": 0.6021016756603238, "percentage": 30.11, "elapsed_time": "6:27:20", "remaining_time": "14:59:18"}
|
213 |
-
{"current_steps": 2130, "total_steps": 7042, "loss": 0.3958, "lr": 1.7606715242911468e-05, "epoch": 0.6049417779040045, "percentage": 30.25, "elapsed_time": "6:29:07", "remaining_time": "14:57:21"}
|
214 |
-
{"current_steps": 2140, "total_steps": 7042, "loss": 0.3877, "lr": 1.7574440677663212e-05, "epoch": 0.6077818801476853, "percentage": 30.39, "elapsed_time": "6:30:56", "remaining_time": "14:55:31"}
|
215 |
-
{"current_steps": 2150, "total_steps": 7042, "loss": 0.3858, "lr": 1.7541979954283864e-05, "epoch": 0.6106219823913661, "percentage": 30.53, "elapsed_time": "6:32:42", "remaining_time": "14:53:32"}
|
216 |
-
{"current_steps": 2160, "total_steps": 7042, "loss": 0.3791, "lr": 1.7509333870565364e-05, "epoch": 0.6134620846350468, "percentage": 30.67, "elapsed_time": "6:34:32", "remaining_time": "14:51:43"}
|
217 |
-
{"current_steps": 2170, "total_steps": 7042, "loss": 0.3903, "lr": 1.7476503228855254e-05, "epoch": 0.6163021868787276, "percentage": 30.82, "elapsed_time": "6:36:21", "remaining_time": "14:49:52"}
|
218 |
-
{"current_steps": 2180, "total_steps": 7042, "loss": 0.3925, "lr": 1.744348883603699e-05, "epoch": 0.6191422891224084, "percentage": 30.96, "elapsed_time": "6:38:10", "remaining_time": "14:48:02"}
|
219 |
-
{"current_steps": 2190, "total_steps": 7042, "loss": 0.3901, "lr": 1.741029150351012e-05, "epoch": 0.6219823913660891, "percentage": 31.1, "elapsed_time": "6:40:00", "remaining_time": "14:46:13"}
|
220 |
-
{"current_steps": 2200, "total_steps": 7042, "loss": 0.3963, "lr": 1.7376912047170312e-05, "epoch": 0.6248224936097699, "percentage": 31.24, "elapsed_time": "6:41:48", "remaining_time": "14:44:20"}
|
221 |
-
{"current_steps": 2210, "total_steps": 7042, "loss": 0.3801, "lr": 1.7343351287389328e-05, "epoch": 0.6276625958534507, "percentage": 31.38, "elapsed_time": "6:43:36", "remaining_time": "14:42:27"}
|
222 |
-
{"current_steps": 2220, "total_steps": 7042, "loss": 0.3961, "lr": 1.730961004899484e-05, "epoch": 0.6305026980971314, "percentage": 31.53, "elapsed_time": "6:45:25", "remaining_time": "14:40:37"}
|
223 |
-
{"current_steps": 2230, "total_steps": 7042, "loss": 0.3914, "lr": 1.727568916125018e-05, "epoch": 0.6333428003408123, "percentage": 31.67, "elapsed_time": "6:47:13", "remaining_time": "14:38:43"}
|
224 |
-
{"current_steps": 2240, "total_steps": 7042, "loss": 0.3853, "lr": 1.724158945783394e-05, "epoch": 0.6361829025844931, "percentage": 31.81, "elapsed_time": "6:49:02", "remaining_time": "14:36:53"}
|
225 |
-
{"current_steps": 2250, "total_steps": 7042, "loss": 0.3939, "lr": 1.72073117768195e-05, "epoch": 0.6390230048281739, "percentage": 31.95, "elapsed_time": "6:50:51", "remaining_time": "14:35:01"}
|
226 |
-
{"current_steps": 2260, "total_steps": 7042, "loss": 0.373, "lr": 1.717285696065441e-05, "epoch": 0.6418631070718546, "percentage": 32.09, "elapsed_time": "6:52:38", "remaining_time": "14:33:06"}
|
227 |
-
{"current_steps": 2270, "total_steps": 7042, "loss": 0.3961, "lr": 1.7138225856139707e-05, "epoch": 0.6447032093155354, "percentage": 32.24, "elapsed_time": "6:54:27", "remaining_time": "14:31:15"}
|
228 |
-
{"current_steps": 2280, "total_steps": 7042, "loss": 0.3874, "lr": 1.7103419314409084e-05, "epoch": 0.6475433115592162, "percentage": 32.38, "elapsed_time": "6:56:16", "remaining_time": "14:29:25"}
|
229 |
-
{"current_steps": 2290, "total_steps": 7042, "loss": 0.3802, "lr": 1.7068438190907987e-05, "epoch": 0.6503834138028969, "percentage": 32.52, "elapsed_time": "6:58:02", "remaining_time": "14:27:29"}
|
230 |
-
{"current_steps": 2300, "total_steps": 7042, "loss": 0.3895, "lr": 1.7033283345372577e-05, "epoch": 0.6532235160465777, "percentage": 32.66, "elapsed_time": "6:59:52", "remaining_time": "14:25:39"}
|
231 |
-
{"current_steps": 2310, "total_steps": 7042, "loss": 0.4052, "lr": 1.6997955641808607e-05, "epoch": 0.6560636182902585, "percentage": 32.8, "elapsed_time": "7:01:44", "remaining_time": "14:23:55"}
|
232 |
-
{"current_steps": 2320, "total_steps": 7042, "loss": 0.3883, "lr": 1.6962455948470197e-05, "epoch": 0.6589037205339392, "percentage": 32.95, "elapsed_time": "7:03:34", "remaining_time": "14:22:07"}
|
233 |
-
{"current_steps": 2330, "total_steps": 7042, "loss": 0.3877, "lr": 1.6926785137838475e-05, "epoch": 0.66174382277762, "percentage": 33.09, "elapsed_time": "7:05:25", "remaining_time": "14:20:20"}
|
234 |
-
{"current_steps": 2340, "total_steps": 7042, "loss": 0.3796, "lr": 1.6890944086600145e-05, "epoch": 0.6645839250213008, "percentage": 33.23, "elapsed_time": "7:07:14", "remaining_time": "14:18:30"}
|
235 |
-
{"current_steps": 2350, "total_steps": 7042, "loss": 0.3828, "lr": 1.685493367562594e-05, "epoch": 0.6674240272649815, "percentage": 33.37, "elapsed_time": "7:09:05", "remaining_time": "14:16:42"}
|
236 |
-
{"current_steps": 2360, "total_steps": 7042, "loss": 0.3836, "lr": 1.6818754789948974e-05, "epoch": 0.6702641295086623, "percentage": 33.51, "elapsed_time": "7:10:55", "remaining_time": "14:14:55"}
|
237 |
-
{"current_steps": 2370, "total_steps": 7042, "loss": 0.388, "lr": 1.678240831874299e-05, "epoch": 0.6731042317523431, "percentage": 33.66, "elapsed_time": "7:12:45", "remaining_time": "14:13:05"}
|
238 |
-
{"current_steps": 2380, "total_steps": 7042, "loss": 0.3803, "lr": 1.674589515530049e-05, "epoch": 0.6759443339960238, "percentage": 33.8, "elapsed_time": "7:14:35", "remaining_time": "14:11:17"}
|
239 |
-
{"current_steps": 2390, "total_steps": 7042, "loss": 0.3812, "lr": 1.670921619701082e-05, "epoch": 0.6787844362397046, "percentage": 33.94, "elapsed_time": "7:16:25", "remaining_time": "14:09:28"}
|
240 |
-
{"current_steps": 2400, "total_steps": 7042, "loss": 0.3792, "lr": 1.6672372345338067e-05, "epoch": 0.6816245384833854, "percentage": 34.08, "elapsed_time": "7:18:11", "remaining_time": "14:07:31"}
|
241 |
-
{"current_steps": 2410, "total_steps": 7042, "loss": 0.3882, "lr": 1.6635364505798946e-05, "epoch": 0.6844646407270661, "percentage": 34.22, "elapsed_time": "7:19:59", "remaining_time": "14:05:39"}
|
242 |
-
{"current_steps": 2420, "total_steps": 7042, "loss": 0.3812, "lr": 1.6598193587940508e-05, "epoch": 0.687304742970747, "percentage": 34.37, "elapsed_time": "7:21:48", "remaining_time": "14:03:48"}
|
243 |
-
{"current_steps": 2430, "total_steps": 7042, "loss": 0.3851, "lr": 1.6560860505317813e-05, "epoch": 0.6901448452144278, "percentage": 34.51, "elapsed_time": "7:23:38", "remaining_time": "14:02:00"}
|
244 |
-
{"current_steps": 2440, "total_steps": 7042, "loss": 0.3926, "lr": 1.652336617547147e-05, "epoch": 0.6929849474581085, "percentage": 34.65, "elapsed_time": "7:25:26", "remaining_time": "14:00:07"}
|
245 |
-
{"current_steps": 2450, "total_steps": 7042, "loss": 0.3811, "lr": 1.648571151990508e-05, "epoch": 0.6958250497017893, "percentage": 34.79, "elapsed_time": "7:27:16", "remaining_time": "13:58:19"}
|
246 |
-
{"current_steps": 2460, "total_steps": 7042, "loss": 0.3944, "lr": 1.6447897464062593e-05, "epoch": 0.6986651519454701, "percentage": 34.93, "elapsed_time": "7:29:03", "remaining_time": "13:56:24"}
|
247 |
-
{"current_steps": 2470, "total_steps": 7042, "loss": 0.3687, "lr": 1.6409924937305567e-05, "epoch": 0.7015052541891508, "percentage": 35.08, "elapsed_time": "7:30:50", "remaining_time": "13:54:31"}
|
248 |
-
{"current_steps": 2480, "total_steps": 7042, "loss": 0.393, "lr": 1.637179487289032e-05, "epoch": 0.7043453564328316, "percentage": 35.22, "elapsed_time": "7:32:36", "remaining_time": "13:52:35"}
|
249 |
-
{"current_steps": 2490, "total_steps": 7042, "loss": 0.3874, "lr": 1.6333508207944987e-05, "epoch": 0.7071854586765124, "percentage": 35.36, "elapsed_time": "7:34:25", "remaining_time": "13:50:44"}
|
250 |
-
{"current_steps": 2500, "total_steps": 7042, "loss": 0.3759, "lr": 1.6295065883446514e-05, "epoch": 0.7100255609201931, "percentage": 35.5, "elapsed_time": "7:36:14", "remaining_time": "13:48:53"}
|
251 |
-
{"current_steps": 2510, "total_steps": 7042, "loss": 0.3839, "lr": 1.6256468844197503e-05, "epoch": 0.7128656631638739, "percentage": 35.64, "elapsed_time": "7:39:09", "remaining_time": "13:49:02"}
|
|
|
1 |
+
{"current_steps": 2800, "total_steps": 7042, "loss": 0.3833, "lr": 1.5074232636104824e-05, "epoch": 0.7952286282306164, "percentage": 39.76, "elapsed_time": "8:31:34", "remaining_time": "12:55:02"}
|
2 |
+
{"current_steps": 10, "total_steps": 7042, "loss": 7.3847, "lr": 2.8368794326241136e-07, "epoch": 0.0028401022436807723, "percentage": 0.14, "elapsed_time": "0:01:51", "remaining_time": "21:43:53"}
|
3 |
+
{"current_steps": 2810, "total_steps": 7042, "loss": 0.3727, "lr": 1.503145149114114e-05, "epoch": 0.798068730474297, "percentage": 39.9, "elapsed_time": "8:33:21", "remaining_time": "12:53:08"}
|
4 |
+
{"current_steps": 20, "total_steps": 7042, "loss": 7.3917, "lr": 5.673758865248227e-07, "epoch": 0.005680204487361545, "percentage": 0.28, "elapsed_time": "0:03:40", "remaining_time": "21:27:48"}
|
5 |
+
{"current_steps": 2820, "total_steps": 7042, "loss": 0.3742, "lr": 1.4988546687461774e-05, "epoch": 0.8009088327179779, "percentage": 40.05, "elapsed_time": "8:35:07", "remaining_time": "12:51:13"}
|
6 |
+
{"current_steps": 30, "total_steps": 7042, "loss": 6.8405, "lr": 8.510638297872341e-07, "epoch": 0.008520306731042317, "percentage": 0.43, "elapsed_time": "0:05:30", "remaining_time": "21:25:35"}
|
7 |
+
{"current_steps": 2830, "total_steps": 7042, "loss": 0.3719, "lr": 1.4945519279544325e-05, "epoch": 0.8037489349616587, "percentage": 40.19, "elapsed_time": "8:36:55", "remaining_time": "12:49:21"}
|
8 |
+
{"current_steps": 40, "total_steps": 7042, "loss": 5.6289, "lr": 1.1347517730496454e-06, "epoch": 0.01136040897472309, "percentage": 0.57, "elapsed_time": "0:07:16", "remaining_time": "21:13:35"}
|
9 |
+
{"current_steps": 2840, "total_steps": 7042, "loss": 0.379, "lr": 1.4902370324879668e-05, "epoch": 0.8065890372053394, "percentage": 40.33, "elapsed_time": "8:38:45", "remaining_time": "12:47:32"}
|
10 |
+
{"current_steps": 50, "total_steps": 7042, "loss": 5.2088, "lr": 1.418439716312057e-06, "epoch": 0.014200511218403862, "percentage": 0.71, "elapsed_time": "0:09:01", "remaining_time": "21:01:29"}
|
11 |
+
{"current_steps": 2850, "total_steps": 7042, "loss": 0.369, "lr": 1.4859100883945936e-05, "epoch": 0.8094291394490202, "percentage": 40.47, "elapsed_time": "8:40:34", "remaining_time": "12:45:42"}
|
12 |
+
{"current_steps": 60, "total_steps": 7042, "loss": 4.5475, "lr": 1.7021276595744682e-06, "epoch": 0.017040613462084634, "percentage": 0.85, "elapsed_time": "0:10:50", "remaining_time": "21:00:40"}
|
13 |
+
{"current_steps": 2860, "total_steps": 7042, "loss": 0.3685, "lr": 1.4815712020182482e-05, "epoch": 0.812269241692701, "percentage": 40.61, "elapsed_time": "8:42:23", "remaining_time": "12:43:50"}
|
14 |
+
{"current_steps": 70, "total_steps": 7042, "loss": 4.246, "lr": 1.9858156028368797e-06, "epoch": 0.019880715705765408, "percentage": 0.99, "elapsed_time": "0:12:37", "remaining_time": "20:57:12"}
|
15 |
+
{"current_steps": 2870, "total_steps": 7042, "loss": 0.3781, "lr": 1.4772204799963723e-05, "epoch": 0.8151093439363817, "percentage": 40.76, "elapsed_time": "8:44:14", "remaining_time": "12:42:03"}
|
16 |
+
{"current_steps": 80, "total_steps": 7042, "loss": 4.0109, "lr": 2.269503546099291e-06, "epoch": 0.02272081794944618, "percentage": 1.14, "elapsed_time": "0:14:26", "remaining_time": "20:56:13"}
|
17 |
+
{"current_steps": 2880, "total_steps": 7042, "loss": 0.3801, "lr": 1.4728580292572947e-05, "epoch": 0.8179494461800625, "percentage": 40.9, "elapsed_time": "8:46:04", "remaining_time": "12:40:15"}
|
18 |
+
{"current_steps": 90, "total_steps": 7042, "loss": 3.7207, "lr": 2.553191489361702e-06, "epoch": 0.025560920193126953, "percentage": 1.28, "elapsed_time": "0:16:13", "remaining_time": "20:53:15"}
|
19 |
+
{"current_steps": 2890, "total_steps": 7042, "loss": 0.3756, "lr": 1.468483957017602e-05, "epoch": 0.8207895484237433, "percentage": 41.04, "elapsed_time": "8:47:52", "remaining_time": "12:38:23"}
|
20 |
+
{"current_steps": 100, "total_steps": 7042, "loss": 3.3523, "lr": 2.836879432624114e-06, "epoch": 0.028401022436807723, "percentage": 1.42, "elapsed_time": "0:18:02", "remaining_time": "20:52:38"}
|
21 |
+
{"current_steps": 2900, "total_steps": 7042, "loss": 0.3857, "lr": 1.4640983707795042e-05, "epoch": 0.823629650667424, "percentage": 41.18, "elapsed_time": "8:49:38", "remaining_time": "12:36:28"}
|
22 |
+
{"current_steps": 110, "total_steps": 7042, "loss": 3.1659, "lr": 3.120567375886525e-06, "epoch": 0.031241124680488497, "percentage": 1.56, "elapsed_time": "0:19:49", "remaining_time": "20:49:28"}
|
23 |
+
{"current_steps": 2910, "total_steps": 7042, "loss": 0.3728, "lr": 1.459701378328193e-05, "epoch": 0.8264697529111048, "percentage": 41.32, "elapsed_time": "8:51:25", "remaining_time": "12:34:35"}
|
24 |
+
{"current_steps": 120, "total_steps": 7042, "loss": 2.754, "lr": 3.4042553191489363e-06, "epoch": 0.03408122692416927, "percentage": 1.7, "elapsed_time": "0:21:41", "remaining_time": "20:50:46"}
|
25 |
+
{"current_steps": 2920, "total_steps": 7042, "loss": 0.3773, "lr": 1.4552930877291915e-05, "epoch": 0.8293098551547856, "percentage": 41.47, "elapsed_time": "8:53:14", "remaining_time": "12:32:45"}
|
26 |
+
{"current_steps": 130, "total_steps": 7042, "loss": 2.3843, "lr": 3.6879432624113475e-06, "epoch": 0.03692132916785004, "percentage": 1.85, "elapsed_time": "0:23:31", "remaining_time": "20:50:23"}
|
27 |
+
{"current_steps": 2930, "total_steps": 7042, "loss": 0.389, "lr": 1.4508736073256997e-05, "epoch": 0.8321499573984663, "percentage": 41.61, "elapsed_time": "8:54:58", "remaining_time": "12:30:47"}
|
28 |
+
{"current_steps": 140, "total_steps": 7042, "loss": 2.0047, "lr": 3.9716312056737595e-06, "epoch": 0.039761431411530816, "percentage": 1.99, "elapsed_time": "0:25:18", "remaining_time": "20:47:49"}
|
29 |
+
{"current_steps": 2940, "total_steps": 7042, "loss": 0.3816, "lr": 1.4464430457359308e-05, "epoch": 0.8349900596421471, "percentage": 41.75, "elapsed_time": "8:56:46", "remaining_time": "12:28:55"}
|
30 |
+
{"current_steps": 150, "total_steps": 7042, "loss": 1.5855, "lr": 4.255319148936171e-06, "epoch": 0.04260153365521159, "percentage": 2.13, "elapsed_time": "0:27:06", "remaining_time": "20:45:39"}
|
31 |
+
{"current_steps": 2950, "total_steps": 7042, "loss": 0.3707, "lr": 1.442001511850442e-05, "epoch": 0.8378301618858279, "percentage": 41.89, "elapsed_time": "8:58:35", "remaining_time": "12:27:05"}
|
32 |
+
{"current_steps": 160, "total_steps": 7042, "loss": 1.2092, "lr": 4.539007092198582e-06, "epoch": 0.04544163589889236, "percentage": 2.27, "elapsed_time": "0:28:54", "remaining_time": "20:43:34"}
|
33 |
+
{"current_steps": 2960, "total_steps": 7042, "loss": 0.3687, "lr": 1.4375491148294578e-05, "epoch": 0.8406702641295086, "percentage": 42.03, "elapsed_time": "9:00:25", "remaining_time": "12:25:16"}
|
34 |
+
{"current_steps": 170, "total_steps": 7042, "loss": 0.9295, "lr": 4.822695035460993e-06, "epoch": 0.04828173814257313, "percentage": 2.41, "elapsed_time": "0:30:42", "remaining_time": "20:41:39"}
|
35 |
+
{"current_steps": 2970, "total_steps": 7042, "loss": 0.3782, "lr": 1.433085964100188e-05, "epoch": 0.8435103663731894, "percentage": 42.18, "elapsed_time": "9:02:13", "remaining_time": "12:23:25"}
|
36 |
+
{"current_steps": 180, "total_steps": 7042, "loss": 0.7546, "lr": 5.106382978723404e-06, "epoch": 0.051121840386253906, "percentage": 2.56, "elapsed_time": "0:32:31", "remaining_time": "20:39:37"}
|
37 |
+
{"current_steps": 2980, "total_steps": 7042, "loss": 0.3822, "lr": 1.4286121693541378e-05, "epoch": 0.8463504686168702, "percentage": 42.32, "elapsed_time": "9:04:03", "remaining_time": "12:21:35"}
|
38 |
+
{"current_steps": 190, "total_steps": 7042, "loss": 0.6663, "lr": 5.390070921985816e-06, "epoch": 0.05396194262993468, "percentage": 2.7, "elapsed_time": "0:34:20", "remaining_time": "20:38:42"}
|
39 |
+
{"current_steps": 2990, "total_steps": 7042, "loss": 0.3712, "lr": 1.424127840544412e-05, "epoch": 0.8491905708605509, "percentage": 42.46, "elapsed_time": "9:05:54", "remaining_time": "12:19:48"}
|
40 |
+
{"current_steps": 200, "total_steps": 7042, "loss": 0.6311, "lr": 5.673758865248228e-06, "epoch": 0.05680204487361545, "percentage": 2.84, "elapsed_time": "0:36:10", "remaining_time": "20:37:49"}
|
41 |
+
{"current_steps": 3000, "total_steps": 7042, "loss": 0.3869, "lr": 1.419633087883012e-05, "epoch": 0.8520306731042318, "percentage": 42.6, "elapsed_time": "9:07:40", "remaining_time": "12:17:53"}
|
42 |
+
{"current_steps": 210, "total_steps": 7042, "loss": 0.5941, "lr": 5.957446808510638e-06, "epoch": 0.05964214711729622, "percentage": 2.98, "elapsed_time": "0:38:00", "remaining_time": "20:36:16"}
|
43 |
+
{"current_steps": 3010, "total_steps": 7042, "loss": 0.3689, "lr": 1.4151280218381287e-05, "epoch": 0.8548707753479126, "percentage": 42.74, "elapsed_time": "9:10:36", "remaining_time": "12:17:34"}
|
44 |
+
{"current_steps": 220, "total_steps": 7042, "loss": 0.5608, "lr": 6.24113475177305e-06, "epoch": 0.062482249360976995, "percentage": 3.12, "elapsed_time": "0:39:48", "remaining_time": "20:34:27"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|