sedrickkeh
commited on
Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67c0dd50a4708e73af55c2c33ab3aaa3864bed8db676177bf8007165bcb98739
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b16a764412df2696d160469057a22c95f85a3811f0592c52ccb3a2c6d021af3d
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82cbf0f7c2bc52edad1c79e06b22283f7b3aaa8dc7ab3e58e2f1716d4505ba14
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9eb670784f42929f2fc21b16e9f2a1001ad37f564a7287414ba599a78bd62a7
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -199,3 +199,102 @@
|
|
199 |
{"current_steps": 1980, "total_steps": 2988, "loss": 0.688, "lr": 5e-06, "epoch": 1.9869543401906673, "percentage": 66.27, "elapsed_time": "16:14:01", "remaining_time": "8:15:51"}
|
200 |
{"current_steps": 1990, "total_steps": 2988, "loss": 0.6916, "lr": 5e-06, "epoch": 1.996989463120923, "percentage": 66.6, "elapsed_time": "16:18:53", "remaining_time": "8:10:55"}
|
201 |
{"current_steps": 1993, "total_steps": 2988, "eval_loss": 0.7170566320419312, "epoch": 2.0, "percentage": 66.7, "elapsed_time": "16:29:13", "remaining_time": "8:13:51"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
199 |
{"current_steps": 1980, "total_steps": 2988, "loss": 0.688, "lr": 5e-06, "epoch": 1.9869543401906673, "percentage": 66.27, "elapsed_time": "16:14:01", "remaining_time": "8:15:51"}
|
200 |
{"current_steps": 1990, "total_steps": 2988, "loss": 0.6916, "lr": 5e-06, "epoch": 1.996989463120923, "percentage": 66.6, "elapsed_time": "16:18:53", "remaining_time": "8:10:55"}
|
201 |
{"current_steps": 1993, "total_steps": 2988, "eval_loss": 0.7170566320419312, "epoch": 2.0, "percentage": 66.7, "elapsed_time": "16:29:13", "remaining_time": "8:13:51"}
|
202 |
+
{"current_steps": 2000, "total_steps": 2988, "loss": 0.6927, "lr": 5e-06, "epoch": 2.007024586051179, "percentage": 66.93, "elapsed_time": "16:33:36", "remaining_time": "8:10:50"}
|
203 |
+
{"current_steps": 2010, "total_steps": 2988, "loss": 0.6458, "lr": 5e-06, "epoch": 2.017059708981435, "percentage": 67.27, "elapsed_time": "16:38:28", "remaining_time": "8:05:49"}
|
204 |
+
{"current_steps": 2020, "total_steps": 2988, "loss": 0.6452, "lr": 5e-06, "epoch": 2.027094831911691, "percentage": 67.6, "elapsed_time": "16:43:20", "remaining_time": "8:00:48"}
|
205 |
+
{"current_steps": 2030, "total_steps": 2988, "loss": 0.6464, "lr": 5e-06, "epoch": 2.037129954841947, "percentage": 67.94, "elapsed_time": "16:48:12", "remaining_time": "7:55:47"}
|
206 |
+
{"current_steps": 2040, "total_steps": 2988, "loss": 0.6441, "lr": 5e-06, "epoch": 2.0471650777722026, "percentage": 68.27, "elapsed_time": "16:53:05", "remaining_time": "7:50:47"}
|
207 |
+
{"current_steps": 2050, "total_steps": 2988, "loss": 0.6488, "lr": 5e-06, "epoch": 2.0572002007024586, "percentage": 68.61, "elapsed_time": "16:57:57", "remaining_time": "7:45:46"}
|
208 |
+
{"current_steps": 2060, "total_steps": 2988, "loss": 0.6469, "lr": 5e-06, "epoch": 2.0672353236327146, "percentage": 68.94, "elapsed_time": "17:02:49", "remaining_time": "7:40:46"}
|
209 |
+
{"current_steps": 2070, "total_steps": 2988, "loss": 0.6442, "lr": 5e-06, "epoch": 2.0772704465629706, "percentage": 69.28, "elapsed_time": "17:07:42", "remaining_time": "7:35:45"}
|
210 |
+
{"current_steps": 2080, "total_steps": 2988, "loss": 0.6501, "lr": 5e-06, "epoch": 2.087305569493226, "percentage": 69.61, "elapsed_time": "17:12:34", "remaining_time": "7:30:45"}
|
211 |
+
{"current_steps": 2090, "total_steps": 2988, "loss": 0.6509, "lr": 5e-06, "epoch": 2.097340692423482, "percentage": 69.95, "elapsed_time": "17:17:26", "remaining_time": "7:25:45"}
|
212 |
+
{"current_steps": 2100, "total_steps": 2988, "loss": 0.6476, "lr": 5e-06, "epoch": 2.107375815353738, "percentage": 70.28, "elapsed_time": "17:22:18", "remaining_time": "7:20:45"}
|
213 |
+
{"current_steps": 2110, "total_steps": 2988, "loss": 0.6451, "lr": 5e-06, "epoch": 2.117410938283994, "percentage": 70.62, "elapsed_time": "17:27:11", "remaining_time": "7:15:44"}
|
214 |
+
{"current_steps": 2120, "total_steps": 2988, "loss": 0.6452, "lr": 5e-06, "epoch": 2.12744606121425, "percentage": 70.95, "elapsed_time": "17:32:02", "remaining_time": "7:10:44"}
|
215 |
+
{"current_steps": 2130, "total_steps": 2988, "loss": 0.6501, "lr": 5e-06, "epoch": 2.1374811841445056, "percentage": 71.29, "elapsed_time": "17:36:53", "remaining_time": "7:05:44"}
|
216 |
+
{"current_steps": 2140, "total_steps": 2988, "loss": 0.6483, "lr": 5e-06, "epoch": 2.1475163070747616, "percentage": 71.62, "elapsed_time": "17:41:45", "remaining_time": "7:00:44"}
|
217 |
+
{"current_steps": 2150, "total_steps": 2988, "loss": 0.6488, "lr": 5e-06, "epoch": 2.1575514300050176, "percentage": 71.95, "elapsed_time": "17:46:37", "remaining_time": "6:55:44"}
|
218 |
+
{"current_steps": 2160, "total_steps": 2988, "loss": 0.6448, "lr": 5e-06, "epoch": 2.1675865529352736, "percentage": 72.29, "elapsed_time": "17:51:29", "remaining_time": "6:50:44"}
|
219 |
+
{"current_steps": 2170, "total_steps": 2988, "loss": 0.6444, "lr": 5e-06, "epoch": 2.177621675865529, "percentage": 72.62, "elapsed_time": "17:56:21", "remaining_time": "6:45:44"}
|
220 |
+
{"current_steps": 2180, "total_steps": 2988, "loss": 0.6495, "lr": 5e-06, "epoch": 2.187656798795785, "percentage": 72.96, "elapsed_time": "18:01:13", "remaining_time": "6:40:44"}
|
221 |
+
{"current_steps": 2190, "total_steps": 2988, "loss": 0.6525, "lr": 5e-06, "epoch": 2.197691921726041, "percentage": 73.29, "elapsed_time": "18:06:05", "remaining_time": "6:35:45"}
|
222 |
+
{"current_steps": 2200, "total_steps": 2988, "loss": 0.6492, "lr": 5e-06, "epoch": 2.207727044656297, "percentage": 73.63, "elapsed_time": "18:10:57", "remaining_time": "6:30:45"}
|
223 |
+
{"current_steps": 2210, "total_steps": 2988, "loss": 0.6531, "lr": 5e-06, "epoch": 2.217762167586553, "percentage": 73.96, "elapsed_time": "18:15:49", "remaining_time": "6:25:46"}
|
224 |
+
{"current_steps": 2220, "total_steps": 2988, "loss": 0.6486, "lr": 5e-06, "epoch": 2.2277972905168086, "percentage": 74.3, "elapsed_time": "18:20:41", "remaining_time": "6:20:46"}
|
225 |
+
{"current_steps": 2230, "total_steps": 2988, "loss": 0.6477, "lr": 5e-06, "epoch": 2.2378324134470646, "percentage": 74.63, "elapsed_time": "18:25:32", "remaining_time": "6:15:47"}
|
226 |
+
{"current_steps": 2240, "total_steps": 2988, "loss": 0.6476, "lr": 5e-06, "epoch": 2.2478675363773206, "percentage": 74.97, "elapsed_time": "18:30:25", "remaining_time": "6:10:47"}
|
227 |
+
{"current_steps": 2250, "total_steps": 2988, "loss": 0.6468, "lr": 5e-06, "epoch": 2.2579026593075766, "percentage": 75.3, "elapsed_time": "18:35:17", "remaining_time": "6:05:48"}
|
228 |
+
{"current_steps": 2260, "total_steps": 2988, "loss": 0.6493, "lr": 5e-06, "epoch": 2.2679377822378326, "percentage": 75.64, "elapsed_time": "18:40:09", "remaining_time": "6:00:49"}
|
229 |
+
{"current_steps": 2270, "total_steps": 2988, "loss": 0.6494, "lr": 5e-06, "epoch": 2.277972905168088, "percentage": 75.97, "elapsed_time": "18:45:02", "remaining_time": "5:55:50"}
|
230 |
+
{"current_steps": 2280, "total_steps": 2988, "loss": 0.6488, "lr": 5e-06, "epoch": 2.288008028098344, "percentage": 76.31, "elapsed_time": "18:49:54", "remaining_time": "5:50:51"}
|
231 |
+
{"current_steps": 2290, "total_steps": 2988, "loss": 0.6443, "lr": 5e-06, "epoch": 2.2980431510286, "percentage": 76.64, "elapsed_time": "18:54:46", "remaining_time": "5:45:52"}
|
232 |
+
{"current_steps": 2300, "total_steps": 2988, "loss": 0.6511, "lr": 5e-06, "epoch": 2.308078273958856, "percentage": 76.97, "elapsed_time": "18:59:38", "remaining_time": "5:40:54"}
|
233 |
+
{"current_steps": 2310, "total_steps": 2988, "loss": 0.6521, "lr": 5e-06, "epoch": 2.318113396889112, "percentage": 77.31, "elapsed_time": "19:04:31", "remaining_time": "5:35:55"}
|
234 |
+
{"current_steps": 2320, "total_steps": 2988, "loss": 0.6499, "lr": 5e-06, "epoch": 2.3281485198193677, "percentage": 77.64, "elapsed_time": "19:09:23", "remaining_time": "5:30:56"}
|
235 |
+
{"current_steps": 2330, "total_steps": 2988, "loss": 0.6497, "lr": 5e-06, "epoch": 2.3381836427496236, "percentage": 77.98, "elapsed_time": "19:14:14", "remaining_time": "5:25:57"}
|
236 |
+
{"current_steps": 2340, "total_steps": 2988, "loss": 0.6465, "lr": 5e-06, "epoch": 2.3482187656798796, "percentage": 78.31, "elapsed_time": "19:19:07", "remaining_time": "5:20:59"}
|
237 |
+
{"current_steps": 2350, "total_steps": 2988, "loss": 0.6471, "lr": 5e-06, "epoch": 2.3582538886101356, "percentage": 78.65, "elapsed_time": "19:23:59", "remaining_time": "5:16:00"}
|
238 |
+
{"current_steps": 2360, "total_steps": 2988, "loss": 0.6499, "lr": 5e-06, "epoch": 2.368289011540391, "percentage": 78.98, "elapsed_time": "19:28:51", "remaining_time": "5:11:02"}
|
239 |
+
{"current_steps": 2370, "total_steps": 2988, "loss": 0.6542, "lr": 5e-06, "epoch": 2.378324134470647, "percentage": 79.32, "elapsed_time": "19:33:43", "remaining_time": "5:06:03"}
|
240 |
+
{"current_steps": 2380, "total_steps": 2988, "loss": 0.6519, "lr": 5e-06, "epoch": 2.388359257400903, "percentage": 79.65, "elapsed_time": "19:38:35", "remaining_time": "5:01:05"}
|
241 |
+
{"current_steps": 2390, "total_steps": 2988, "loss": 0.6453, "lr": 5e-06, "epoch": 2.398394380331159, "percentage": 79.99, "elapsed_time": "19:43:26", "remaining_time": "4:56:06"}
|
242 |
+
{"current_steps": 2400, "total_steps": 2988, "loss": 0.6502, "lr": 5e-06, "epoch": 2.408429503261415, "percentage": 80.32, "elapsed_time": "19:48:17", "remaining_time": "4:51:08"}
|
243 |
+
{"current_steps": 2410, "total_steps": 2988, "loss": 0.651, "lr": 5e-06, "epoch": 2.4184646261916707, "percentage": 80.66, "elapsed_time": "19:53:09", "remaining_time": "4:46:09"}
|
244 |
+
{"current_steps": 2420, "total_steps": 2988, "loss": 0.6533, "lr": 5e-06, "epoch": 2.4284997491219267, "percentage": 80.99, "elapsed_time": "19:58:01", "remaining_time": "4:41:11"}
|
245 |
+
{"current_steps": 2430, "total_steps": 2988, "loss": 0.6495, "lr": 5e-06, "epoch": 2.4385348720521827, "percentage": 81.33, "elapsed_time": "20:02:53", "remaining_time": "4:36:13"}
|
246 |
+
{"current_steps": 2440, "total_steps": 2988, "loss": 0.6535, "lr": 5e-06, "epoch": 2.4485699949824387, "percentage": 81.66, "elapsed_time": "20:07:45", "remaining_time": "4:31:15"}
|
247 |
+
{"current_steps": 2450, "total_steps": 2988, "loss": 0.6501, "lr": 5e-06, "epoch": 2.458605117912694, "percentage": 81.99, "elapsed_time": "20:12:37", "remaining_time": "4:26:16"}
|
248 |
+
{"current_steps": 2460, "total_steps": 2988, "loss": 0.6514, "lr": 5e-06, "epoch": 2.46864024084295, "percentage": 82.33, "elapsed_time": "20:17:29", "remaining_time": "4:21:18"}
|
249 |
+
{"current_steps": 2470, "total_steps": 2988, "loss": 0.6567, "lr": 5e-06, "epoch": 2.478675363773206, "percentage": 82.66, "elapsed_time": "20:22:21", "remaining_time": "4:16:20"}
|
250 |
+
{"current_steps": 2480, "total_steps": 2988, "loss": 0.6468, "lr": 5e-06, "epoch": 2.488710486703462, "percentage": 83.0, "elapsed_time": "20:27:13", "remaining_time": "4:11:22"}
|
251 |
+
{"current_steps": 2490, "total_steps": 2988, "loss": 0.6494, "lr": 5e-06, "epoch": 2.498745609633718, "percentage": 83.33, "elapsed_time": "20:32:05", "remaining_time": "4:06:25"}
|
252 |
+
{"current_steps": 2500, "total_steps": 2988, "loss": 0.6575, "lr": 5e-06, "epoch": 2.5087807325639737, "percentage": 83.67, "elapsed_time": "20:36:57", "remaining_time": "4:01:27"}
|
253 |
+
{"current_steps": 2510, "total_steps": 2988, "loss": 0.6529, "lr": 5e-06, "epoch": 2.5188158554942297, "percentage": 84.0, "elapsed_time": "20:41:49", "remaining_time": "3:56:29"}
|
254 |
+
{"current_steps": 2520, "total_steps": 2988, "loss": 0.6486, "lr": 5e-06, "epoch": 2.5288509784244857, "percentage": 84.34, "elapsed_time": "20:46:41", "remaining_time": "3:51:31"}
|
255 |
+
{"current_steps": 2530, "total_steps": 2988, "loss": 0.6479, "lr": 5e-06, "epoch": 2.5388861013547417, "percentage": 84.67, "elapsed_time": "20:51:34", "remaining_time": "3:46:34"}
|
256 |
+
{"current_steps": 2540, "total_steps": 2988, "loss": 0.6515, "lr": 5e-06, "epoch": 2.5489212242849977, "percentage": 85.01, "elapsed_time": "20:56:26", "remaining_time": "3:41:36"}
|
257 |
+
{"current_steps": 2550, "total_steps": 2988, "loss": 0.6529, "lr": 5e-06, "epoch": 2.5589563472152532, "percentage": 85.34, "elapsed_time": "21:01:18", "remaining_time": "3:36:38"}
|
258 |
+
{"current_steps": 2560, "total_steps": 2988, "loss": 0.6486, "lr": 5e-06, "epoch": 2.568991470145509, "percentage": 85.68, "elapsed_time": "21:06:11", "remaining_time": "3:31:41"}
|
259 |
+
{"current_steps": 2570, "total_steps": 2988, "loss": 0.6511, "lr": 5e-06, "epoch": 2.579026593075765, "percentage": 86.01, "elapsed_time": "21:11:03", "remaining_time": "3:26:43"}
|
260 |
+
{"current_steps": 2580, "total_steps": 2988, "loss": 0.6599, "lr": 5e-06, "epoch": 2.589061716006021, "percentage": 86.35, "elapsed_time": "21:15:55", "remaining_time": "3:21:46"}
|
261 |
+
{"current_steps": 2590, "total_steps": 2988, "loss": 0.6475, "lr": 5e-06, "epoch": 2.599096838936277, "percentage": 86.68, "elapsed_time": "21:20:47", "remaining_time": "3:16:49"}
|
262 |
+
{"current_steps": 2600, "total_steps": 2988, "loss": 0.6531, "lr": 5e-06, "epoch": 2.6091319618665327, "percentage": 87.01, "elapsed_time": "21:25:39", "remaining_time": "3:11:51"}
|
263 |
+
{"current_steps": 2610, "total_steps": 2988, "loss": 0.6532, "lr": 5e-06, "epoch": 2.6191670847967887, "percentage": 87.35, "elapsed_time": "21:30:31", "remaining_time": "3:06:54"}
|
264 |
+
{"current_steps": 2620, "total_steps": 2988, "loss": 0.6476, "lr": 5e-06, "epoch": 2.6292022077270447, "percentage": 87.68, "elapsed_time": "21:35:23", "remaining_time": "3:01:56"}
|
265 |
+
{"current_steps": 2630, "total_steps": 2988, "loss": 0.6499, "lr": 5e-06, "epoch": 2.6392373306573007, "percentage": 88.02, "elapsed_time": "21:40:15", "remaining_time": "2:56:59"}
|
266 |
+
{"current_steps": 2640, "total_steps": 2988, "loss": 0.6515, "lr": 5e-06, "epoch": 2.6492724535875567, "percentage": 88.35, "elapsed_time": "21:45:07", "remaining_time": "2:52:02"}
|
267 |
+
{"current_steps": 2650, "total_steps": 2988, "loss": 0.6528, "lr": 5e-06, "epoch": 2.6593075765178122, "percentage": 88.69, "elapsed_time": "21:49:59", "remaining_time": "2:47:05"}
|
268 |
+
{"current_steps": 2660, "total_steps": 2988, "loss": 0.6482, "lr": 5e-06, "epoch": 2.6693426994480682, "percentage": 89.02, "elapsed_time": "21:54:50", "remaining_time": "2:42:07"}
|
269 |
+
{"current_steps": 2670, "total_steps": 2988, "loss": 0.6521, "lr": 5e-06, "epoch": 2.6793778223783242, "percentage": 89.36, "elapsed_time": "21:59:42", "remaining_time": "2:37:10"}
|
270 |
+
{"current_steps": 2680, "total_steps": 2988, "loss": 0.6511, "lr": 5e-06, "epoch": 2.6894129453085798, "percentage": 89.69, "elapsed_time": "22:04:34", "remaining_time": "2:32:13"}
|
271 |
+
{"current_steps": 2690, "total_steps": 2988, "loss": 0.6502, "lr": 5e-06, "epoch": 2.6994480682388358, "percentage": 90.03, "elapsed_time": "22:09:26", "remaining_time": "2:27:16"}
|
272 |
+
{"current_steps": 2700, "total_steps": 2988, "loss": 0.6509, "lr": 5e-06, "epoch": 2.7094831911690918, "percentage": 90.36, "elapsed_time": "22:14:18", "remaining_time": "2:22:19"}
|
273 |
+
{"current_steps": 2710, "total_steps": 2988, "loss": 0.6522, "lr": 5e-06, "epoch": 2.7195183140993477, "percentage": 90.7, "elapsed_time": "22:19:10", "remaining_time": "2:17:22"}
|
274 |
+
{"current_steps": 2720, "total_steps": 2988, "loss": 0.6513, "lr": 5e-06, "epoch": 2.7295534370296037, "percentage": 91.03, "elapsed_time": "22:24:02", "remaining_time": "2:12:25"}
|
275 |
+
{"current_steps": 2730, "total_steps": 2988, "loss": 0.6551, "lr": 5e-06, "epoch": 2.7395885599598593, "percentage": 91.37, "elapsed_time": "22:28:54", "remaining_time": "2:07:28"}
|
276 |
+
{"current_steps": 2740, "total_steps": 2988, "loss": 0.6545, "lr": 5e-06, "epoch": 2.7496236828901153, "percentage": 91.7, "elapsed_time": "22:33:46", "remaining_time": "2:02:31"}
|
277 |
+
{"current_steps": 2750, "total_steps": 2988, "loss": 0.6538, "lr": 5e-06, "epoch": 2.7596588058203713, "percentage": 92.03, "elapsed_time": "22:38:37", "remaining_time": "1:57:34"}
|
278 |
+
{"current_steps": 2760, "total_steps": 2988, "loss": 0.6583, "lr": 5e-06, "epoch": 2.7696939287506273, "percentage": 92.37, "elapsed_time": "22:43:29", "remaining_time": "1:52:38"}
|
279 |
+
{"current_steps": 2770, "total_steps": 2988, "loss": 0.6545, "lr": 5e-06, "epoch": 2.7797290516808832, "percentage": 92.7, "elapsed_time": "22:48:21", "remaining_time": "1:47:41"}
|
280 |
+
{"current_steps": 2780, "total_steps": 2988, "loss": 0.6508, "lr": 5e-06, "epoch": 2.789764174611139, "percentage": 93.04, "elapsed_time": "22:53:12", "remaining_time": "1:42:44"}
|
281 |
+
{"current_steps": 2790, "total_steps": 2988, "loss": 0.6534, "lr": 5e-06, "epoch": 2.799799297541395, "percentage": 93.37, "elapsed_time": "22:58:05", "remaining_time": "1:37:47"}
|
282 |
+
{"current_steps": 2800, "total_steps": 2988, "loss": 0.6552, "lr": 5e-06, "epoch": 2.8098344204716508, "percentage": 93.71, "elapsed_time": "23:02:56", "remaining_time": "1:32:51"}
|
283 |
+
{"current_steps": 2810, "total_steps": 2988, "loss": 0.6541, "lr": 5e-06, "epoch": 2.8198695434019068, "percentage": 94.04, "elapsed_time": "23:07:48", "remaining_time": "1:27:54"}
|
284 |
+
{"current_steps": 2820, "total_steps": 2988, "loss": 0.648, "lr": 5e-06, "epoch": 2.8299046663321628, "percentage": 94.38, "elapsed_time": "23:12:40", "remaining_time": "1:22:58"}
|
285 |
+
{"current_steps": 2830, "total_steps": 2988, "loss": 0.6538, "lr": 5e-06, "epoch": 2.8399397892624183, "percentage": 94.71, "elapsed_time": "23:17:32", "remaining_time": "1:18:01"}
|
286 |
+
{"current_steps": 2840, "total_steps": 2988, "loss": 0.652, "lr": 5e-06, "epoch": 2.8499749121926743, "percentage": 95.05, "elapsed_time": "23:22:24", "remaining_time": "1:13:05"}
|
287 |
+
{"current_steps": 2850, "total_steps": 2988, "loss": 0.6574, "lr": 5e-06, "epoch": 2.8600100351229303, "percentage": 95.38, "elapsed_time": "23:27:16", "remaining_time": "1:08:08"}
|
288 |
+
{"current_steps": 2860, "total_steps": 2988, "loss": 0.6533, "lr": 5e-06, "epoch": 2.8700451580531863, "percentage": 95.72, "elapsed_time": "23:32:08", "remaining_time": "1:03:12"}
|
289 |
+
{"current_steps": 2870, "total_steps": 2988, "loss": 0.6516, "lr": 5e-06, "epoch": 2.8800802809834423, "percentage": 96.05, "elapsed_time": "23:37:00", "remaining_time": "0:58:15"}
|
290 |
+
{"current_steps": 2880, "total_steps": 2988, "loss": 0.6542, "lr": 5e-06, "epoch": 2.890115403913698, "percentage": 96.39, "elapsed_time": "23:41:52", "remaining_time": "0:53:19"}
|
291 |
+
{"current_steps": 2890, "total_steps": 2988, "loss": 0.6517, "lr": 5e-06, "epoch": 2.900150526843954, "percentage": 96.72, "elapsed_time": "23:46:44", "remaining_time": "0:48:22"}
|
292 |
+
{"current_steps": 2900, "total_steps": 2988, "loss": 0.6529, "lr": 5e-06, "epoch": 2.91018564977421, "percentage": 97.05, "elapsed_time": "23:51:36", "remaining_time": "0:43:26"}
|
293 |
+
{"current_steps": 2910, "total_steps": 2988, "loss": 0.6522, "lr": 5e-06, "epoch": 2.920220772704466, "percentage": 97.39, "elapsed_time": "23:56:28", "remaining_time": "0:38:30"}
|
294 |
+
{"current_steps": 2920, "total_steps": 2988, "loss": 0.6508, "lr": 5e-06, "epoch": 2.9302558956347218, "percentage": 97.72, "elapsed_time": "1 day, 0:01:20", "remaining_time": "0:33:33"}
|
295 |
+
{"current_steps": 2930, "total_steps": 2988, "loss": 0.6497, "lr": 5e-06, "epoch": 2.9402910185649773, "percentage": 98.06, "elapsed_time": "1 day, 0:06:12", "remaining_time": "0:28:37"}
|
296 |
+
{"current_steps": 2940, "total_steps": 2988, "loss": 0.6548, "lr": 5e-06, "epoch": 2.9503261414952333, "percentage": 98.39, "elapsed_time": "1 day, 0:11:04", "remaining_time": "0:23:41"}
|
297 |
+
{"current_steps": 2950, "total_steps": 2988, "loss": 0.6539, "lr": 5e-06, "epoch": 2.9603612644254893, "percentage": 98.73, "elapsed_time": "1 day, 0:15:56", "remaining_time": "0:18:45"}
|
298 |
+
{"current_steps": 2960, "total_steps": 2988, "loss": 0.6567, "lr": 5e-06, "epoch": 2.970396387355745, "percentage": 99.06, "elapsed_time": "1 day, 0:20:48", "remaining_time": "0:13:49"}
|
299 |
+
{"current_steps": 2970, "total_steps": 2988, "loss": 0.6547, "lr": 5e-06, "epoch": 2.980431510286001, "percentage": 99.4, "elapsed_time": "1 day, 0:25:40", "remaining_time": "0:08:52"}
|
300 |
+
{"current_steps": 2980, "total_steps": 2988, "loss": 0.6516, "lr": 5e-06, "epoch": 2.990466633216257, "percentage": 99.73, "elapsed_time": "1 day, 0:30:32", "remaining_time": "0:03:56"}
|