{"current_steps": 5, "total_steps": 930, "loss": 4.0376, "learning_rate": 4.999643406399275e-05, "epoch": 0.16, "percentage": 0.54, "elapsed_time": "0:03:48", "remaining_time": "11:44:40", "throughput": "27.16", "total_tokens": 6208} {"current_steps": 10, "total_steps": 930, "loss": 3.9633, "learning_rate": 4.998573727324295e-05, "epoch": 0.32, "percentage": 1.08, "elapsed_time": "0:07:38", "remaining_time": "11:43:13", "throughput": "26.10", "total_tokens": 11968} {"current_steps": 15, "total_steps": 930, "loss": 3.7175, "learning_rate": 4.9967912679276316e-05, "epoch": 0.48, "percentage": 1.61, "elapsed_time": "0:11:31", "remaining_time": "11:42:56", "throughput": "26.06", "total_tokens": 18016} {"current_steps": 20, "total_steps": 930, "loss": 3.6465, "learning_rate": 4.994296536700177e-05, "epoch": 0.64, "percentage": 2.15, "elapsed_time": "0:15:38", "remaining_time": "11:52:03", "throughput": "25.30", "total_tokens": 23760} {"current_steps": 25, "total_steps": 930, "loss": 3.6384, "learning_rate": 4.9910902453260824e-05, "epoch": 0.8, "percentage": 2.69, "elapsed_time": "0:19:58", "remaining_time": "12:03:17", "throughput": "24.73", "total_tokens": 29648} {"current_steps": 30, "total_steps": 930, "loss": 3.5703, "learning_rate": 4.987173308479738e-05, "epoch": 0.96, "percentage": 3.23, "elapsed_time": "0:24:21", "remaining_time": "12:10:35", "throughput": "24.62", "total_tokens": 35968} {"current_steps": 35, "total_steps": 930, "loss": 3.5096, "learning_rate": 4.982546843564834e-05, "epoch": 1.12, "percentage": 3.76, "elapsed_time": "0:28:39", "remaining_time": "12:12:58", "throughput": "24.49", "total_tokens": 42112} {"current_steps": 40, "total_steps": 930, "loss": 3.2806, "learning_rate": 4.977212170395598e-05, "epoch": 1.28, "percentage": 4.3, "elapsed_time": "0:32:56", "remaining_time": "12:12:56", "throughput": "24.46", "total_tokens": 48352} {"current_steps": 45, "total_steps": 930, "loss": 3.4431, "learning_rate": 4.971170810820279e-05, "epoch": 1.44, "percentage": 4.84, "elapsed_time": "0:36:47", "remaining_time": "12:03:38", "throughput": "24.52", "total_tokens": 54144} {"current_steps": 50, "total_steps": 930, "loss": 3.2597, "learning_rate": 4.964424488287009e-05, "epoch": 1.6, "percentage": 5.38, "elapsed_time": "0:40:40", "remaining_time": "11:55:50", "throughput": "24.68", "total_tokens": 60224} {"current_steps": 55, "total_steps": 930, "loss": 3.275, "learning_rate": 4.9569751273521454e-05, "epoch": 1.76, "percentage": 5.91, "elapsed_time": "0:44:33", "remaining_time": "11:48:58", "throughput": "24.87", "total_tokens": 66512} {"current_steps": 60, "total_steps": 930, "loss": 3.1563, "learning_rate": 4.948824853131236e-05, "epoch": 1.92, "percentage": 6.45, "elapsed_time": "0:48:24", "remaining_time": "11:41:55", "throughput": "24.86", "total_tokens": 72208} {"current_steps": 65, "total_steps": 930, "loss": 3.1883, "learning_rate": 4.939975990692789e-05, "epoch": 2.08, "percentage": 6.99, "elapsed_time": "0:52:16", "remaining_time": "11:35:35", "throughput": "24.99", "total_tokens": 78368} {"current_steps": 70, "total_steps": 930, "loss": 3.2454, "learning_rate": 4.930431064394977e-05, "epoch": 2.24, "percentage": 7.53, "elapsed_time": "0:56:08", "remaining_time": "11:29:43", "throughput": "25.02", "total_tokens": 84288} {"current_steps": 75, "total_steps": 930, "loss": 3.1905, "learning_rate": 4.920192797165511e-05, "epoch": 2.4, "percentage": 8.06, "elapsed_time": "0:59:59", "remaining_time": "11:23:58", "throughput": "25.13", "total_tokens": 90464} {"current_steps": 80, "total_steps": 930, "loss": 3.0087, "learning_rate": 4.909264109724853e-05, "epoch": 2.56, "percentage": 8.6, "elapsed_time": "1:03:52", "remaining_time": "11:18:42", "throughput": "25.23", "total_tokens": 96704} {"current_steps": 85, "total_steps": 930, "loss": 3.0016, "learning_rate": 4.897648119753006e-05, "epoch": 2.7199999999999998, "percentage": 9.14, "elapsed_time": "1:07:42", "remaining_time": "11:13:07", "throughput": "25.19", "total_tokens": 102352} {"current_steps": 90, "total_steps": 930, "loss": 3.1813, "learning_rate": 4.885348141000122e-05, "epoch": 2.88, "percentage": 9.68, "elapsed_time": "1:11:48", "remaining_time": "11:10:13", "throughput": "25.09", "total_tokens": 108112} {"current_steps": 95, "total_steps": 930, "loss": 3.1158, "learning_rate": 4.872367682341173e-05, "epoch": 3.04, "percentage": 10.22, "elapsed_time": "1:15:53", "remaining_time": "11:07:01", "throughput": "25.09", "total_tokens": 114240} {"current_steps": 100, "total_steps": 930, "loss": 2.9404, "learning_rate": 4.858710446774951e-05, "epoch": 3.2, "percentage": 10.75, "elapsed_time": "1:19:53", "remaining_time": "11:03:05", "throughput": "25.02", "total_tokens": 119936} {"current_steps": 105, "total_steps": 930, "loss": 2.9749, "learning_rate": 4.844380330367701e-05, "epoch": 3.36, "percentage": 11.29, "elapsed_time": "1:24:13", "remaining_time": "11:01:47", "throughput": "24.93", "total_tokens": 125984} {"current_steps": 110, "total_steps": 930, "loss": 2.9456, "learning_rate": 4.829381421141671e-05, "epoch": 3.52, "percentage": 11.83, "elapsed_time": "1:28:47", "remaining_time": "11:01:50", "throughput": "24.74", "total_tokens": 131808} {"current_steps": 115, "total_steps": 930, "loss": 2.8505, "learning_rate": 4.8137179979088995e-05, "epoch": 3.68, "percentage": 12.37, "elapsed_time": "1:33:18", "remaining_time": "11:01:18", "throughput": "24.61", "total_tokens": 137792} {"current_steps": 120, "total_steps": 930, "loss": 3.0044, "learning_rate": 4.7973945290505766e-05, "epoch": 3.84, "percentage": 12.9, "elapsed_time": "1:37:51", "remaining_time": "11:00:32", "throughput": "24.58", "total_tokens": 144336} {"current_steps": 125, "total_steps": 930, "loss": 3.0709, "learning_rate": 4.780415671242334e-05, "epoch": 4.0, "percentage": 13.44, "elapsed_time": "1:42:25", "remaining_time": "10:59:34", "throughput": "24.46", "total_tokens": 150336} {"current_steps": 130, "total_steps": 930, "loss": 2.912, "learning_rate": 4.7627862681258037e-05, "epoch": 4.16, "percentage": 13.98, "elapsed_time": "1:46:57", "remaining_time": "10:58:15", "throughput": "24.43", "total_tokens": 156768} {"current_steps": 135, "total_steps": 930, "loss": 2.8063, "learning_rate": 4.7445113489268544e-05, "epoch": 4.32, "percentage": 14.52, "elapsed_time": "1:51:34", "remaining_time": "10:57:06", "throughput": "24.38", "total_tokens": 163232} {"current_steps": 140, "total_steps": 930, "loss": 2.7714, "learning_rate": 4.725596127020879e-05, "epoch": 4.48, "percentage": 15.05, "elapsed_time": "1:56:09", "remaining_time": "10:55:25", "throughput": "24.34", "total_tokens": 169616} {"current_steps": 145, "total_steps": 930, "loss": 2.8277, "learning_rate": 4.706045998445548e-05, "epoch": 4.64, "percentage": 15.59, "elapsed_time": "2:00:37", "remaining_time": "10:53:00", "throughput": "24.27", "total_tokens": 175664} {"current_steps": 150, "total_steps": 930, "loss": 2.7456, "learning_rate": 4.685866540361456e-05, "epoch": 4.8, "percentage": 16.13, "elapsed_time": "2:05:19", "remaining_time": "10:51:42", "throughput": "24.10", "total_tokens": 181232} {"current_steps": 155, "total_steps": 930, "loss": 2.7187, "learning_rate": 4.665063509461097e-05, "epoch": 4.96, "percentage": 16.67, "elapsed_time": "2:09:46", "remaining_time": "10:48:51", "throughput": "24.01", "total_tokens": 186960} {"current_steps": 160, "total_steps": 930, "loss": 2.7918, "learning_rate": 4.643642840326627e-05, "epoch": 5.12, "percentage": 17.2, "elapsed_time": "2:14:12", "remaining_time": "10:45:53", "throughput": "23.92", "total_tokens": 192640} {"current_steps": 165, "total_steps": 930, "loss": 2.6223, "learning_rate": 4.621610643736878e-05, "epoch": 5.28, "percentage": 17.74, "elapsed_time": "2:18:38", "remaining_time": "10:42:47", "throughput": "23.88", "total_tokens": 198672} {"current_steps": 170, "total_steps": 930, "loss": 2.654, "learning_rate": 4.598973204924097e-05, "epoch": 5.44, "percentage": 18.28, "elapsed_time": "2:31:07", "remaining_time": "11:15:38", "throughput": "22.60", "total_tokens": 204976} {"current_steps": 175, "total_steps": 930, "loss": 2.7321, "learning_rate": 4.5757369817809415e-05, "epoch": 5.6, "percentage": 18.82, "elapsed_time": "2:35:33", "remaining_time": "11:11:07", "throughput": "22.62", "total_tokens": 211168} {"current_steps": 180, "total_steps": 930, "loss": 2.71, "learning_rate": 4.551908603018191e-05, "epoch": 5.76, "percentage": 19.35, "elapsed_time": "2:39:57", "remaining_time": "11:06:27", "throughput": "22.62", "total_tokens": 217072} {"current_steps": 185, "total_steps": 930, "loss": 2.7663, "learning_rate": 4.527494866273753e-05, "epoch": 5.92, "percentage": 19.89, "elapsed_time": "2:44:21", "remaining_time": "11:01:51", "throughput": "22.63", "total_tokens": 223136} {"current_steps": 190, "total_steps": 930, "loss": 2.4595, "learning_rate": 4.502502736173462e-05, "epoch": 6.08, "percentage": 20.43, "elapsed_time": "2:48:42", "remaining_time": "10:57:04", "throughput": "22.63", "total_tokens": 229088} {"current_steps": 195, "total_steps": 930, "loss": 2.5734, "learning_rate": 4.476939342344246e-05, "epoch": 6.24, "percentage": 20.97, "elapsed_time": "2:53:09", "remaining_time": "10:52:40", "throughput": "22.64", "total_tokens": 235184} {"current_steps": 200, "total_steps": 930, "loss": 2.3804, "learning_rate": 4.45081197738023e-05, "epoch": 6.4, "percentage": 21.51, "elapsed_time": "2:57:33", "remaining_time": "10:48:04", "throughput": "22.64", "total_tokens": 241152} {"current_steps": 205, "total_steps": 930, "loss": 2.4395, "learning_rate": 4.424128094762331e-05, "epoch": 6.5600000000000005, "percentage": 22.04, "elapsed_time": "3:01:59", "remaining_time": "10:43:36", "throughput": "22.63", "total_tokens": 247136} {"current_steps": 210, "total_steps": 930, "loss": 2.3477, "learning_rate": 4.3968953067319777e-05, "epoch": 6.72, "percentage": 22.58, "elapsed_time": "3:06:22", "remaining_time": "10:38:59", "throughput": "22.65", "total_tokens": 253232} {"current_steps": 215, "total_steps": 930, "loss": 2.5377, "learning_rate": 4.369121382119523e-05, "epoch": 6.88, "percentage": 23.12, "elapsed_time": "3:10:44", "remaining_time": "10:34:20", "throughput": "22.63", "total_tokens": 258992} {"current_steps": 220, "total_steps": 930, "loss": 2.5576, "learning_rate": 4.340814244127993e-05, "epoch": 7.04, "percentage": 23.66, "elapsed_time": "3:15:06", "remaining_time": "10:29:39", "throughput": "22.67", "total_tokens": 265392} {"current_steps": 225, "total_steps": 930, "loss": 2.2721, "learning_rate": 4.3119819680728e-05, "epoch": 7.2, "percentage": 24.19, "elapsed_time": "3:19:29", "remaining_time": "10:25:05", "throughput": "22.67", "total_tokens": 271344} {"current_steps": 230, "total_steps": 930, "loss": 2.4025, "learning_rate": 4.282632779078051e-05, "epoch": 7.36, "percentage": 24.73, "elapsed_time": "3:23:50", "remaining_time": "10:20:22", "throughput": "22.66", "total_tokens": 277120} {"current_steps": 235, "total_steps": 930, "loss": 2.2175, "learning_rate": 4.2527750497301323e-05, "epoch": 7.52, "percentage": 25.27, "elapsed_time": "3:28:12", "remaining_time": "10:15:45", "throughput": "22.67", "total_tokens": 283152} {"current_steps": 240, "total_steps": 930, "loss": 2.1803, "learning_rate": 4.222417297689217e-05, "epoch": 7.68, "percentage": 25.81, "elapsed_time": "3:49:47", "remaining_time": "11:00:38", "throughput": "20.97", "total_tokens": 289136} {"current_steps": 245, "total_steps": 930, "loss": 2.4197, "learning_rate": 4.191568183259394e-05, "epoch": 7.84, "percentage": 26.34, "elapsed_time": "3:54:09", "remaining_time": "10:54:40", "throughput": "21.07", "total_tokens": 295968} {"current_steps": 250, "total_steps": 930, "loss": 2.2351, "learning_rate": 4.160236506918098e-05, "epoch": 8.0, "percentage": 26.88, "elapsed_time": "3:58:32", "remaining_time": "10:48:49", "throughput": "21.06", "total_tokens": 301472} {"current_steps": 255, "total_steps": 930, "loss": 2.1748, "learning_rate": 4.128431206805557e-05, "epoch": 8.16, "percentage": 27.42, "elapsed_time": "4:02:54", "remaining_time": "10:42:59", "throughput": "21.08", "total_tokens": 307216} {"current_steps": 260, "total_steps": 930, "loss": 2.1173, "learning_rate": 4.096161356174959e-05, "epoch": 8.32, "percentage": 27.96, "elapsed_time": "4:07:18", "remaining_time": "10:37:18", "throughput": "21.12", "total_tokens": 313424} {"current_steps": 265, "total_steps": 930, "loss": 2.0966, "learning_rate": 4.063436160804092e-05, "epoch": 8.48, "percentage": 28.49, "elapsed_time": "4:11:42", "remaining_time": "10:31:39", "throughput": "21.15", "total_tokens": 319472} {"current_steps": 270, "total_steps": 930, "loss": 2.0825, "learning_rate": 4.030264956369157e-05, "epoch": 8.64, "percentage": 29.03, "elapsed_time": "4:16:15", "remaining_time": "10:26:23", "throughput": "21.17", "total_tokens": 325504} {"current_steps": 275, "total_steps": 930, "loss": 2.0189, "learning_rate": 3.9966572057815373e-05, "epoch": 8.8, "percentage": 29.57, "elapsed_time": "4:20:46", "remaining_time": "10:21:07", "throughput": "21.19", "total_tokens": 331520} {"current_steps": 280, "total_steps": 930, "loss": 2.0671, "learning_rate": 3.962622496488269e-05, "epoch": 8.96, "percentage": 30.11, "elapsed_time": "4:25:15", "remaining_time": "10:15:47", "throughput": "21.22", "total_tokens": 337680} {"current_steps": 285, "total_steps": 930, "loss": 2.0337, "learning_rate": 3.928170537736981e-05, "epoch": 9.12, "percentage": 30.65, "elapsed_time": "4:29:47", "remaining_time": "10:10:34", "throughput": "21.25", "total_tokens": 343936} {"current_steps": 290, "total_steps": 930, "loss": 1.7892, "learning_rate": 3.893311157806091e-05, "epoch": 9.28, "percentage": 31.18, "elapsed_time": "4:34:17", "remaining_time": "10:05:19", "throughput": "21.24", "total_tokens": 349632} {"current_steps": 295, "total_steps": 930, "loss": 1.8558, "learning_rate": 3.858054301201047e-05, "epoch": 9.44, "percentage": 31.72, "elapsed_time": "4:38:51", "remaining_time": "10:00:15", "throughput": "21.28", "total_tokens": 356080} {"current_steps": 300, "total_steps": 930, "loss": 1.9685, "learning_rate": 3.822410025817406e-05, "epoch": 9.6, "percentage": 32.26, "elapsed_time": "4:43:23", "remaining_time": "9:55:07", "throughput": "21.29", "total_tokens": 362048} {"current_steps": 305, "total_steps": 930, "loss": 1.6883, "learning_rate": 3.786388500071572e-05, "epoch": 9.76, "percentage": 32.8, "elapsed_time": "4:47:57", "remaining_time": "9:50:05", "throughput": "21.31", "total_tokens": 368128} {"current_steps": 310, "total_steps": 930, "loss": 1.8049, "learning_rate": 3.7500000000000003e-05, "epoch": 9.92, "percentage": 33.33, "elapsed_time": "4:52:27", "remaining_time": "9:44:55", "throughput": "21.31", "total_tokens": 373920} {"current_steps": 315, "total_steps": 930, "loss": 1.8785, "learning_rate": 3.713254906327703e-05, "epoch": 10.08, "percentage": 33.87, "elapsed_time": "4:56:56", "remaining_time": "9:39:45", "throughput": "21.32", "total_tokens": 379920} {"current_steps": 320, "total_steps": 930, "loss": 1.8797, "learning_rate": 3.67616370150689e-05, "epoch": 10.24, "percentage": 34.41, "elapsed_time": "5:01:29", "remaining_time": "9:34:42", "throughput": "21.36", "total_tokens": 386464} {"current_steps": 325, "total_steps": 930, "loss": 1.6139, "learning_rate": 3.638736966726585e-05, "epoch": 10.4, "percentage": 34.95, "elapsed_time": "5:06:04", "remaining_time": "9:29:45", "throughput": "21.38", "total_tokens": 392608} {"current_steps": 330, "total_steps": 930, "loss": 1.4428, "learning_rate": 3.600985378894086e-05, "epoch": 10.56, "percentage": 35.48, "elapsed_time": "5:10:33", "remaining_time": "9:24:39", "throughput": "21.37", "total_tokens": 398224} {"current_steps": 335, "total_steps": 930, "loss": 1.6858, "learning_rate": 3.562919707589102e-05, "epoch": 10.72, "percentage": 36.02, "elapsed_time": "5:15:06", "remaining_time": "9:19:40", "throughput": "21.39", "total_tokens": 404480} {"current_steps": 340, "total_steps": 930, "loss": 1.5669, "learning_rate": 3.5245508119914687e-05, "epoch": 10.88, "percentage": 36.56, "elapsed_time": "5:19:38", "remaining_time": "9:14:39", "throughput": "21.40", "total_tokens": 410448} {"current_steps": 345, "total_steps": 930, "loss": 1.5857, "learning_rate": 3.4858896377832966e-05, "epoch": 11.04, "percentage": 37.1, "elapsed_time": "5:24:11", "remaining_time": "9:09:42", "throughput": "21.41", "total_tokens": 416544} {"current_steps": 350, "total_steps": 930, "loss": 1.4511, "learning_rate": 3.44694721402644e-05, "epoch": 11.2, "percentage": 37.63, "elapsed_time": "5:28:39", "remaining_time": "9:04:38", "throughput": "21.40", "total_tokens": 422032} {"current_steps": 355, "total_steps": 930, "loss": 1.4448, "learning_rate": 3.407734650016187e-05, "epoch": 11.36, "percentage": 38.17, "elapsed_time": "5:33:11", "remaining_time": "8:59:40", "throughput": "21.42", "total_tokens": 428224} {"current_steps": 360, "total_steps": 930, "loss": 1.4648, "learning_rate": 3.3682631321120504e-05, "epoch": 11.52, "percentage": 38.71, "elapsed_time": "5:37:43", "remaining_time": "8:54:44", "throughput": "21.44", "total_tokens": 434368} {"current_steps": 365, "total_steps": 930, "loss": 1.4896, "learning_rate": 3.32854392054659e-05, "epoch": 11.68, "percentage": 39.25, "elapsed_time": "5:42:15", "remaining_time": "8:49:47", "throughput": "21.47", "total_tokens": 440816} {"current_steps": 370, "total_steps": 930, "loss": 1.2713, "learning_rate": 3.2885883462131394e-05, "epoch": 11.84, "percentage": 39.78, "elapsed_time": "5:46:46", "remaining_time": "8:44:51", "throughput": "21.48", "total_tokens": 446992} {"current_steps": 375, "total_steps": 930, "loss": 1.4016, "learning_rate": 3.2484078074333954e-05, "epoch": 12.0, "percentage": 40.32, "elapsed_time": "5:51:17", "remaining_time": "8:39:54", "throughput": "21.49", "total_tokens": 452864} {"current_steps": 380, "total_steps": 930, "loss": 1.1953, "learning_rate": 3.2080137667057595e-05, "epoch": 12.16, "percentage": 40.86, "elapsed_time": "5:55:47", "remaining_time": "8:34:57", "throughput": "21.49", "total_tokens": 458800} {"current_steps": 385, "total_steps": 930, "loss": 1.235, "learning_rate": 3.167417747435379e-05, "epoch": 12.32, "percentage": 41.4, "elapsed_time": "6:00:19", "remaining_time": "8:30:04", "throughput": "21.51", "total_tokens": 465040} {"current_steps": 390, "total_steps": 930, "loss": 1.1375, "learning_rate": 3.126631330646802e-05, "epoch": 12.48, "percentage": 41.94, "elapsed_time": "6:04:49", "remaining_time": "8:25:08", "throughput": "21.50", "total_tokens": 470544} {"current_steps": 395, "total_steps": 930, "loss": 1.1427, "learning_rate": 3.0856661516802054e-05, "epoch": 12.64, "percentage": 42.47, "elapsed_time": "6:09:21", "remaining_time": "8:20:16", "throughput": "21.51", "total_tokens": 476608} {"current_steps": 400, "total_steps": 930, "loss": 1.3749, "learning_rate": 3.0445338968721287e-05, "epoch": 12.8, "percentage": 43.01, "elapsed_time": "6:13:54", "remaining_time": "8:15:26", "throughput": "21.54", "total_tokens": 483136} {"current_steps": 405, "total_steps": 930, "loss": 1.2318, "learning_rate": 3.0032463002216505e-05, "epoch": 12.96, "percentage": 43.55, "elapsed_time": "6:18:23", "remaining_time": "8:10:31", "throughput": "21.53", "total_tokens": 488752} {"current_steps": 410, "total_steps": 930, "loss": 1.0918, "learning_rate": 2.961815140042974e-05, "epoch": 13.12, "percentage": 44.09, "elapsed_time": "6:22:53", "remaining_time": "8:05:37", "throughput": "21.55", "total_tokens": 495040} {"current_steps": 415, "total_steps": 930, "loss": 1.0229, "learning_rate": 2.920252235605371e-05, "epoch": 13.28, "percentage": 44.62, "elapsed_time": "6:27:25", "remaining_time": "8:00:46", "throughput": "21.54", "total_tokens": 500816} {"current_steps": 420, "total_steps": 930, "loss": 0.9925, "learning_rate": 2.878569443761442e-05, "epoch": 13.44, "percentage": 45.16, "elapsed_time": "6:31:53", "remaining_time": "7:55:52", "throughput": "21.53", "total_tokens": 506336} {"current_steps": 425, "total_steps": 930, "loss": 1.05, "learning_rate": 2.836778655564653e-05, "epoch": 13.6, "percentage": 45.7, "elapsed_time": "6:36:27", "remaining_time": "7:51:05", "throughput": "21.56", "total_tokens": 512848} {"current_steps": 430, "total_steps": 930, "loss": 0.9813, "learning_rate": 2.7948917928771158e-05, "epoch": 13.76, "percentage": 46.24, "elapsed_time": "6:40:58", "remaining_time": "7:46:15", "throughput": "21.57", "total_tokens": 519024} {"current_steps": 435, "total_steps": 930, "loss": 1.1116, "learning_rate": 2.7529208049685807e-05, "epoch": 13.92, "percentage": 46.77, "elapsed_time": "6:45:31", "remaining_time": "7:41:27", "throughput": "21.60", "total_tokens": 525536} {"current_steps": 440, "total_steps": 930, "loss": 0.9063, "learning_rate": 2.7108776651076118e-05, "epoch": 14.08, "percentage": 47.31, "elapsed_time": "6:50:02", "remaining_time": "7:36:38", "throughput": "21.59", "total_tokens": 531200} {"current_steps": 445, "total_steps": 930, "loss": 0.8812, "learning_rate": 2.668774367145913e-05, "epoch": 14.24, "percentage": 47.85, "elapsed_time": "6:54:32", "remaining_time": "7:31:48", "throughput": "21.60", "total_tokens": 537232} {"current_steps": 450, "total_steps": 930, "loss": 0.7509, "learning_rate": 2.6266229220967818e-05, "epoch": 14.4, "percentage": 48.39, "elapsed_time": "6:59:01", "remaining_time": "7:26:57", "throughput": "21.60", "total_tokens": 543120} {"current_steps": 455, "total_steps": 930, "loss": 1.0827, "learning_rate": 2.584435354708671e-05, "epoch": 14.56, "percentage": 48.92, "elapsed_time": "7:03:31", "remaining_time": "7:22:08", "throughput": "21.62", "total_tokens": 549312} {"current_steps": 460, "total_steps": 930, "loss": 0.8113, "learning_rate": 2.5422237000348276e-05, "epoch": 14.72, "percentage": 49.46, "elapsed_time": "7:08:02", "remaining_time": "7:17:20", "throughput": "21.63", "total_tokens": 555408} {"current_steps": 465, "total_steps": 930, "loss": 0.8095, "learning_rate": 2.5e-05, "epoch": 14.88, "percentage": 50.0, "elapsed_time": "7:12:31", "remaining_time": "7:12:31", "throughput": "21.64", "total_tokens": 561648} {"current_steps": 470, "total_steps": 930, "loss": 0.9768, "learning_rate": 2.4577762999651726e-05, "epoch": 15.04, "percentage": 50.54, "elapsed_time": "7:17:03", "remaining_time": "7:07:45", "throughput": "21.66", "total_tokens": 568048} {"current_steps": 475, "total_steps": 930, "loss": 0.8017, "learning_rate": 2.4155646452913296e-05, "epoch": 15.2, "percentage": 51.08, "elapsed_time": "7:21:35", "remaining_time": "7:02:59", "throughput": "21.68", "total_tokens": 574352} {"current_steps": 480, "total_steps": 930, "loss": 0.8299, "learning_rate": 2.3733770779032184e-05, "epoch": 15.36, "percentage": 51.61, "elapsed_time": "7:26:05", "remaining_time": "6:58:12", "throughput": "21.68", "total_tokens": 580160} {"current_steps": 485, "total_steps": 930, "loss": 0.581, "learning_rate": 2.331225632854087e-05, "epoch": 15.52, "percentage": 52.15, "elapsed_time": "7:30:35", "remaining_time": "6:53:25", "throughput": "21.67", "total_tokens": 585952} {"current_steps": 490, "total_steps": 930, "loss": 0.6687, "learning_rate": 2.2891223348923884e-05, "epoch": 15.68, "percentage": 52.69, "elapsed_time": "7:35:04", "remaining_time": "6:48:38", "throughput": "21.68", "total_tokens": 591968} {"current_steps": 495, "total_steps": 930, "loss": 0.8088, "learning_rate": 2.24707919503142e-05, "epoch": 15.84, "percentage": 53.23, "elapsed_time": "7:39:35", "remaining_time": "6:43:52", "throughput": "21.69", "total_tokens": 598128} {"current_steps": 500, "total_steps": 930, "loss": 0.8223, "learning_rate": 2.2051082071228854e-05, "epoch": 16.0, "percentage": 53.76, "elapsed_time": "7:44:04", "remaining_time": "6:39:05", "throughput": "21.70", "total_tokens": 604192} {"current_steps": 505, "total_steps": 930, "loss": 0.5949, "learning_rate": 2.1632213444353482e-05, "epoch": 16.16, "percentage": 54.3, "elapsed_time": "7:48:35", "remaining_time": "6:34:21", "throughput": "21.69", "total_tokens": 609872} {"current_steps": 510, "total_steps": 930, "loss": 0.705, "learning_rate": 2.1214305562385592e-05, "epoch": 16.32, "percentage": 54.84, "elapsed_time": "7:53:04", "remaining_time": "6:29:35", "throughput": "21.69", "total_tokens": 615584} {"current_steps": 515, "total_steps": 930, "loss": 0.3912, "learning_rate": 2.07974776439463e-05, "epoch": 16.48, "percentage": 55.38, "elapsed_time": "8:08:54", "remaining_time": "6:33:58", "throughput": "21.19", "total_tokens": 621536} {"current_steps": 520, "total_steps": 930, "loss": 0.6312, "learning_rate": 2.0381848599570276e-05, "epoch": 16.64, "percentage": 55.91, "elapsed_time": "8:13:16", "remaining_time": "6:28:55", "throughput": "21.21", "total_tokens": 627616} {"current_steps": 525, "total_steps": 930, "loss": 0.8473, "learning_rate": 1.9967536997783494e-05, "epoch": 16.8, "percentage": 56.45, "elapsed_time": "8:17:42", "remaining_time": "6:23:56", "throughput": "21.23", "total_tokens": 633952} {"current_steps": 530, "total_steps": 930, "loss": 0.7956, "learning_rate": 1.9554661031278712e-05, "epoch": 16.96, "percentage": 56.99, "elapsed_time": "8:22:05", "remaining_time": "6:18:56", "throughput": "21.27", "total_tokens": 640720} {"current_steps": 535, "total_steps": 930, "loss": 0.6384, "learning_rate": 1.914333848319795e-05, "epoch": 17.12, "percentage": 57.53, "elapsed_time": "8:26:27", "remaining_time": "6:13:55", "throughput": "21.29", "total_tokens": 646976} {"current_steps": 540, "total_steps": 930, "loss": 0.4768, "learning_rate": 1.8733686693531985e-05, "epoch": 17.28, "percentage": 58.06, "elapsed_time": "8:30:49", "remaining_time": "6:08:56", "throughput": "21.31", "total_tokens": 653296} {"current_steps": 545, "total_steps": 930, "loss": 0.6033, "learning_rate": 1.8325822525646208e-05, "epoch": 17.44, "percentage": 58.6, "elapsed_time": "8:35:12", "remaining_time": "6:03:57", "throughput": "21.33", "total_tokens": 659232} {"current_steps": 550, "total_steps": 930, "loss": 0.549, "learning_rate": 1.79198623329424e-05, "epoch": 17.6, "percentage": 59.14, "elapsed_time": "8:39:35", "remaining_time": "5:58:59", "throughput": "21.34", "total_tokens": 665248} {"current_steps": 555, "total_steps": 930, "loss": 0.5032, "learning_rate": 1.7515921925666052e-05, "epoch": 17.76, "percentage": 59.68, "elapsed_time": "8:43:55", "remaining_time": "5:54:00", "throughput": "21.35", "total_tokens": 671104} {"current_steps": 560, "total_steps": 930, "loss": 0.524, "learning_rate": 1.711411653786861e-05, "epoch": 17.92, "percentage": 60.22, "elapsed_time": "8:48:17", "remaining_time": "5:49:02", "throughput": "21.35", "total_tokens": 676720} {"current_steps": 565, "total_steps": 930, "loss": 0.5206, "learning_rate": 1.6714560794534108e-05, "epoch": 18.08, "percentage": 60.75, "elapsed_time": "8:52:52", "remaining_time": "5:44:14", "throughput": "21.37", "total_tokens": 683104} {"current_steps": 570, "total_steps": 930, "loss": 0.4662, "learning_rate": 1.6317368678879495e-05, "epoch": 18.24, "percentage": 61.29, "elapsed_time": "8:57:56", "remaining_time": "5:39:44", "throughput": "21.34", "total_tokens": 688928} {"current_steps": 575, "total_steps": 930, "loss": 0.5093, "learning_rate": 1.5922653499838137e-05, "epoch": 18.4, "percentage": 61.83, "elapsed_time": "9:03:03", "remaining_time": "5:35:16", "throughput": "21.33", "total_tokens": 695072} {"current_steps": 580, "total_steps": 930, "loss": 0.5162, "learning_rate": 1.55305278597356e-05, "epoch": 18.56, "percentage": 62.37, "elapsed_time": "9:07:38", "remaining_time": "5:30:28", "throughput": "21.34", "total_tokens": 701248} {"current_steps": 585, "total_steps": 930, "loss": 0.5355, "learning_rate": 1.5141103622167041e-05, "epoch": 18.72, "percentage": 62.9, "elapsed_time": "9:12:09", "remaining_time": "5:25:37", "throughput": "21.35", "total_tokens": 707296} {"current_steps": 590, "total_steps": 930, "loss": 0.3836, "learning_rate": 1.475449188008532e-05, "epoch": 18.88, "percentage": 63.44, "elapsed_time": "9:16:42", "remaining_time": "5:20:48", "throughput": "21.35", "total_tokens": 713120} {"current_steps": 595, "total_steps": 930, "loss": 0.519, "learning_rate": 1.437080292410899e-05, "epoch": 19.04, "percentage": 63.98, "elapsed_time": "9:21:13", "remaining_time": "5:15:58", "throughput": "21.37", "total_tokens": 719664} {"current_steps": 600, "total_steps": 930, "loss": 0.4391, "learning_rate": 1.399014621105914e-05, "epoch": 19.2, "percentage": 64.52, "elapsed_time": "9:25:35", "remaining_time": "5:11:04", "throughput": "21.40", "total_tokens": 726224} {"current_steps": 605, "total_steps": 930, "loss": 0.4404, "learning_rate": 1.361263033273415e-05, "epoch": 19.36, "percentage": 65.05, "elapsed_time": "9:29:58", "remaining_time": "5:06:11", "throughput": "21.41", "total_tokens": 732144} {"current_steps": 610, "total_steps": 930, "loss": 0.3758, "learning_rate": 1.3238362984931113e-05, "epoch": 19.52, "percentage": 65.59, "elapsed_time": "9:34:18", "remaining_time": "5:01:16", "throughput": "21.41", "total_tokens": 737824} {"current_steps": 615, "total_steps": 930, "loss": 0.483, "learning_rate": 1.286745093672298e-05, "epoch": 19.68, "percentage": 66.13, "elapsed_time": "9:38:42", "remaining_time": "4:56:24", "throughput": "21.43", "total_tokens": 743984} {"current_steps": 620, "total_steps": 930, "loss": 0.4637, "learning_rate": 1.2500000000000006e-05, "epoch": 19.84, "percentage": 66.67, "elapsed_time": "9:43:05", "remaining_time": "4:51:32", "throughput": "21.44", "total_tokens": 750016} {"current_steps": 625, "total_steps": 930, "loss": 0.4252, "learning_rate": 1.2136114999284288e-05, "epoch": 20.0, "percentage": 67.2, "elapsed_time": "9:47:28", "remaining_time": "4:46:41", "throughput": "21.45", "total_tokens": 756160} {"current_steps": 630, "total_steps": 930, "loss": 0.3591, "learning_rate": 1.1775899741825947e-05, "epoch": 20.16, "percentage": 67.74, "elapsed_time": "9:51:51", "remaining_time": "4:41:50", "throughput": "21.47", "total_tokens": 762576} {"current_steps": 635, "total_steps": 930, "loss": 0.5274, "learning_rate": 1.141945698798954e-05, "epoch": 20.32, "percentage": 68.28, "elapsed_time": "9:56:13", "remaining_time": "4:36:59", "throughput": "21.49", "total_tokens": 768768} {"current_steps": 640, "total_steps": 930, "loss": 0.4133, "learning_rate": 1.1066888421939093e-05, "epoch": 20.48, "percentage": 68.82, "elapsed_time": "10:00:33", "remaining_time": "4:32:07", "throughput": "21.49", "total_tokens": 774480} {"current_steps": 645, "total_steps": 930, "loss": 0.274, "learning_rate": 1.0718294622630188e-05, "epoch": 20.64, "percentage": 69.35, "elapsed_time": "10:04:58", "remaining_time": "4:27:18", "throughput": "21.50", "total_tokens": 780368} {"current_steps": 650, "total_steps": 930, "loss": 0.3506, "learning_rate": 1.0373775035117305e-05, "epoch": 20.8, "percentage": 69.89, "elapsed_time": "10:09:22", "remaining_time": "4:22:30", "throughput": "21.51", "total_tokens": 786368} {"current_steps": 655, "total_steps": 930, "loss": 0.3099, "learning_rate": 1.0033427942184622e-05, "epoch": 20.96, "percentage": 70.43, "elapsed_time": "10:13:43", "remaining_time": "4:17:40", "throughput": "21.52", "total_tokens": 792304} {"current_steps": 660, "total_steps": 930, "loss": 0.409, "learning_rate": 9.697350436308427e-06, "epoch": 21.12, "percentage": 70.97, "elapsed_time": "10:18:05", "remaining_time": "4:12:51", "throughput": "21.53", "total_tokens": 798464} {"current_steps": 665, "total_steps": 930, "loss": 0.4555, "learning_rate": 9.36563839195908e-06, "epoch": 21.28, "percentage": 71.51, "elapsed_time": "10:22:27", "remaining_time": "4:08:02", "throughput": "21.56", "total_tokens": 805152} {"current_steps": 670, "total_steps": 930, "loss": 0.3132, "learning_rate": 9.038386438250415e-06, "epoch": 21.44, "percentage": 72.04, "elapsed_time": "10:27:01", "remaining_time": "4:03:19", "throughput": "21.55", "total_tokens": 810848} {"current_steps": 675, "total_steps": 930, "loss": 0.2986, "learning_rate": 8.715687931944449e-06, "epoch": 21.6, "percentage": 72.58, "elapsed_time": "10:31:38", "remaining_time": "3:58:37", "throughput": "21.55", "total_tokens": 816704} {"current_steps": 680, "total_steps": 930, "loss": 0.3246, "learning_rate": 8.397634930819021e-06, "epoch": 21.76, "percentage": 73.12, "elapsed_time": "10:36:15", "remaining_time": "3:53:55", "throughput": "21.54", "total_tokens": 822272} {"current_steps": 685, "total_steps": 930, "loss": 0.349, "learning_rate": 8.084318167406066e-06, "epoch": 21.92, "percentage": 73.66, "elapsed_time": "10:40:53", "remaining_time": "3:49:13", "throughput": "21.54", "total_tokens": 828256} {"current_steps": 690, "total_steps": 930, "loss": 0.2495, "learning_rate": 7.775827023107838e-06, "epoch": 22.08, "percentage": 74.19, "elapsed_time": "10:45:33", "remaining_time": "3:44:32", "throughput": "21.55", "total_tokens": 834672} {"current_steps": 695, "total_steps": 930, "loss": 0.4472, "learning_rate": 7.472249502698686e-06, "epoch": 22.24, "percentage": 74.73, "elapsed_time": "10:50:19", "remaining_time": "3:39:53", "throughput": "21.56", "total_tokens": 841184} {"current_steps": 700, "total_steps": 930, "loss": 0.2427, "learning_rate": 7.173672209219495e-06, "epoch": 22.4, "percentage": 75.27, "elapsed_time": "10:54:53", "remaining_time": "3:35:10", "throughput": "21.56", "total_tokens": 847104} {"current_steps": 705, "total_steps": 930, "loss": 0.2333, "learning_rate": 6.880180319272006e-06, "epoch": 22.56, "percentage": 75.81, "elapsed_time": "10:59:25", "remaining_time": "3:30:27", "throughput": "21.56", "total_tokens": 853040} {"current_steps": 710, "total_steps": 930, "loss": 0.3539, "learning_rate": 6.591857558720071e-06, "epoch": 22.72, "percentage": 76.34, "elapsed_time": "11:03:55", "remaining_time": "3:25:43", "throughput": "21.56", "total_tokens": 859040} {"current_steps": 715, "total_steps": 930, "loss": 0.3516, "learning_rate": 6.308786178804782e-06, "epoch": 22.88, "percentage": 76.88, "elapsed_time": "11:08:28", "remaining_time": "3:21:00", "throughput": "21.57", "total_tokens": 865168} {"current_steps": 720, "total_steps": 930, "loss": 0.2574, "learning_rate": 6.031046932680226e-06, "epoch": 23.04, "percentage": 77.42, "elapsed_time": "11:12:55", "remaining_time": "3:16:16", "throughput": "21.56", "total_tokens": 870624} {"current_steps": 725, "total_steps": 930, "loss": 0.2764, "learning_rate": 5.758719052376693e-06, "epoch": 23.2, "percentage": 77.96, "elapsed_time": "11:17:18", "remaining_time": "3:11:30", "throughput": "21.56", "total_tokens": 876288} {"current_steps": 730, "total_steps": 930, "loss": 0.2085, "learning_rate": 5.491880226197707e-06, "epoch": 23.36, "percentage": 78.49, "elapsed_time": "11:21:42", "remaining_time": "3:06:46", "throughput": "21.56", "total_tokens": 881968} {"current_steps": 735, "total_steps": 930, "loss": 0.2651, "learning_rate": 5.23060657655754e-06, "epoch": 23.52, "percentage": 79.03, "elapsed_time": "11:26:07", "remaining_time": "3:02:01", "throughput": "21.58", "total_tokens": 888496} {"current_steps": 740, "total_steps": 930, "loss": 0.3042, "learning_rate": 4.9749726382653905e-06, "epoch": 23.68, "percentage": 79.57, "elapsed_time": "11:30:29", "remaining_time": "2:57:17", "throughput": "21.60", "total_tokens": 894880} {"current_steps": 745, "total_steps": 930, "loss": 0.334, "learning_rate": 4.725051337262476e-06, "epoch": 23.84, "percentage": 80.11, "elapsed_time": "11:34:50", "remaining_time": "2:52:32", "throughput": "21.60", "total_tokens": 900624} {"current_steps": 750, "total_steps": 930, "loss": 0.382, "learning_rate": 4.480913969818098e-06, "epoch": 24.0, "percentage": 80.65, "elapsed_time": "11:39:13", "remaining_time": "2:47:48", "throughput": "21.62", "total_tokens": 906880} {"current_steps": 755, "total_steps": 930, "loss": 0.2669, "learning_rate": 4.242630182190594e-06, "epoch": 24.16, "percentage": 81.18, "elapsed_time": "11:43:38", "remaining_time": "2:43:05", "throughput": "21.64", "total_tokens": 913472} {"current_steps": 760, "total_steps": 930, "loss": 0.2149, "learning_rate": 4.010267950759025e-06, "epoch": 24.32, "percentage": 81.72, "elapsed_time": "11:48:02", "remaining_time": "2:38:22", "throughput": "21.64", "total_tokens": 919360} {"current_steps": 765, "total_steps": 930, "loss": 0.2215, "learning_rate": 3.7838935626312242e-06, "epoch": 24.48, "percentage": 82.26, "elapsed_time": "11:52:26", "remaining_time": "2:33:39", "throughput": "21.64", "total_tokens": 924928} {"current_steps": 770, "total_steps": 930, "loss": 0.2804, "learning_rate": 3.5635715967337223e-06, "epoch": 24.64, "percentage": 82.8, "elapsed_time": "11:56:56", "remaining_time": "2:28:58", "throughput": "21.64", "total_tokens": 930816} {"current_steps": 775, "total_steps": 930, "loss": 0.348, "learning_rate": 3.3493649053890326e-06, "epoch": 24.8, "percentage": 83.33, "elapsed_time": "12:01:26", "remaining_time": "2:24:17", "throughput": "21.65", "total_tokens": 937088} {"current_steps": 780, "total_steps": 930, "loss": 0.3526, "learning_rate": 3.141334596385448e-06, "epoch": 24.96, "percentage": 83.87, "elapsed_time": "12:05:57", "remaining_time": "2:19:36", "throughput": "21.66", "total_tokens": 943536} {"current_steps": 785, "total_steps": 930, "loss": 0.1965, "learning_rate": 2.939540015544523e-06, "epoch": 25.12, "percentage": 84.41, "elapsed_time": "12:10:27", "remaining_time": "2:14:55", "throughput": "21.66", "total_tokens": 949360} {"current_steps": 790, "total_steps": 930, "loss": 0.2734, "learning_rate": 2.7440387297912123e-06, "epoch": 25.28, "percentage": 84.95, "elapsed_time": "12:14:58", "remaining_time": "2:10:14", "throughput": "21.68", "total_tokens": 955952} {"current_steps": 795, "total_steps": 930, "loss": 0.2059, "learning_rate": 2.5548865107314607e-06, "epoch": 25.44, "percentage": 85.48, "elapsed_time": "12:56:47", "remaining_time": "2:11:54", "throughput": "20.63", "total_tokens": 961696} {"current_steps": 800, "total_steps": 930, "loss": 0.1972, "learning_rate": 2.372137318741968e-06, "epoch": 25.6, "percentage": 86.02, "elapsed_time": "13:22:16", "remaining_time": "2:10:22", "throughput": "20.10", "total_tokens": 967456} {"current_steps": 805, "total_steps": 930, "loss": 0.3095, "learning_rate": 2.1958432875766653e-06, "epoch": 25.76, "percentage": 86.56, "elapsed_time": "21:18:32", "remaining_time": "3:18:31", "throughput": "12.70", "total_tokens": 973952} {"current_steps": 810, "total_steps": 930, "loss": 0.3327, "learning_rate": 2.026054709494235e-06, "epoch": 25.92, "percentage": 87.1, "elapsed_time": "21:23:37", "remaining_time": "3:10:10", "throughput": "12.72", "total_tokens": 979792} {"current_steps": 815, "total_steps": 930, "loss": 0.2003, "learning_rate": 1.8628200209110131e-06, "epoch": 26.08, "percentage": 87.63, "elapsed_time": "21:28:43", "remaining_time": "3:01:50", "throughput": "12.75", "total_tokens": 985520} {"current_steps": 820, "total_steps": 930, "loss": 0.2809, "learning_rate": 1.7061857885832893e-06, "epoch": 26.24, "percentage": 88.17, "elapsed_time": "21:33:14", "remaining_time": "2:53:29", "throughput": "12.77", "total_tokens": 991264} {"current_steps": 825, "total_steps": 930, "loss": 0.2132, "learning_rate": 1.5561966963229897e-06, "epoch": 26.4, "percentage": 88.71, "elapsed_time": "21:37:50", "remaining_time": "2:45:10", "throughput": "12.81", "total_tokens": 997520} {"current_steps": 830, "total_steps": 930, "loss": 0.2404, "learning_rate": 1.4128955322504966e-06, "epoch": 26.56, "percentage": 89.25, "elapsed_time": "21:42:23", "remaining_time": "2:36:54", "throughput": "12.84", "total_tokens": 1003344} {"current_steps": 835, "total_steps": 930, "loss": 0.2624, "learning_rate": 1.2763231765882732e-06, "epoch": 26.72, "percentage": 89.78, "elapsed_time": "21:46:59", "remaining_time": "2:28:41", "throughput": "12.88", "total_tokens": 1010128} {"current_steps": 805, "total_steps": 930, "loss": 0.3445, "learning_rate": 2.1958432875766653e-06, "epoch": 25.96, "percentage": 86.56, "elapsed_time": "0:03:21", "remaining_time": "0:00:31", "throughput": "4824.24", "total_tokens": 973440} {"current_steps": 810, "total_steps": 930, "loss": 0.1877, "learning_rate": 2.026054709494235e-06, "epoch": 26.12, "percentage": 87.1, "elapsed_time": "0:06:40", "remaining_time": "0:00:59", "throughput": "2443.86", "total_tokens": 979008} {"current_steps": 815, "total_steps": 930, "loss": 0.2929, "learning_rate": 1.8628200209110131e-06, "epoch": 26.28, "percentage": 87.63, "elapsed_time": "0:10:00", "remaining_time": "0:01:24", "throughput": "1641.00", "total_tokens": 984928} {"current_steps": 820, "total_steps": 930, "loss": 0.2057, "learning_rate": 1.7061857885832893e-06, "epoch": 26.44, "percentage": 88.17, "elapsed_time": "0:13:19", "remaining_time": "0:01:47", "throughput": "1239.87", "total_tokens": 991088} {"current_steps": 825, "total_steps": 930, "loss": 0.2783, "learning_rate": 1.5561966963229897e-06, "epoch": 26.6, "percentage": 88.71, "elapsed_time": "0:16:38", "remaining_time": "0:02:07", "throughput": "998.61", "total_tokens": 997424} {"current_steps": 830, "total_steps": 930, "loss": 0.1953, "learning_rate": 1.4128955322504966e-06, "epoch": 26.76, "percentage": 89.25, "elapsed_time": "0:19:58", "remaining_time": "0:02:24", "throughput": "837.55", "total_tokens": 1003680} {"current_steps": 835, "total_steps": 930, "loss": 0.3187, "learning_rate": 1.2763231765882732e-06, "epoch": 26.92, "percentage": 89.78, "elapsed_time": "0:23:17", "remaining_time": "0:02:39", "throughput": "722.45", "total_tokens": 1009696} {"current_steps": 840, "total_steps": 930, "loss": 0.3491, "learning_rate": 1.1465185899987797e-06, "epoch": 27.08, "percentage": 90.32, "elapsed_time": "0:26:36", "remaining_time": "0:02:51", "throughput": "636.30", "total_tokens": 1015648} {"current_steps": 845, "total_steps": 930, "loss": 0.2368, "learning_rate": 1.023518802469947e-06, "epoch": 27.24, "percentage": 90.86, "elapsed_time": "0:48:01", "remaining_time": "0:04:49", "throughput": "354.57", "total_tokens": 1021664} {"current_steps": 850, "total_steps": 930, "loss": 0.2457, "learning_rate": 9.073589027514789e-07, "epoch": 27.4, "percentage": 91.4, "elapsed_time": "0:51:20", "remaining_time": "0:04:49", "throughput": "333.60", "total_tokens": 1027696} {"current_steps": 855, "total_steps": 930, "loss": 0.3219, "learning_rate": 7.980720283448956e-07, "epoch": 27.56, "percentage": 91.94, "elapsed_time": "0:54:40", "remaining_time": "0:04:47", "throughput": "315.18", "total_tokens": 1033904} {"current_steps": 860, "total_steps": 930, "loss": 0.2515, "learning_rate": 6.956893560502359e-07, "epoch": 27.72, "percentage": 92.47, "elapsed_time": "0:57:59", "remaining_time": "0:04:43", "throughput": "298.82", "total_tokens": 1039888} {"current_steps": 865, "total_steps": 930, "loss": 0.1924, "learning_rate": 6.002400930721186e-07, "epoch": 27.88, "percentage": 93.01, "elapsed_time": "1:01:19", "remaining_time": "0:04:36", "throughput": "284.26", "total_tokens": 1045872} {"current_steps": 870, "total_steps": 930, "loss": 0.2513, "learning_rate": 5.117514686876379e-07, "epoch": 28.04, "percentage": 93.55, "elapsed_time": "1:04:39", "remaining_time": "0:04:27", "throughput": "271.25", "total_tokens": 1052192} {"current_steps": 875, "total_steps": 930, "loss": 0.2095, "learning_rate": 4.302487264785521e-07, "epoch": 28.2, "percentage": 94.09, "elapsed_time": "1:07:58", "remaining_time": "0:04:16", "throughput": "259.50", "total_tokens": 1058272} {"current_steps": 880, "total_steps": 930, "loss": 0.298, "learning_rate": 3.557551171299051e-07, "epoch": 28.36, "percentage": 94.62, "elapsed_time": "1:11:17", "remaining_time": "0:04:03", "throughput": "248.94", "total_tokens": 1064976} {"current_steps": 885, "total_steps": 930, "loss": 0.1964, "learning_rate": 2.8829189179721547e-07, "epoch": 28.52, "percentage": 95.16, "elapsed_time": "1:14:37", "remaining_time": "0:03:47", "throughput": "239.20", "total_tokens": 1070944} {"current_steps": 890, "total_steps": 930, "loss": 0.2523, "learning_rate": 2.27878296044029e-07, "epoch": 28.68, "percentage": 95.7, "elapsed_time": "1:17:56", "remaining_time": "0:03:30", "throughput": "230.25", "total_tokens": 1076656} {"current_steps": 895, "total_steps": 930, "loss": 0.3446, "learning_rate": 1.7453156435165986e-07, "epoch": 28.84, "percentage": 96.24, "elapsed_time": "1:21:15", "remaining_time": "0:03:10", "throughput": "222.12", "total_tokens": 1082896} {"current_steps": 900, "total_steps": 930, "loss": 0.1546, "learning_rate": 1.2826691520262114e-07, "epoch": 29.0, "percentage": 96.77, "elapsed_time": "1:24:33", "remaining_time": "0:02:49", "throughput": "214.55", "total_tokens": 1088576} {"current_steps": 905, "total_steps": 930, "loss": 0.3151, "learning_rate": 8.909754673917525e-08, "epoch": 29.16, "percentage": 97.31, "elapsed_time": "1:27:53", "remaining_time": "0:02:25", "throughput": "207.56", "total_tokens": 1094608} {"current_steps": 910, "total_steps": 930, "loss": 0.1548, "learning_rate": 5.7034632998231865e-08, "epoch": 29.32, "percentage": 97.85, "elapsed_time": "1:33:54", "remaining_time": "0:02:03", "throughput": "195.32", "total_tokens": 1100624} {"current_steps": 915, "total_steps": 930, "loss": 0.2533, "learning_rate": 3.208732072368104e-08, "epoch": 29.48, "percentage": 98.39, "elapsed_time": "1:43:10", "remaining_time": "0:01:41", "throughput": "178.73", "total_tokens": 1106496} {"current_steps": 920, "total_steps": 930, "loss": 0.2537, "learning_rate": 1.4262726757049982e-08, "epoch": 29.64, "percentage": 98.92, "elapsed_time": "1:46:29", "remaining_time": "0:01:09", "throughput": "174.09", "total_tokens": 1112320} {"current_steps": 925, "total_steps": 930, "loss": 0.2689, "learning_rate": 3.565936007254855e-09, "epoch": 29.8, "percentage": 99.46, "elapsed_time": "1:49:47", "remaining_time": "0:00:35", "throughput": "169.74", "total_tokens": 1118128} {"current_steps": 930, "total_steps": 930, "loss": 0.225, "learning_rate": 0.0, "epoch": 29.96, "percentage": 100.0, "elapsed_time": "1:53:06", "remaining_time": "0:00:00", "throughput": "165.72", "total_tokens": 1124640} {"current_steps": 930, "total_steps": 930, "epoch": 29.96, "percentage": 100.0, "elapsed_time": "1:53:06", "remaining_time": "0:00:00", "throughput": "165.71", "total_tokens": 1124640}