diff --git "a/trainer_log.jsonl" "b/trainer_log.jsonl" new file mode 100644--- /dev/null +++ "b/trainer_log.jsonl" @@ -0,0 +1,1755 @@ +{"current_steps": 10, "total_steps": 17540, "loss": 1.6812, "learning_rate": 1.1402508551881415e-07, "epoch": 0.0057000356252226575, "percentage": 0.06, "elapsed_time": "0:02:28", "remaining_time": "3 days, 0:23:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 20, "total_steps": 17540, "loss": 1.6858, "learning_rate": 2.280501710376283e-07, "epoch": 0.011400071250445315, "percentage": 0.11, "elapsed_time": "0:04:54", "remaining_time": "2 days, 23:37:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 30, "total_steps": 17540, "loss": 1.6882, "learning_rate": 3.4207525655644247e-07, "epoch": 0.017100106875667972, "percentage": 0.17, "elapsed_time": "0:07:14", "remaining_time": "2 days, 22:26:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 40, "total_steps": 17540, "loss": 1.684, "learning_rate": 4.561003420752566e-07, "epoch": 0.02280014250089063, "percentage": 0.23, "elapsed_time": "0:09:40", "remaining_time": "2 days, 22:32:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 50, "total_steps": 17540, "loss": 1.6798, "learning_rate": 5.701254275940708e-07, "epoch": 0.028500178126113287, "percentage": 0.29, "elapsed_time": "0:11:59", "remaining_time": "2 days, 21:56:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 60, "total_steps": 17540, "loss": 1.6845, "learning_rate": 6.841505131128849e-07, "epoch": 0.034200213751335945, "percentage": 0.34, "elapsed_time": "0:14:18", "remaining_time": "2 days, 21:28:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 70, "total_steps": 17540, "loss": 1.6805, "learning_rate": 7.98175598631699e-07, "epoch": 0.0399002493765586, "percentage": 0.4, "elapsed_time": "0:16:43", "remaining_time": "2 days, 21:32:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 80, "total_steps": 17540, "loss": 1.6737, "learning_rate": 9.122006841505132e-07, "epoch": 0.04560028500178126, "percentage": 0.46, "elapsed_time": "0:19:08", "remaining_time": "2 days, 21:38:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 90, "total_steps": 17540, "loss": 1.6761, "learning_rate": 1.0262257696693273e-06, "epoch": 0.05130032062700392, "percentage": 0.51, "elapsed_time": "0:21:32", "remaining_time": "2 days, 21:36:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 100, "total_steps": 17540, "loss": 1.672, "learning_rate": 1.1402508551881415e-06, "epoch": 0.057000356252226575, "percentage": 0.57, "elapsed_time": "0:23:50", "remaining_time": "2 days, 21:17:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 110, "total_steps": 17540, "loss": 1.6788, "learning_rate": 1.2542759407069557e-06, "epoch": 0.06270039187744923, "percentage": 0.63, "elapsed_time": "0:26:18", "remaining_time": "2 days, 21:29:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 120, "total_steps": 17540, "loss": 1.6521, "learning_rate": 1.3683010262257699e-06, "epoch": 0.06840042750267189, "percentage": 0.68, "elapsed_time": "0:28:41", "remaining_time": "2 days, 21:24:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 130, "total_steps": 17540, "loss": 1.6542, "learning_rate": 1.4823261117445838e-06, "epoch": 0.07410046312789455, "percentage": 0.74, "elapsed_time": "0:31:03", "remaining_time": "2 days, 21:19:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 140, "total_steps": 17540, "loss": 1.6266, "learning_rate": 1.596351197263398e-06, "epoch": 0.0798004987531172, "percentage": 0.8, "elapsed_time": "0:33:24", "remaining_time": "2 days, 21:13:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 150, "total_steps": 17540, "loss": 1.6018, "learning_rate": 1.7103762827822124e-06, "epoch": 0.08550053437833986, "percentage": 0.86, "elapsed_time": "0:35:45", "remaining_time": "2 days, 21:04:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 160, "total_steps": 17540, "loss": 1.5702, "learning_rate": 1.8244013683010263e-06, "epoch": 0.09120057000356252, "percentage": 0.91, "elapsed_time": "0:38:09", "remaining_time": "2 days, 21:05:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 170, "total_steps": 17540, "loss": 1.568, "learning_rate": 1.9384264538198407e-06, "epoch": 0.09690060562878518, "percentage": 0.97, "elapsed_time": "0:40:32", "remaining_time": "2 days, 21:01:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 180, "total_steps": 17540, "loss": 1.5417, "learning_rate": 2.0524515393386547e-06, "epoch": 0.10260064125400783, "percentage": 1.03, "elapsed_time": "0:42:52", "remaining_time": "2 days, 20:55:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 190, "total_steps": 17540, "loss": 1.5114, "learning_rate": 2.166476624857469e-06, "epoch": 0.10830067687923049, "percentage": 1.08, "elapsed_time": "0:45:13", "remaining_time": "2 days, 20:49:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 200, "total_steps": 17540, "loss": 1.4744, "learning_rate": 2.280501710376283e-06, "epoch": 0.11400071250445315, "percentage": 1.14, "elapsed_time": "0:47:35", "remaining_time": "2 days, 20:46:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 210, "total_steps": 17540, "loss": 1.4864, "learning_rate": 2.394526795895097e-06, "epoch": 0.11970074812967581, "percentage": 1.2, "elapsed_time": "0:49:55", "remaining_time": "2 days, 20:39:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 220, "total_steps": 17540, "loss": 1.4508, "learning_rate": 2.5085518814139114e-06, "epoch": 0.12540078375489846, "percentage": 1.25, "elapsed_time": "0:52:17", "remaining_time": "2 days, 20:36:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 230, "total_steps": 17540, "loss": 1.4298, "learning_rate": 2.6225769669327258e-06, "epoch": 0.13110081938012114, "percentage": 1.31, "elapsed_time": "0:54:43", "remaining_time": "2 days, 20:38:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 240, "total_steps": 17540, "loss": 1.4201, "learning_rate": 2.7366020524515397e-06, "epoch": 0.13680085500534378, "percentage": 1.37, "elapsed_time": "0:57:07", "remaining_time": "2 days, 20:37:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 250, "total_steps": 17540, "loss": 1.4037, "learning_rate": 2.8506271379703537e-06, "epoch": 0.14250089063056645, "percentage": 1.43, "elapsed_time": "0:59:31", "remaining_time": "2 days, 20:36:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 260, "total_steps": 17540, "loss": 1.3977, "learning_rate": 2.9646522234891676e-06, "epoch": 0.1482009262557891, "percentage": 1.48, "elapsed_time": "1:01:57", "remaining_time": "2 days, 20:37:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 270, "total_steps": 17540, "loss": 1.3728, "learning_rate": 3.078677309007982e-06, "epoch": 0.15390096188101177, "percentage": 1.54, "elapsed_time": "1:04:27", "remaining_time": "2 days, 20:43:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 280, "total_steps": 17540, "loss": 1.3524, "learning_rate": 3.192702394526796e-06, "epoch": 0.1596009975062344, "percentage": 1.6, "elapsed_time": "1:06:50", "remaining_time": "2 days, 20:40:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 290, "total_steps": 17540, "loss": 1.3344, "learning_rate": 3.30672748004561e-06, "epoch": 0.16530103313145708, "percentage": 1.65, "elapsed_time": "1:09:14", "remaining_time": "2 days, 20:38:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 300, "total_steps": 17540, "loss": 1.3409, "learning_rate": 3.4207525655644248e-06, "epoch": 0.17100106875667972, "percentage": 1.71, "elapsed_time": "1:11:35", "remaining_time": "2 days, 20:33:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 310, "total_steps": 17540, "loss": 1.3241, "learning_rate": 3.5347776510832387e-06, "epoch": 0.1767011043819024, "percentage": 1.77, "elapsed_time": "1:13:51", "remaining_time": "2 days, 20:24:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 320, "total_steps": 17540, "loss": 1.3017, "learning_rate": 3.6488027366020527e-06, "epoch": 0.18240114000712504, "percentage": 1.82, "elapsed_time": "1:16:20", "remaining_time": "2 days, 20:27:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 330, "total_steps": 17540, "loss": 1.3024, "learning_rate": 3.762827822120867e-06, "epoch": 0.1881011756323477, "percentage": 1.88, "elapsed_time": "1:18:39", "remaining_time": "2 days, 20:22:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 340, "total_steps": 17540, "loss": 1.2862, "learning_rate": 3.8768529076396815e-06, "epoch": 0.19380121125757035, "percentage": 1.94, "elapsed_time": "1:20:58", "remaining_time": "2 days, 20:16:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 350, "total_steps": 17540, "loss": 1.2763, "learning_rate": 3.990877993158495e-06, "epoch": 0.19950124688279303, "percentage": 2.0, "elapsed_time": "1:23:18", "remaining_time": "2 days, 20:11:16", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 360, "total_steps": 17540, "loss": 1.2578, "learning_rate": 4.104903078677309e-06, "epoch": 0.20520128250801567, "percentage": 2.05, "elapsed_time": "1:25:39", "remaining_time": "2 days, 20:07:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 370, "total_steps": 17540, "loss": 1.264, "learning_rate": 4.218928164196123e-06, "epoch": 0.21090131813323834, "percentage": 2.11, "elapsed_time": "1:28:00", "remaining_time": "2 days, 20:03:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 380, "total_steps": 17540, "loss": 1.2566, "learning_rate": 4.332953249714938e-06, "epoch": 0.21660135375846098, "percentage": 2.17, "elapsed_time": "1:30:26", "remaining_time": "2 days, 20:04:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 390, "total_steps": 17540, "loss": 1.2506, "learning_rate": 4.446978335233752e-06, "epoch": 0.22230138938368366, "percentage": 2.22, "elapsed_time": "1:32:45", "remaining_time": "2 days, 19:58:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 400, "total_steps": 17540, "loss": 1.2341, "learning_rate": 4.561003420752566e-06, "epoch": 0.2280014250089063, "percentage": 2.28, "elapsed_time": "1:35:11", "remaining_time": "2 days, 19:58:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 410, "total_steps": 17540, "loss": 1.2303, "learning_rate": 4.67502850627138e-06, "epoch": 0.23370146063412897, "percentage": 2.34, "elapsed_time": "1:37:31", "remaining_time": "2 days, 19:54:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 420, "total_steps": 17540, "loss": 1.2157, "learning_rate": 4.789053591790194e-06, "epoch": 0.23940149625935161, "percentage": 2.39, "elapsed_time": "1:39:53", "remaining_time": "2 days, 19:51:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 430, "total_steps": 17540, "loss": 1.2119, "learning_rate": 4.903078677309008e-06, "epoch": 0.2451015318845743, "percentage": 2.45, "elapsed_time": "1:42:14", "remaining_time": "2 days, 19:48:16", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 440, "total_steps": 17540, "loss": 1.1998, "learning_rate": 5.017103762827823e-06, "epoch": 0.25080156750979693, "percentage": 2.51, "elapsed_time": "1:44:35", "remaining_time": "2 days, 19:44:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 450, "total_steps": 17540, "loss": 1.1845, "learning_rate": 5.131128848346637e-06, "epoch": 0.2565016031350196, "percentage": 2.57, "elapsed_time": "1:46:57", "remaining_time": "2 days, 19:42:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 460, "total_steps": 17540, "loss": 1.2045, "learning_rate": 5.2451539338654515e-06, "epoch": 0.2622016387602423, "percentage": 2.62, "elapsed_time": "1:49:20", "remaining_time": "2 days, 19:39:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 470, "total_steps": 17540, "loss": 1.1816, "learning_rate": 5.3591790193842655e-06, "epoch": 0.2679016743854649, "percentage": 2.68, "elapsed_time": "1:51:43", "remaining_time": "2 days, 19:37:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 480, "total_steps": 17540, "loss": 1.1867, "learning_rate": 5.4732041049030794e-06, "epoch": 0.27360171001068756, "percentage": 2.74, "elapsed_time": "1:54:06", "remaining_time": "2 days, 19:35:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 490, "total_steps": 17540, "loss": 1.1693, "learning_rate": 5.587229190421893e-06, "epoch": 0.2793017456359102, "percentage": 2.79, "elapsed_time": "1:56:23", "remaining_time": "2 days, 19:30:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 500, "total_steps": 17540, "loss": 1.1769, "learning_rate": 5.701254275940707e-06, "epoch": 0.2850017812611329, "percentage": 2.85, "elapsed_time": "1:58:45", "remaining_time": "2 days, 19:27:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 510, "total_steps": 17540, "loss": 1.1572, "learning_rate": 5.815279361459521e-06, "epoch": 0.29070181688635555, "percentage": 2.91, "elapsed_time": "2:01:02", "remaining_time": "2 days, 19:21:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 520, "total_steps": 17540, "loss": 1.1559, "learning_rate": 5.929304446978335e-06, "epoch": 0.2964018525115782, "percentage": 2.96, "elapsed_time": "2:03:23", "remaining_time": "2 days, 19:18:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 530, "total_steps": 17540, "loss": 1.1402, "learning_rate": 6.04332953249715e-06, "epoch": 0.30210188813680083, "percentage": 3.02, "elapsed_time": "2:05:40", "remaining_time": "2 days, 19:13:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 540, "total_steps": 17540, "loss": 1.1456, "learning_rate": 6.157354618015964e-06, "epoch": 0.30780192376202353, "percentage": 3.08, "elapsed_time": "2:08:03", "remaining_time": "2 days, 19:11:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 550, "total_steps": 17540, "loss": 1.138, "learning_rate": 6.271379703534778e-06, "epoch": 0.3135019593872462, "percentage": 3.14, "elapsed_time": "2:10:25", "remaining_time": "2 days, 19:08:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 560, "total_steps": 17540, "loss": 1.1398, "learning_rate": 6.385404789053592e-06, "epoch": 0.3192019950124688, "percentage": 3.19, "elapsed_time": "2:12:46", "remaining_time": "2 days, 19:06:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 570, "total_steps": 17540, "loss": 1.121, "learning_rate": 6.499429874572406e-06, "epoch": 0.32490203063769146, "percentage": 3.25, "elapsed_time": "2:15:09", "remaining_time": "2 days, 19:03:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 580, "total_steps": 17540, "loss": 1.1116, "learning_rate": 6.61345496009122e-06, "epoch": 0.33060206626291416, "percentage": 3.31, "elapsed_time": "2:17:32", "remaining_time": "2 days, 19:01:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 590, "total_steps": 17540, "loss": 1.1134, "learning_rate": 6.727480045610034e-06, "epoch": 0.3363021018881368, "percentage": 3.36, "elapsed_time": "2:19:57", "remaining_time": "2 days, 19:00:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 600, "total_steps": 17540, "loss": 1.0982, "learning_rate": 6.8415051311288495e-06, "epoch": 0.34200213751335945, "percentage": 3.42, "elapsed_time": "2:22:19", "remaining_time": "2 days, 18:58:16", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 610, "total_steps": 17540, "loss": 1.1104, "learning_rate": 6.9555302166476635e-06, "epoch": 0.3477021731385821, "percentage": 3.48, "elapsed_time": "2:24:43", "remaining_time": "2 days, 18:56:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 620, "total_steps": 17540, "loss": 1.0935, "learning_rate": 7.0695553021664774e-06, "epoch": 0.3534022087638048, "percentage": 3.53, "elapsed_time": "2:27:07", "remaining_time": "2 days, 18:55:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 630, "total_steps": 17540, "loss": 1.0747, "learning_rate": 7.183580387685291e-06, "epoch": 0.35910224438902744, "percentage": 3.59, "elapsed_time": "2:29:25", "remaining_time": "2 days, 18:50:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 640, "total_steps": 17540, "loss": 1.0766, "learning_rate": 7.297605473204105e-06, "epoch": 0.3648022800142501, "percentage": 3.65, "elapsed_time": "2:31:52", "remaining_time": "2 days, 18:50:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 650, "total_steps": 17540, "loss": 1.0817, "learning_rate": 7.41163055872292e-06, "epoch": 0.3705023156394727, "percentage": 3.71, "elapsed_time": "2:34:12", "remaining_time": "2 days, 18:47:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 660, "total_steps": 17540, "loss": 1.0708, "learning_rate": 7.525655644241734e-06, "epoch": 0.3762023512646954, "percentage": 3.76, "elapsed_time": "2:36:30", "remaining_time": "2 days, 18:43:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 670, "total_steps": 17540, "loss": 1.0662, "learning_rate": 7.639680729760547e-06, "epoch": 0.38190238688991807, "percentage": 3.82, "elapsed_time": "2:38:55", "remaining_time": "2 days, 18:41:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 680, "total_steps": 17540, "loss": 1.0743, "learning_rate": 7.753705815279363e-06, "epoch": 0.3876024225151407, "percentage": 3.88, "elapsed_time": "2:41:17", "remaining_time": "2 days, 18:39:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 690, "total_steps": 17540, "loss": 1.055, "learning_rate": 7.867730900798177e-06, "epoch": 0.39330245814036335, "percentage": 3.93, "elapsed_time": "2:43:37", "remaining_time": "2 days, 18:35:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 700, "total_steps": 17540, "loss": 1.0547, "learning_rate": 7.98175598631699e-06, "epoch": 0.39900249376558605, "percentage": 3.99, "elapsed_time": "2:45:58", "remaining_time": "2 days, 18:32:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 710, "total_steps": 17540, "loss": 1.0497, "learning_rate": 8.095781071835805e-06, "epoch": 0.4047025293908087, "percentage": 4.05, "elapsed_time": "2:48:21", "remaining_time": "2 days, 18:30:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 720, "total_steps": 17540, "loss": 1.0603, "learning_rate": 8.209806157354619e-06, "epoch": 0.41040256501603134, "percentage": 4.1, "elapsed_time": "2:50:52", "remaining_time": "2 days, 18:32:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 730, "total_steps": 17540, "loss": 1.0428, "learning_rate": 8.323831242873433e-06, "epoch": 0.416102600641254, "percentage": 4.16, "elapsed_time": "2:53:15", "remaining_time": "2 days, 18:29:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 740, "total_steps": 17540, "loss": 1.0424, "learning_rate": 8.437856328392247e-06, "epoch": 0.4218026362664767, "percentage": 4.22, "elapsed_time": "2:55:35", "remaining_time": "2 days, 18:26:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 750, "total_steps": 17540, "loss": 1.0419, "learning_rate": 8.55188141391106e-06, "epoch": 0.4275026718916993, "percentage": 4.28, "elapsed_time": "2:57:53", "remaining_time": "2 days, 18:22:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 760, "total_steps": 17540, "loss": 1.0368, "learning_rate": 8.665906499429876e-06, "epoch": 0.43320270751692197, "percentage": 4.33, "elapsed_time": "3:00:17", "remaining_time": "2 days, 18:20:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 770, "total_steps": 17540, "loss": 1.0324, "learning_rate": 8.77993158494869e-06, "epoch": 0.4389027431421446, "percentage": 4.39, "elapsed_time": "3:02:43", "remaining_time": "2 days, 18:19:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 780, "total_steps": 17540, "loss": 1.0344, "learning_rate": 8.893956670467504e-06, "epoch": 0.4446027787673673, "percentage": 4.45, "elapsed_time": "3:05:06", "remaining_time": "2 days, 18:17:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 790, "total_steps": 17540, "loss": 1.0273, "learning_rate": 9.007981755986318e-06, "epoch": 0.45030281439258996, "percentage": 4.5, "elapsed_time": "3:07:24", "remaining_time": "2 days, 18:13:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 800, "total_steps": 17540, "loss": 1.0247, "learning_rate": 9.122006841505132e-06, "epoch": 0.4560028500178126, "percentage": 4.56, "elapsed_time": "3:09:45", "remaining_time": "2 days, 18:10:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 810, "total_steps": 17540, "loss": 1.0234, "learning_rate": 9.236031927023946e-06, "epoch": 0.46170288564303524, "percentage": 4.62, "elapsed_time": "3:12:05", "remaining_time": "2 days, 18:07:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 820, "total_steps": 17540, "loss": 1.0206, "learning_rate": 9.35005701254276e-06, "epoch": 0.46740292126825794, "percentage": 4.68, "elapsed_time": "3:14:26", "remaining_time": "2 days, 18:04:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 830, "total_steps": 17540, "loss": 1.0159, "learning_rate": 9.464082098061574e-06, "epoch": 0.4731029568934806, "percentage": 4.73, "elapsed_time": "3:16:42", "remaining_time": "2 days, 18:00:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 840, "total_steps": 17540, "loss": 1.0073, "learning_rate": 9.578107183580388e-06, "epoch": 0.47880299251870323, "percentage": 4.79, "elapsed_time": "3:19:03", "remaining_time": "2 days, 17:57:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 850, "total_steps": 17540, "loss": 1.0049, "learning_rate": 9.692132269099202e-06, "epoch": 0.4845030281439259, "percentage": 4.85, "elapsed_time": "3:21:23", "remaining_time": "2 days, 17:54:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 860, "total_steps": 17540, "loss": 1.0008, "learning_rate": 9.806157354618016e-06, "epoch": 0.4902030637691486, "percentage": 4.9, "elapsed_time": "3:23:51", "remaining_time": "2 days, 17:53:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 870, "total_steps": 17540, "loss": 0.997, "learning_rate": 9.920182440136832e-06, "epoch": 0.4959030993943712, "percentage": 4.96, "elapsed_time": "3:26:13", "remaining_time": "2 days, 17:51:25", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 880, "total_steps": 17540, "loss": 0.9979, "learning_rate": 1.0034207525655646e-05, "epoch": 0.5016031350195939, "percentage": 5.02, "elapsed_time": "3:28:36", "remaining_time": "2 days, 17:49:18", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 890, "total_steps": 17540, "loss": 0.9898, "learning_rate": 1.014823261117446e-05, "epoch": 0.5073031706448166, "percentage": 5.07, "elapsed_time": "3:30:56", "remaining_time": "2 days, 17:46:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 900, "total_steps": 17540, "loss": 0.9821, "learning_rate": 1.0262257696693273e-05, "epoch": 0.5130032062700391, "percentage": 5.13, "elapsed_time": "3:33:17", "remaining_time": "2 days, 17:43:32", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 910, "total_steps": 17540, "loss": 0.9753, "learning_rate": 1.0376282782212087e-05, "epoch": 0.5187032418952618, "percentage": 5.19, "elapsed_time": "3:35:41", "remaining_time": "2 days, 17:41:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 920, "total_steps": 17540, "loss": 0.9907, "learning_rate": 1.0490307867730903e-05, "epoch": 0.5244032775204845, "percentage": 5.25, "elapsed_time": "3:37:55", "remaining_time": "2 days, 17:36:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 930, "total_steps": 17540, "loss": 0.9886, "learning_rate": 1.0604332953249717e-05, "epoch": 0.5301033131457071, "percentage": 5.3, "elapsed_time": "3:40:22", "remaining_time": "2 days, 17:35:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 940, "total_steps": 17540, "loss": 0.9826, "learning_rate": 1.0718358038768531e-05, "epoch": 0.5358033487709298, "percentage": 5.36, "elapsed_time": "3:42:46", "remaining_time": "2 days, 17:34:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 950, "total_steps": 17540, "loss": 0.9865, "learning_rate": 1.0832383124287345e-05, "epoch": 0.5415033843961524, "percentage": 5.42, "elapsed_time": "3:45:13", "remaining_time": "2 days, 17:33:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 960, "total_steps": 17540, "loss": 0.9804, "learning_rate": 1.0946408209806159e-05, "epoch": 0.5472034200213751, "percentage": 5.47, "elapsed_time": "3:47:38", "remaining_time": "2 days, 17:31:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 970, "total_steps": 17540, "loss": 0.9725, "learning_rate": 1.1060433295324973e-05, "epoch": 0.5529034556465978, "percentage": 5.53, "elapsed_time": "3:49:59", "remaining_time": "2 days, 17:28:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 980, "total_steps": 17540, "loss": 0.9745, "learning_rate": 1.1174458380843787e-05, "epoch": 0.5586034912718204, "percentage": 5.59, "elapsed_time": "3:52:20", "remaining_time": "2 days, 17:26:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 990, "total_steps": 17540, "loss": 0.962, "learning_rate": 1.12884834663626e-05, "epoch": 0.5643035268970431, "percentage": 5.64, "elapsed_time": "3:54:41", "remaining_time": "2 days, 17:23:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1000, "total_steps": 17540, "loss": 0.9821, "learning_rate": 1.1402508551881415e-05, "epoch": 0.5700035625222658, "percentage": 5.7, "elapsed_time": "3:57:07", "remaining_time": "2 days, 17:22:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1010, "total_steps": 17540, "loss": 0.9718, "learning_rate": 1.1516533637400229e-05, "epoch": 0.5757035981474884, "percentage": 5.76, "elapsed_time": "3:59:31", "remaining_time": "2 days, 17:20:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1020, "total_steps": 17540, "loss": 0.9831, "learning_rate": 1.1630558722919043e-05, "epoch": 0.5814036337727111, "percentage": 5.82, "elapsed_time": "4:01:52", "remaining_time": "2 days, 17:17:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1030, "total_steps": 17540, "loss": 0.9661, "learning_rate": 1.1744583808437857e-05, "epoch": 0.5871036693979338, "percentage": 5.87, "elapsed_time": "4:04:15", "remaining_time": "2 days, 17:15:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1040, "total_steps": 17540, "loss": 0.973, "learning_rate": 1.185860889395667e-05, "epoch": 0.5928037050231564, "percentage": 5.93, "elapsed_time": "4:06:33", "remaining_time": "2 days, 17:11:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1050, "total_steps": 17540, "loss": 0.9701, "learning_rate": 1.1972633979475485e-05, "epoch": 0.5985037406483791, "percentage": 5.99, "elapsed_time": "4:08:55", "remaining_time": "2 days, 17:09:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1060, "total_steps": 17540, "loss": 0.9583, "learning_rate": 1.20866590649943e-05, "epoch": 0.6042037762736017, "percentage": 6.04, "elapsed_time": "4:11:16", "remaining_time": "2 days, 17:06:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1070, "total_steps": 17540, "loss": 0.9578, "learning_rate": 1.2200684150513114e-05, "epoch": 0.6099038118988244, "percentage": 6.1, "elapsed_time": "4:13:38", "remaining_time": "2 days, 17:04:12", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1080, "total_steps": 17540, "loss": 0.9558, "learning_rate": 1.2314709236031928e-05, "epoch": 0.6156038475240471, "percentage": 6.16, "elapsed_time": "4:16:00", "remaining_time": "2 days, 17:01:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1090, "total_steps": 17540, "loss": 0.9582, "learning_rate": 1.2428734321550742e-05, "epoch": 0.6213038831492697, "percentage": 6.21, "elapsed_time": "4:18:25", "remaining_time": "2 days, 16:59:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1100, "total_steps": 17540, "loss": 0.9552, "learning_rate": 1.2542759407069556e-05, "epoch": 0.6270039187744924, "percentage": 6.27, "elapsed_time": "4:20:45", "remaining_time": "2 days, 16:57:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1110, "total_steps": 17540, "loss": 0.9553, "learning_rate": 1.265678449258837e-05, "epoch": 0.632703954399715, "percentage": 6.33, "elapsed_time": "4:23:05", "remaining_time": "2 days, 16:54:16", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1120, "total_steps": 17540, "loss": 0.9371, "learning_rate": 1.2770809578107184e-05, "epoch": 0.6384039900249376, "percentage": 6.39, "elapsed_time": "4:25:25", "remaining_time": "2 days, 16:51:18", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1130, "total_steps": 17540, "loss": 0.9493, "learning_rate": 1.2884834663625998e-05, "epoch": 0.6441040256501603, "percentage": 6.44, "elapsed_time": "4:27:49", "remaining_time": "2 days, 16:49:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1140, "total_steps": 17540, "loss": 0.9416, "learning_rate": 1.2998859749144812e-05, "epoch": 0.6498040612753829, "percentage": 6.5, "elapsed_time": "4:30:12", "remaining_time": "2 days, 16:47:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1150, "total_steps": 17540, "loss": 0.9357, "learning_rate": 1.3112884834663626e-05, "epoch": 0.6555040969006056, "percentage": 6.56, "elapsed_time": "4:32:33", "remaining_time": "2 days, 16:44:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1160, "total_steps": 17540, "loss": 0.9391, "learning_rate": 1.322690992018244e-05, "epoch": 0.6612041325258283, "percentage": 6.61, "elapsed_time": "4:34:57", "remaining_time": "2 days, 16:42:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1170, "total_steps": 17540, "loss": 0.9352, "learning_rate": 1.3340935005701254e-05, "epoch": 0.6669041681510509, "percentage": 6.67, "elapsed_time": "4:37:21", "remaining_time": "2 days, 16:40:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1180, "total_steps": 17540, "loss": 0.9272, "learning_rate": 1.3454960091220068e-05, "epoch": 0.6726042037762736, "percentage": 6.73, "elapsed_time": "4:39:39", "remaining_time": "2 days, 16:37:16", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1190, "total_steps": 17540, "loss": 0.9366, "learning_rate": 1.3568985176738885e-05, "epoch": 0.6783042394014963, "percentage": 6.78, "elapsed_time": "4:42:03", "remaining_time": "2 days, 16:35:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1200, "total_steps": 17540, "loss": 0.9337, "learning_rate": 1.3683010262257699e-05, "epoch": 0.6840042750267189, "percentage": 6.84, "elapsed_time": "4:44:20", "remaining_time": "2 days, 16:31:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1210, "total_steps": 17540, "loss": 0.921, "learning_rate": 1.3797035347776513e-05, "epoch": 0.6897043106519416, "percentage": 6.9, "elapsed_time": "4:46:43", "remaining_time": "2 days, 16:29:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1220, "total_steps": 17540, "loss": 0.9332, "learning_rate": 1.3911060433295327e-05, "epoch": 0.6954043462771642, "percentage": 6.96, "elapsed_time": "4:49:00", "remaining_time": "2 days, 16:26:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1230, "total_steps": 17540, "loss": 0.9303, "learning_rate": 1.4025085518814141e-05, "epoch": 0.7011043819023869, "percentage": 7.01, "elapsed_time": "4:51:16", "remaining_time": "2 days, 16:22:18", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1240, "total_steps": 17540, "loss": 0.93, "learning_rate": 1.4139110604332955e-05, "epoch": 0.7068044175276096, "percentage": 7.07, "elapsed_time": "4:53:37", "remaining_time": "2 days, 16:19:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1250, "total_steps": 17540, "loss": 0.9216, "learning_rate": 1.4253135689851769e-05, "epoch": 0.7125044531528322, "percentage": 7.13, "elapsed_time": "4:55:57", "remaining_time": "2 days, 16:16:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1260, "total_steps": 17540, "loss": 0.9202, "learning_rate": 1.4367160775370583e-05, "epoch": 0.7182044887780549, "percentage": 7.18, "elapsed_time": "4:58:20", "remaining_time": "2 days, 16:14:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1270, "total_steps": 17540, "loss": 0.9241, "learning_rate": 1.4481185860889397e-05, "epoch": 0.7239045244032776, "percentage": 7.24, "elapsed_time": "5:00:40", "remaining_time": "2 days, 16:11:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1280, "total_steps": 17540, "loss": 0.9182, "learning_rate": 1.459521094640821e-05, "epoch": 0.7296045600285002, "percentage": 7.3, "elapsed_time": "5:03:02", "remaining_time": "2 days, 16:09:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1290, "total_steps": 17540, "loss": 0.9315, "learning_rate": 1.4709236031927025e-05, "epoch": 0.7353045956537229, "percentage": 7.35, "elapsed_time": "5:05:26", "remaining_time": "2 days, 16:07:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1300, "total_steps": 17540, "loss": 0.9112, "learning_rate": 1.482326111744584e-05, "epoch": 0.7410046312789454, "percentage": 7.41, "elapsed_time": "5:07:48", "remaining_time": "2 days, 16:05:12", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1310, "total_steps": 17540, "loss": 0.9272, "learning_rate": 1.4937286202964654e-05, "epoch": 0.7467046669041681, "percentage": 7.47, "elapsed_time": "5:10:08", "remaining_time": "2 days, 16:02:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1320, "total_steps": 17540, "loss": 0.9297, "learning_rate": 1.5051311288483468e-05, "epoch": 0.7524047025293908, "percentage": 7.53, "elapsed_time": "5:12:29", "remaining_time": "2 days, 15:59:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1330, "total_steps": 17540, "loss": 0.9342, "learning_rate": 1.5165336374002282e-05, "epoch": 0.7581047381546134, "percentage": 7.58, "elapsed_time": "5:14:52", "remaining_time": "2 days, 15:57:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1340, "total_steps": 17540, "loss": 0.9112, "learning_rate": 1.5279361459521094e-05, "epoch": 0.7638047737798361, "percentage": 7.64, "elapsed_time": "5:17:18", "remaining_time": "2 days, 15:56:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1350, "total_steps": 17540, "loss": 0.9117, "learning_rate": 1.539338654503991e-05, "epoch": 0.7695048094050588, "percentage": 7.7, "elapsed_time": "5:19:43", "remaining_time": "2 days, 15:54:16", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1360, "total_steps": 17540, "loss": 0.9004, "learning_rate": 1.5507411630558726e-05, "epoch": 0.7752048450302814, "percentage": 7.75, "elapsed_time": "5:22:03", "remaining_time": "2 days, 15:51:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1370, "total_steps": 17540, "loss": 0.9117, "learning_rate": 1.5621436716077538e-05, "epoch": 0.7809048806555041, "percentage": 7.81, "elapsed_time": "5:24:26", "remaining_time": "2 days, 15:49:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1380, "total_steps": 17540, "loss": 0.9163, "learning_rate": 1.5735461801596354e-05, "epoch": 0.7866049162807267, "percentage": 7.87, "elapsed_time": "5:26:43", "remaining_time": "2 days, 15:46:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1390, "total_steps": 17540, "loss": 0.9172, "learning_rate": 1.5849486887115166e-05, "epoch": 0.7923049519059494, "percentage": 7.92, "elapsed_time": "5:29:06", "remaining_time": "2 days, 15:43:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1400, "total_steps": 17540, "loss": 0.9072, "learning_rate": 1.596351197263398e-05, "epoch": 0.7980049875311721, "percentage": 7.98, "elapsed_time": "5:31:26", "remaining_time": "2 days, 15:40:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1410, "total_steps": 17540, "loss": 0.9038, "learning_rate": 1.6077537058152794e-05, "epoch": 0.8037050231563947, "percentage": 8.04, "elapsed_time": "5:33:43", "remaining_time": "2 days, 15:37:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1420, "total_steps": 17540, "loss": 0.9078, "learning_rate": 1.619156214367161e-05, "epoch": 0.8094050587816174, "percentage": 8.1, "elapsed_time": "5:36:03", "remaining_time": "2 days, 15:34:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1430, "total_steps": 17540, "loss": 0.9092, "learning_rate": 1.6305587229190422e-05, "epoch": 0.8151050944068401, "percentage": 8.15, "elapsed_time": "5:38:25", "remaining_time": "2 days, 15:32:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1440, "total_steps": 17540, "loss": 0.8968, "learning_rate": 1.6419612314709237e-05, "epoch": 0.8208051300320627, "percentage": 8.21, "elapsed_time": "5:40:48", "remaining_time": "2 days, 15:30:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1450, "total_steps": 17540, "loss": 0.8897, "learning_rate": 1.653363740022805e-05, "epoch": 0.8265051656572854, "percentage": 8.27, "elapsed_time": "5:43:10", "remaining_time": "2 days, 15:28:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1460, "total_steps": 17540, "loss": 0.9091, "learning_rate": 1.6647662485746865e-05, "epoch": 0.832205201282508, "percentage": 8.32, "elapsed_time": "5:45:34", "remaining_time": "2 days, 15:26:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1470, "total_steps": 17540, "loss": 0.8915, "learning_rate": 1.6761687571265678e-05, "epoch": 0.8379052369077307, "percentage": 8.38, "elapsed_time": "5:47:51", "remaining_time": "2 days, 15:22:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1480, "total_steps": 17540, "loss": 0.9033, "learning_rate": 1.6875712656784493e-05, "epoch": 0.8436052725329534, "percentage": 8.44, "elapsed_time": "5:50:12", "remaining_time": "2 days, 15:20:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1490, "total_steps": 17540, "loss": 0.9074, "learning_rate": 1.6989737742303306e-05, "epoch": 0.849305308158176, "percentage": 8.49, "elapsed_time": "5:52:33", "remaining_time": "2 days, 15:17:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1500, "total_steps": 17540, "loss": 0.8935, "learning_rate": 1.710376282782212e-05, "epoch": 0.8550053437833987, "percentage": 8.55, "elapsed_time": "5:54:56", "remaining_time": "2 days, 15:15:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1510, "total_steps": 17540, "loss": 0.886, "learning_rate": 1.7217787913340937e-05, "epoch": 0.8607053794086214, "percentage": 8.61, "elapsed_time": "5:57:20", "remaining_time": "2 days, 15:13:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1520, "total_steps": 17540, "loss": 0.89, "learning_rate": 1.7331812998859753e-05, "epoch": 0.8664054150338439, "percentage": 8.67, "elapsed_time": "5:59:40", "remaining_time": "2 days, 15:10:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1530, "total_steps": 17540, "loss": 0.8916, "learning_rate": 1.7445838084378565e-05, "epoch": 0.8721054506590666, "percentage": 8.72, "elapsed_time": "6:02:02", "remaining_time": "2 days, 15:08:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1540, "total_steps": 17540, "loss": 0.8859, "learning_rate": 1.755986316989738e-05, "epoch": 0.8778054862842892, "percentage": 8.78, "elapsed_time": "6:04:27", "remaining_time": "2 days, 15:06:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1550, "total_steps": 17540, "loss": 0.8919, "learning_rate": 1.7673888255416193e-05, "epoch": 0.8835055219095119, "percentage": 8.84, "elapsed_time": "6:06:52", "remaining_time": "2 days, 15:04:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1560, "total_steps": 17540, "loss": 0.8913, "learning_rate": 1.778791334093501e-05, "epoch": 0.8892055575347346, "percentage": 8.89, "elapsed_time": "6:09:12", "remaining_time": "2 days, 15:02:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1570, "total_steps": 17540, "loss": 0.8915, "learning_rate": 1.790193842645382e-05, "epoch": 0.8949055931599572, "percentage": 8.95, "elapsed_time": "6:11:35", "remaining_time": "2 days, 14:59:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1580, "total_steps": 17540, "loss": 0.8925, "learning_rate": 1.8015963511972636e-05, "epoch": 0.9006056287851799, "percentage": 9.01, "elapsed_time": "6:13:51", "remaining_time": "2 days, 14:56:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1590, "total_steps": 17540, "loss": 0.8763, "learning_rate": 1.812998859749145e-05, "epoch": 0.9063056644104026, "percentage": 9.06, "elapsed_time": "6:16:08", "remaining_time": "2 days, 14:53:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1600, "total_steps": 17540, "loss": 0.883, "learning_rate": 1.8244013683010264e-05, "epoch": 0.9120057000356252, "percentage": 9.12, "elapsed_time": "6:18:33", "remaining_time": "2 days, 14:51:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1610, "total_steps": 17540, "loss": 0.8849, "learning_rate": 1.835803876852908e-05, "epoch": 0.9177057356608479, "percentage": 9.18, "elapsed_time": "6:20:54", "remaining_time": "2 days, 14:48:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1620, "total_steps": 17540, "loss": 0.8887, "learning_rate": 1.8472063854047892e-05, "epoch": 0.9234057712860705, "percentage": 9.24, "elapsed_time": "6:23:19", "remaining_time": "2 days, 14:46:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1630, "total_steps": 17540, "loss": 0.8876, "learning_rate": 1.8586088939566708e-05, "epoch": 0.9291058069112932, "percentage": 9.29, "elapsed_time": "6:25:39", "remaining_time": "2 days, 14:44:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1640, "total_steps": 17540, "loss": 0.8719, "learning_rate": 1.870011402508552e-05, "epoch": 0.9348058425365159, "percentage": 9.35, "elapsed_time": "6:27:59", "remaining_time": "2 days, 14:41:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1650, "total_steps": 17540, "loss": 0.8941, "learning_rate": 1.8814139110604336e-05, "epoch": 0.9405058781617385, "percentage": 9.41, "elapsed_time": "6:30:27", "remaining_time": "2 days, 14:40:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1660, "total_steps": 17540, "loss": 0.8849, "learning_rate": 1.8928164196123148e-05, "epoch": 0.9462059137869612, "percentage": 9.46, "elapsed_time": "6:32:46", "remaining_time": "2 days, 14:37:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1670, "total_steps": 17540, "loss": 0.8878, "learning_rate": 1.9042189281641964e-05, "epoch": 0.9519059494121839, "percentage": 9.52, "elapsed_time": "6:35:14", "remaining_time": "2 days, 14:35:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1680, "total_steps": 17540, "loss": 0.8885, "learning_rate": 1.9156214367160776e-05, "epoch": 0.9576059850374065, "percentage": 9.58, "elapsed_time": "6:37:35", "remaining_time": "2 days, 14:33:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1690, "total_steps": 17540, "loss": 0.8804, "learning_rate": 1.927023945267959e-05, "epoch": 0.9633060206626292, "percentage": 9.64, "elapsed_time": "6:40:00", "remaining_time": "2 days, 14:31:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1700, "total_steps": 17540, "loss": 0.8664, "learning_rate": 1.9384264538198404e-05, "epoch": 0.9690060562878517, "percentage": 9.69, "elapsed_time": "6:42:20", "remaining_time": "2 days, 14:28:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1710, "total_steps": 17540, "loss": 0.887, "learning_rate": 1.949828962371722e-05, "epoch": 0.9747060919130744, "percentage": 9.75, "elapsed_time": "6:44:42", "remaining_time": "2 days, 14:26:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1720, "total_steps": 17540, "loss": 0.8792, "learning_rate": 1.9612314709236032e-05, "epoch": 0.9804061275382971, "percentage": 9.81, "elapsed_time": "6:46:58", "remaining_time": "2 days, 14:23:16", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1730, "total_steps": 17540, "loss": 0.8757, "learning_rate": 1.9726339794754847e-05, "epoch": 0.9861061631635197, "percentage": 9.86, "elapsed_time": "6:49:17", "remaining_time": "2 days, 14:20:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1740, "total_steps": 17540, "loss": 0.8753, "learning_rate": 1.9840364880273663e-05, "epoch": 0.9918061987887424, "percentage": 9.92, "elapsed_time": "6:51:42", "remaining_time": "2 days, 14:18:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1750, "total_steps": 17540, "loss": 0.8631, "learning_rate": 1.9954389965792475e-05, "epoch": 0.9975062344139651, "percentage": 9.98, "elapsed_time": "6:54:09", "remaining_time": "2 days, 14:16:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1760, "total_steps": 17540, "loss": 0.8597, "learning_rate": 1.999999287101006e-05, "epoch": 1.0032062700391877, "percentage": 10.03, "elapsed_time": "6:56:32", "remaining_time": "2 days, 14:14:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1770, "total_steps": 17540, "loss": 0.8749, "learning_rate": 1.9999949304997227e-05, "epoch": 1.0089063056644103, "percentage": 10.09, "elapsed_time": "6:58:57", "remaining_time": "2 days, 14:12:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1780, "total_steps": 17540, "loss": 0.8701, "learning_rate": 1.9999866133693866e-05, "epoch": 1.0146063412896331, "percentage": 10.15, "elapsed_time": "7:01:25", "remaining_time": "2 days, 14:11:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1790, "total_steps": 17540, "loss": 0.8618, "learning_rate": 1.999974335742938e-05, "epoch": 1.0203063769148557, "percentage": 10.21, "elapsed_time": "7:03:46", "remaining_time": "2 days, 14:08:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1800, "total_steps": 17540, "loss": 0.8654, "learning_rate": 1.999958097669003e-05, "epoch": 1.0260064125400783, "percentage": 10.26, "elapsed_time": "7:06:10", "remaining_time": "2 days, 14:06:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1810, "total_steps": 17540, "loss": 0.8559, "learning_rate": 1.9999378992118937e-05, "epoch": 1.031706448165301, "percentage": 10.32, "elapsed_time": "7:08:34", "remaining_time": "2 days, 14:04:32", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1820, "total_steps": 17540, "loss": 0.8496, "learning_rate": 1.9999137404516062e-05, "epoch": 1.0374064837905237, "percentage": 10.38, "elapsed_time": "7:11:01", "remaining_time": "2 days, 14:02:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1830, "total_steps": 17540, "loss": 0.85, "learning_rate": 1.999885621483823e-05, "epoch": 1.0431065194157463, "percentage": 10.43, "elapsed_time": "7:13:26", "remaining_time": "2 days, 14:01:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1840, "total_steps": 17540, "loss": 0.8579, "learning_rate": 1.9998535424199112e-05, "epoch": 1.048806555040969, "percentage": 10.49, "elapsed_time": "7:15:48", "remaining_time": "2 days, 13:58:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1850, "total_steps": 17540, "loss": 0.8644, "learning_rate": 1.9998175033869205e-05, "epoch": 1.0545065906661917, "percentage": 10.55, "elapsed_time": "7:18:10", "remaining_time": "2 days, 13:56:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1860, "total_steps": 17540, "loss": 0.8597, "learning_rate": 1.999777504527586e-05, "epoch": 1.0602066262914143, "percentage": 10.6, "elapsed_time": "7:20:30", "remaining_time": "2 days, 13:53:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1870, "total_steps": 17540, "loss": 0.8589, "learning_rate": 1.9997335460003246e-05, "epoch": 1.065906661916637, "percentage": 10.66, "elapsed_time": "7:22:47", "remaining_time": "2 days, 13:50:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1880, "total_steps": 17540, "loss": 0.8526, "learning_rate": 1.9996856279792368e-05, "epoch": 1.0716066975418597, "percentage": 10.72, "elapsed_time": "7:25:08", "remaining_time": "2 days, 13:47:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1890, "total_steps": 17540, "loss": 0.8605, "learning_rate": 1.999633750654104e-05, "epoch": 1.0773067331670823, "percentage": 10.78, "elapsed_time": "7:27:31", "remaining_time": "2 days, 13:45:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1900, "total_steps": 17540, "loss": 0.8582, "learning_rate": 1.999577914230388e-05, "epoch": 1.083006768792305, "percentage": 10.83, "elapsed_time": "7:29:44", "remaining_time": "2 days, 13:42:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1910, "total_steps": 17540, "loss": 0.8624, "learning_rate": 1.9995181189292334e-05, "epoch": 1.0887068044175277, "percentage": 10.89, "elapsed_time": "7:32:04", "remaining_time": "2 days, 13:39:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1920, "total_steps": 17540, "loss": 0.8518, "learning_rate": 1.999454364987461e-05, "epoch": 1.0944068400427502, "percentage": 10.95, "elapsed_time": "7:34:23", "remaining_time": "2 days, 13:36:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1930, "total_steps": 17540, "loss": 0.8561, "learning_rate": 1.9993866526575723e-05, "epoch": 1.1001068756679728, "percentage": 11.0, "elapsed_time": "7:36:48", "remaining_time": "2 days, 13:34:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1940, "total_steps": 17540, "loss": 0.8627, "learning_rate": 1.999314982207745e-05, "epoch": 1.1058069112931956, "percentage": 11.06, "elapsed_time": "7:39:12", "remaining_time": "2 days, 13:32:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1950, "total_steps": 17540, "loss": 0.8468, "learning_rate": 1.9992393539218334e-05, "epoch": 1.1115069469184182, "percentage": 11.12, "elapsed_time": "7:41:32", "remaining_time": "2 days, 13:30:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1960, "total_steps": 17540, "loss": 0.8612, "learning_rate": 1.999159768099367e-05, "epoch": 1.1172069825436408, "percentage": 11.17, "elapsed_time": "7:43:58", "remaining_time": "2 days, 13:28:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1970, "total_steps": 17540, "loss": 0.8515, "learning_rate": 1.9990762250555495e-05, "epoch": 1.1229070181688636, "percentage": 11.23, "elapsed_time": "7:46:23", "remaining_time": "2 days, 13:26:12", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1980, "total_steps": 17540, "loss": 0.8403, "learning_rate": 1.9989887251212575e-05, "epoch": 1.1286070537940862, "percentage": 11.29, "elapsed_time": "7:48:47", "remaining_time": "2 days, 13:23:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 1990, "total_steps": 17540, "loss": 0.8434, "learning_rate": 1.9988972686430382e-05, "epoch": 1.1343070894193088, "percentage": 11.35, "elapsed_time": "7:51:08", "remaining_time": "2 days, 13:21:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2000, "total_steps": 17540, "loss": 0.8573, "learning_rate": 1.9988018559831093e-05, "epoch": 1.1400071250445316, "percentage": 11.4, "elapsed_time": "7:53:31", "remaining_time": "2 days, 13:19:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2010, "total_steps": 17540, "loss": 0.8446, "learning_rate": 1.998702487519358e-05, "epoch": 1.1457071606697542, "percentage": 11.46, "elapsed_time": "7:55:55", "remaining_time": "2 days, 13:17:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2020, "total_steps": 17540, "loss": 0.8471, "learning_rate": 1.998599163645338e-05, "epoch": 1.1514071962949768, "percentage": 11.52, "elapsed_time": "7:58:16", "remaining_time": "2 days, 13:14:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2030, "total_steps": 17540, "loss": 0.8475, "learning_rate": 1.9984918847702684e-05, "epoch": 1.1571072319201996, "percentage": 11.57, "elapsed_time": "8:00:41", "remaining_time": "2 days, 13:12:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2040, "total_steps": 17540, "loss": 0.8463, "learning_rate": 1.9983806513190323e-05, "epoch": 1.1628072675454222, "percentage": 11.63, "elapsed_time": "8:02:58", "remaining_time": "2 days, 13:09:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2050, "total_steps": 17540, "loss": 0.8406, "learning_rate": 1.998265463732175e-05, "epoch": 1.1685073031706448, "percentage": 11.69, "elapsed_time": "8:05:17", "remaining_time": "2 days, 13:06:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2060, "total_steps": 17540, "loss": 0.8486, "learning_rate": 1.9981463224659034e-05, "epoch": 1.1742073387958674, "percentage": 11.74, "elapsed_time": "8:07:36", "remaining_time": "2 days, 13:04:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2070, "total_steps": 17540, "loss": 0.836, "learning_rate": 1.9980232279920814e-05, "epoch": 1.1799073744210902, "percentage": 11.8, "elapsed_time": "8:09:57", "remaining_time": "2 days, 13:01:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2080, "total_steps": 17540, "loss": 0.8432, "learning_rate": 1.9978961807982312e-05, "epoch": 1.1856074100463128, "percentage": 11.86, "elapsed_time": "8:12:18", "remaining_time": "2 days, 12:59:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2090, "total_steps": 17540, "loss": 0.8327, "learning_rate": 1.9977651813875293e-05, "epoch": 1.1913074456715353, "percentage": 11.92, "elapsed_time": "8:14:42", "remaining_time": "2 days, 12:57:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2100, "total_steps": 17540, "loss": 0.8362, "learning_rate": 1.997630230278806e-05, "epoch": 1.1970074812967582, "percentage": 11.97, "elapsed_time": "8:17:07", "remaining_time": "2 days, 12:55:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2110, "total_steps": 17540, "loss": 0.8441, "learning_rate": 1.997491328006541e-05, "epoch": 1.2027075169219807, "percentage": 12.03, "elapsed_time": "8:19:24", "remaining_time": "2 days, 12:52:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2120, "total_steps": 17540, "loss": 0.8383, "learning_rate": 1.9973484751208636e-05, "epoch": 1.2084075525472033, "percentage": 12.09, "elapsed_time": "8:21:46", "remaining_time": "2 days, 12:49:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2130, "total_steps": 17540, "loss": 0.8507, "learning_rate": 1.99720167218755e-05, "epoch": 1.2141075881724261, "percentage": 12.14, "elapsed_time": "8:24:10", "remaining_time": "2 days, 12:47:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2140, "total_steps": 17540, "loss": 0.8356, "learning_rate": 1.9970509197880204e-05, "epoch": 1.2198076237976487, "percentage": 12.2, "elapsed_time": "8:26:32", "remaining_time": "2 days, 12:45:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2150, "total_steps": 17540, "loss": 0.8411, "learning_rate": 1.9968962185193367e-05, "epoch": 1.2255076594228713, "percentage": 12.26, "elapsed_time": "8:28:55", "remaining_time": "2 days, 12:42:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2160, "total_steps": 17540, "loss": 0.8319, "learning_rate": 1.9967375689942013e-05, "epoch": 1.2312076950480941, "percentage": 12.31, "elapsed_time": "8:31:22", "remaining_time": "2 days, 12:41:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2170, "total_steps": 17540, "loss": 0.8488, "learning_rate": 1.9965749718409532e-05, "epoch": 1.2369077306733167, "percentage": 12.37, "elapsed_time": "8:33:44", "remaining_time": "2 days, 12:38:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2180, "total_steps": 17540, "loss": 0.8452, "learning_rate": 1.9964084277035668e-05, "epoch": 1.2426077662985393, "percentage": 12.43, "elapsed_time": "8:36:04", "remaining_time": "2 days, 12:36:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2190, "total_steps": 17540, "loss": 0.8414, "learning_rate": 1.996237937241648e-05, "epoch": 1.2483078019237621, "percentage": 12.49, "elapsed_time": "8:38:25", "remaining_time": "2 days, 12:33:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2200, "total_steps": 17540, "loss": 0.8434, "learning_rate": 1.9960635011304325e-05, "epoch": 1.2540078375489847, "percentage": 12.54, "elapsed_time": "8:40:46", "remaining_time": "2 days, 12:31:12", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2210, "total_steps": 17540, "loss": 0.8395, "learning_rate": 1.9958851200607833e-05, "epoch": 1.2597078731742073, "percentage": 12.6, "elapsed_time": "8:43:06", "remaining_time": "2 days, 12:28:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2220, "total_steps": 17540, "loss": 0.8477, "learning_rate": 1.9957027947391873e-05, "epoch": 1.26540790879943, "percentage": 12.66, "elapsed_time": "8:45:24", "remaining_time": "2 days, 12:25:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2230, "total_steps": 17540, "loss": 0.8354, "learning_rate": 1.9955165258877534e-05, "epoch": 1.2711079444246527, "percentage": 12.71, "elapsed_time": "8:47:54", "remaining_time": "2 days, 12:24:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2240, "total_steps": 17540, "loss": 0.8356, "learning_rate": 1.9953263142442078e-05, "epoch": 1.2768079800498753, "percentage": 12.77, "elapsed_time": "8:50:11", "remaining_time": "2 days, 12:21:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2250, "total_steps": 17540, "loss": 0.8259, "learning_rate": 1.9951321605618932e-05, "epoch": 1.282508015675098, "percentage": 12.83, "elapsed_time": "8:52:34", "remaining_time": "2 days, 12:19:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2260, "total_steps": 17540, "loss": 0.8307, "learning_rate": 1.9949340656097652e-05, "epoch": 1.2882080513003207, "percentage": 12.88, "elapsed_time": "8:54:57", "remaining_time": "2 days, 12:16:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2270, "total_steps": 17540, "loss": 0.8431, "learning_rate": 1.9947320301723882e-05, "epoch": 1.2939080869255433, "percentage": 12.94, "elapsed_time": "8:57:14", "remaining_time": "2 days, 12:14:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2280, "total_steps": 17540, "loss": 0.839, "learning_rate": 1.9945260550499337e-05, "epoch": 1.299608122550766, "percentage": 13.0, "elapsed_time": "8:59:34", "remaining_time": "2 days, 12:11:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2290, "total_steps": 17540, "loss": 0.8401, "learning_rate": 1.9943161410581765e-05, "epoch": 1.3053081581759887, "percentage": 13.06, "elapsed_time": "9:01:56", "remaining_time": "2 days, 12:09:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2300, "total_steps": 17540, "loss": 0.8297, "learning_rate": 1.994102289028491e-05, "epoch": 1.3110081938012113, "percentage": 13.11, "elapsed_time": "9:04:16", "remaining_time": "2 days, 12:06:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2310, "total_steps": 17540, "loss": 0.8322, "learning_rate": 1.993884499807848e-05, "epoch": 1.3167082294264338, "percentage": 13.17, "elapsed_time": "9:06:38", "remaining_time": "2 days, 12:04:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2320, "total_steps": 17540, "loss": 0.8331, "learning_rate": 1.9936627742588136e-05, "epoch": 1.3224082650516567, "percentage": 13.23, "elapsed_time": "9:09:03", "remaining_time": "2 days, 12:01:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2330, "total_steps": 17540, "loss": 0.8253, "learning_rate": 1.9934371132595426e-05, "epoch": 1.3281083006768792, "percentage": 13.28, "elapsed_time": "9:11:25", "remaining_time": "2 days, 11:59:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2340, "total_steps": 17540, "loss": 0.8252, "learning_rate": 1.9932075177037757e-05, "epoch": 1.3338083363021018, "percentage": 13.34, "elapsed_time": "9:13:47", "remaining_time": "2 days, 11:57:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2350, "total_steps": 17540, "loss": 0.8218, "learning_rate": 1.9929739885008375e-05, "epoch": 1.3395083719273244, "percentage": 13.4, "elapsed_time": "9:16:05", "remaining_time": "2 days, 11:54:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2360, "total_steps": 17540, "loss": 0.834, "learning_rate": 1.9927365265756326e-05, "epoch": 1.3452084075525472, "percentage": 13.45, "elapsed_time": "9:18:22", "remaining_time": "2 days, 11:51:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2370, "total_steps": 17540, "loss": 0.8324, "learning_rate": 1.9924951328686398e-05, "epoch": 1.3509084431777698, "percentage": 13.51, "elapsed_time": "9:20:44", "remaining_time": "2 days, 11:49:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2380, "total_steps": 17540, "loss": 0.8257, "learning_rate": 1.9922498083359113e-05, "epoch": 1.3566084788029924, "percentage": 13.57, "elapsed_time": "9:23:04", "remaining_time": "2 days, 11:46:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2390, "total_steps": 17540, "loss": 0.8274, "learning_rate": 1.9920005539490666e-05, "epoch": 1.3623085144282152, "percentage": 13.63, "elapsed_time": "9:25:24", "remaining_time": "2 days, 11:44:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2400, "total_steps": 17540, "loss": 0.8349, "learning_rate": 1.9917473706952905e-05, "epoch": 1.3680085500534378, "percentage": 13.68, "elapsed_time": "9:27:41", "remaining_time": "2 days, 11:41:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2410, "total_steps": 17540, "loss": 0.8306, "learning_rate": 1.9914902595773268e-05, "epoch": 1.3737085856786604, "percentage": 13.74, "elapsed_time": "9:30:03", "remaining_time": "2 days, 11:38:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2420, "total_steps": 17540, "loss": 0.8298, "learning_rate": 1.9912292216134775e-05, "epoch": 1.3794086213038832, "percentage": 13.8, "elapsed_time": "9:32:24", "remaining_time": "2 days, 11:36:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2430, "total_steps": 17540, "loss": 0.8148, "learning_rate": 1.990964257837596e-05, "epoch": 1.3851086569291058, "percentage": 13.85, "elapsed_time": "9:34:43", "remaining_time": "2 days, 11:33:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2440, "total_steps": 17540, "loss": 0.8277, "learning_rate": 1.9906953692990843e-05, "epoch": 1.3908086925543284, "percentage": 13.91, "elapsed_time": "9:37:05", "remaining_time": "2 days, 11:31:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2450, "total_steps": 17540, "loss": 0.8248, "learning_rate": 1.990422557062889e-05, "epoch": 1.3965087281795512, "percentage": 13.97, "elapsed_time": "9:39:26", "remaining_time": "2 days, 11:28:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2460, "total_steps": 17540, "loss": 0.8291, "learning_rate": 1.9901458222094964e-05, "epoch": 1.4022087638047738, "percentage": 14.03, "elapsed_time": "9:41:50", "remaining_time": "2 days, 11:26:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2470, "total_steps": 17540, "loss": 0.8294, "learning_rate": 1.9898651658349276e-05, "epoch": 1.4079087994299964, "percentage": 14.08, "elapsed_time": "9:44:17", "remaining_time": "2 days, 11:24:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2480, "total_steps": 17540, "loss": 0.827, "learning_rate": 1.9895805890507368e-05, "epoch": 1.4136088350552192, "percentage": 14.14, "elapsed_time": "9:46:37", "remaining_time": "2 days, 11:22:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2490, "total_steps": 17540, "loss": 0.8256, "learning_rate": 1.9892920929840042e-05, "epoch": 1.4193088706804418, "percentage": 14.2, "elapsed_time": "9:48:59", "remaining_time": "2 days, 11:19:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2500, "total_steps": 17540, "loss": 0.8149, "learning_rate": 1.988999678777332e-05, "epoch": 1.4250089063056643, "percentage": 14.25, "elapsed_time": "9:51:23", "remaining_time": "2 days, 11:17:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2510, "total_steps": 17540, "loss": 0.8219, "learning_rate": 1.988703347588842e-05, "epoch": 1.4307089419308872, "percentage": 14.31, "elapsed_time": "9:53:41", "remaining_time": "2 days, 11:15:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2520, "total_steps": 17540, "loss": 0.8272, "learning_rate": 1.988403100592168e-05, "epoch": 1.4364089775561097, "percentage": 14.37, "elapsed_time": "9:56:06", "remaining_time": "2 days, 11:12:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2530, "total_steps": 17540, "loss": 0.8185, "learning_rate": 1.988098938976453e-05, "epoch": 1.4421090131813323, "percentage": 14.42, "elapsed_time": "9:58:28", "remaining_time": "2 days, 11:10:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2540, "total_steps": 17540, "loss": 0.8224, "learning_rate": 1.9877908639463438e-05, "epoch": 1.4478090488065551, "percentage": 14.48, "elapsed_time": "10:00:49", "remaining_time": "2 days, 11:08:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2550, "total_steps": 17540, "loss": 0.829, "learning_rate": 1.987478876721987e-05, "epoch": 1.4535090844317777, "percentage": 14.54, "elapsed_time": "10:03:12", "remaining_time": "2 days, 11:05:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2560, "total_steps": 17540, "loss": 0.823, "learning_rate": 1.9871629785390234e-05, "epoch": 1.4592091200570003, "percentage": 14.6, "elapsed_time": "10:05:32", "remaining_time": "2 days, 11:03:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2570, "total_steps": 17540, "loss": 0.8192, "learning_rate": 1.986843170648583e-05, "epoch": 1.4649091556822231, "percentage": 14.65, "elapsed_time": "10:07:54", "remaining_time": "2 days, 11:01:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2580, "total_steps": 17540, "loss": 0.813, "learning_rate": 1.9865194543172808e-05, "epoch": 1.4706091913074457, "percentage": 14.71, "elapsed_time": "10:10:17", "remaining_time": "2 days, 10:58:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2590, "total_steps": 17540, "loss": 0.8206, "learning_rate": 1.986191830827211e-05, "epoch": 1.4763092269326683, "percentage": 14.77, "elapsed_time": "10:12:37", "remaining_time": "2 days, 10:56:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2600, "total_steps": 17540, "loss": 0.8288, "learning_rate": 1.985860301475943e-05, "epoch": 1.4820092625578911, "percentage": 14.82, "elapsed_time": "10:14:57", "remaining_time": "2 days, 10:53:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2610, "total_steps": 17540, "loss": 0.8212, "learning_rate": 1.9855248675765146e-05, "epoch": 1.4877092981831137, "percentage": 14.88, "elapsed_time": "10:17:16", "remaining_time": "2 days, 10:50:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2620, "total_steps": 17540, "loss": 0.8271, "learning_rate": 1.9851855304574287e-05, "epoch": 1.4934093338083363, "percentage": 14.94, "elapsed_time": "10:19:33", "remaining_time": "2 days, 10:48:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2630, "total_steps": 17540, "loss": 0.8287, "learning_rate": 1.9848422914626462e-05, "epoch": 1.4991093694335589, "percentage": 14.99, "elapsed_time": "10:21:51", "remaining_time": "2 days, 10:45:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2640, "total_steps": 17540, "loss": 0.8171, "learning_rate": 1.984495151951582e-05, "epoch": 1.5048094050587815, "percentage": 15.05, "elapsed_time": "10:24:16", "remaining_time": "2 days, 10:43:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2650, "total_steps": 17540, "loss": 0.8253, "learning_rate": 1.9841441132990998e-05, "epoch": 1.5105094406840043, "percentage": 15.11, "elapsed_time": "10:26:39", "remaining_time": "2 days, 10:41:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2660, "total_steps": 17540, "loss": 0.809, "learning_rate": 1.983789176895505e-05, "epoch": 1.516209476309227, "percentage": 15.17, "elapsed_time": "10:29:00", "remaining_time": "2 days, 10:38:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2670, "total_steps": 17540, "loss": 0.8264, "learning_rate": 1.9834303441465402e-05, "epoch": 1.5219095119344495, "percentage": 15.22, "elapsed_time": "10:31:20", "remaining_time": "2 days, 10:36:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2680, "total_steps": 17540, "loss": 0.8128, "learning_rate": 1.9830676164733808e-05, "epoch": 1.5276095475596723, "percentage": 15.28, "elapsed_time": "10:33:43", "remaining_time": "2 days, 10:33:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2690, "total_steps": 17540, "loss": 0.8049, "learning_rate": 1.9827009953126277e-05, "epoch": 1.5333095831848949, "percentage": 15.34, "elapsed_time": "10:36:06", "remaining_time": "2 days, 10:31:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2700, "total_steps": 17540, "loss": 0.8144, "learning_rate": 1.982330482116301e-05, "epoch": 1.5390096188101174, "percentage": 15.39, "elapsed_time": "10:38:33", "remaining_time": "2 days, 10:29:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2710, "total_steps": 17540, "loss": 0.8044, "learning_rate": 1.9819560783518378e-05, "epoch": 1.5447096544353403, "percentage": 15.45, "elapsed_time": "10:40:55", "remaining_time": "2 days, 10:27:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2720, "total_steps": 17540, "loss": 0.8171, "learning_rate": 1.9815777855020818e-05, "epoch": 1.5504096900605628, "percentage": 15.51, "elapsed_time": "10:43:17", "remaining_time": "2 days, 10:24:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2730, "total_steps": 17540, "loss": 0.8145, "learning_rate": 1.9811956050652803e-05, "epoch": 1.5561097256857854, "percentage": 15.56, "elapsed_time": "10:45:36", "remaining_time": "2 days, 10:22:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2740, "total_steps": 17540, "loss": 0.8229, "learning_rate": 1.9808095385550777e-05, "epoch": 1.5618097613110082, "percentage": 15.62, "elapsed_time": "10:48:00", "remaining_time": "2 days, 10:20:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2750, "total_steps": 17540, "loss": 0.8166, "learning_rate": 1.98041958750051e-05, "epoch": 1.5675097969362308, "percentage": 15.68, "elapsed_time": "10:50:24", "remaining_time": "2 days, 10:18:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2760, "total_steps": 17540, "loss": 0.8113, "learning_rate": 1.980025753445997e-05, "epoch": 1.5732098325614534, "percentage": 15.74, "elapsed_time": "10:52:43", "remaining_time": "2 days, 10:15:25", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2770, "total_steps": 17540, "loss": 0.818, "learning_rate": 1.979628037951338e-05, "epoch": 1.5789098681866762, "percentage": 15.79, "elapsed_time": "10:55:05", "remaining_time": "2 days, 10:13:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2780, "total_steps": 17540, "loss": 0.8144, "learning_rate": 1.9792264425917048e-05, "epoch": 1.5846099038118988, "percentage": 15.85, "elapsed_time": "10:57:27", "remaining_time": "2 days, 10:10:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2790, "total_steps": 17540, "loss": 0.8135, "learning_rate": 1.9788209689576356e-05, "epoch": 1.5903099394371214, "percentage": 15.91, "elapsed_time": "10:59:51", "remaining_time": "2 days, 10:08:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2800, "total_steps": 17540, "loss": 0.8125, "learning_rate": 1.9784116186550282e-05, "epoch": 1.5960099750623442, "percentage": 15.96, "elapsed_time": "11:02:17", "remaining_time": "2 days, 10:06:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2810, "total_steps": 17540, "loss": 0.8142, "learning_rate": 1.977998393305135e-05, "epoch": 1.6017100106875668, "percentage": 16.02, "elapsed_time": "11:04:38", "remaining_time": "2 days, 10:04:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2820, "total_steps": 17540, "loss": 0.8226, "learning_rate": 1.977581294544555e-05, "epoch": 1.6074100463127894, "percentage": 16.08, "elapsed_time": "11:06:59", "remaining_time": "2 days, 10:01:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2830, "total_steps": 17540, "loss": 0.8222, "learning_rate": 1.9771603240252287e-05, "epoch": 1.6131100819380122, "percentage": 16.13, "elapsed_time": "11:09:20", "remaining_time": "2 days, 9:59:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2840, "total_steps": 17540, "loss": 0.7992, "learning_rate": 1.97673548341443e-05, "epoch": 1.6188101175632348, "percentage": 16.19, "elapsed_time": "11:11:42", "remaining_time": "2 days, 9:56:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2850, "total_steps": 17540, "loss": 0.8145, "learning_rate": 1.9763067743947618e-05, "epoch": 1.6245101531884574, "percentage": 16.25, "elapsed_time": "11:14:03", "remaining_time": "2 days, 9:54:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2860, "total_steps": 17540, "loss": 0.8206, "learning_rate": 1.9758741986641466e-05, "epoch": 1.6302101888136802, "percentage": 16.31, "elapsed_time": "11:16:28", "remaining_time": "2 days, 9:52:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2870, "total_steps": 17540, "loss": 0.8108, "learning_rate": 1.9754377579358222e-05, "epoch": 1.6359102244389028, "percentage": 16.36, "elapsed_time": "11:18:50", "remaining_time": "2 days, 9:49:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2880, "total_steps": 17540, "loss": 0.8131, "learning_rate": 1.974997453938333e-05, "epoch": 1.6416102600641254, "percentage": 16.42, "elapsed_time": "11:21:09", "remaining_time": "2 days, 9:47:18", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2890, "total_steps": 17540, "loss": 0.8231, "learning_rate": 1.974553288415525e-05, "epoch": 1.6473102956893482, "percentage": 16.48, "elapsed_time": "11:23:25", "remaining_time": "2 days, 9:44:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2900, "total_steps": 17540, "loss": 0.8266, "learning_rate": 1.974105263126538e-05, "epoch": 1.6530103313145708, "percentage": 16.53, "elapsed_time": "11:25:53", "remaining_time": "2 days, 9:42:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2910, "total_steps": 17540, "loss": 0.8157, "learning_rate": 1.9736533798457976e-05, "epoch": 1.6587103669397933, "percentage": 16.59, "elapsed_time": "11:28:13", "remaining_time": "2 days, 9:40:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2920, "total_steps": 17540, "loss": 0.813, "learning_rate": 1.9731976403630096e-05, "epoch": 1.6644104025650162, "percentage": 16.65, "elapsed_time": "11:30:35", "remaining_time": "2 days, 9:37:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2930, "total_steps": 17540, "loss": 0.8019, "learning_rate": 1.972738046483153e-05, "epoch": 1.6701104381902387, "percentage": 16.7, "elapsed_time": "11:32:59", "remaining_time": "2 days, 9:35:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2940, "total_steps": 17540, "loss": 0.816, "learning_rate": 1.972274600026472e-05, "epoch": 1.6758104738154613, "percentage": 16.76, "elapsed_time": "11:35:23", "remaining_time": "2 days, 9:33:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2950, "total_steps": 17540, "loss": 0.8182, "learning_rate": 1.9718073028284686e-05, "epoch": 1.6815105094406841, "percentage": 16.82, "elapsed_time": "11:37:44", "remaining_time": "2 days, 9:30:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2960, "total_steps": 17540, "loss": 0.8171, "learning_rate": 1.971336156739897e-05, "epoch": 1.6872105450659065, "percentage": 16.88, "elapsed_time": "11:40:05", "remaining_time": "2 days, 9:28:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2970, "total_steps": 17540, "loss": 0.8136, "learning_rate": 1.9708611636267538e-05, "epoch": 1.6929105806911293, "percentage": 16.93, "elapsed_time": "11:42:30", "remaining_time": "2 days, 9:26:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2980, "total_steps": 17540, "loss": 0.8137, "learning_rate": 1.9703823253702728e-05, "epoch": 1.6986106163163521, "percentage": 16.99, "elapsed_time": "11:44:55", "remaining_time": "2 days, 9:24:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 2990, "total_steps": 17540, "loss": 0.8145, "learning_rate": 1.9698996438669163e-05, "epoch": 1.7043106519415745, "percentage": 17.05, "elapsed_time": "11:47:15", "remaining_time": "2 days, 9:21:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3000, "total_steps": 17540, "loss": 0.8183, "learning_rate": 1.969413121028368e-05, "epoch": 1.7100106875667973, "percentage": 17.1, "elapsed_time": "11:49:36", "remaining_time": "2 days, 9:19:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3010, "total_steps": 17540, "loss": 0.8097, "learning_rate": 1.9689227587815263e-05, "epoch": 1.7157107231920201, "percentage": 17.16, "elapsed_time": "11:51:58", "remaining_time": "2 days, 9:16:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3020, "total_steps": 17540, "loss": 0.8078, "learning_rate": 1.968428559068494e-05, "epoch": 1.7214107588172425, "percentage": 17.22, "elapsed_time": "11:54:16", "remaining_time": "2 days, 9:14:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3030, "total_steps": 17540, "loss": 0.8117, "learning_rate": 1.967930523846574e-05, "epoch": 1.7271107944424653, "percentage": 17.27, "elapsed_time": "11:56:38", "remaining_time": "2 days, 9:11:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3040, "total_steps": 17540, "loss": 0.8007, "learning_rate": 1.9674286550882593e-05, "epoch": 1.7328108300676879, "percentage": 17.33, "elapsed_time": "11:59:00", "remaining_time": "2 days, 9:09:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3050, "total_steps": 17540, "loss": 0.8103, "learning_rate": 1.966922954781225e-05, "epoch": 1.7385108656929105, "percentage": 17.39, "elapsed_time": "12:01:24", "remaining_time": "2 days, 9:07:18", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3060, "total_steps": 17540, "loss": 0.8119, "learning_rate": 1.9664134249283226e-05, "epoch": 1.7442109013181333, "percentage": 17.45, "elapsed_time": "12:03:47", "remaining_time": "2 days, 9:05:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3070, "total_steps": 17540, "loss": 0.8055, "learning_rate": 1.96590006754757e-05, "epoch": 1.7499109369433559, "percentage": 17.5, "elapsed_time": "12:06:09", "remaining_time": "2 days, 9:02:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3080, "total_steps": 17540, "loss": 0.8093, "learning_rate": 1.9653828846721447e-05, "epoch": 1.7556109725685785, "percentage": 17.56, "elapsed_time": "12:08:25", "remaining_time": "2 days, 8:59:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3090, "total_steps": 17540, "loss": 0.805, "learning_rate": 1.964861878350374e-05, "epoch": 1.7613110081938013, "percentage": 17.62, "elapsed_time": "12:10:42", "remaining_time": "2 days, 8:57:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3100, "total_steps": 17540, "loss": 0.8012, "learning_rate": 1.96433705064573e-05, "epoch": 1.7670110438190239, "percentage": 17.67, "elapsed_time": "12:13:04", "remaining_time": "2 days, 8:54:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3110, "total_steps": 17540, "loss": 0.8117, "learning_rate": 1.963808403636818e-05, "epoch": 1.7727110794442464, "percentage": 17.73, "elapsed_time": "12:15:26", "remaining_time": "2 days, 8:52:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3120, "total_steps": 17540, "loss": 0.8053, "learning_rate": 1.9632759394173705e-05, "epoch": 1.7784111150694693, "percentage": 17.79, "elapsed_time": "12:17:47", "remaining_time": "2 days, 8:49:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3130, "total_steps": 17540, "loss": 0.8116, "learning_rate": 1.962739660096239e-05, "epoch": 1.7841111506946918, "percentage": 17.84, "elapsed_time": "12:20:18", "remaining_time": "2 days, 8:48:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3140, "total_steps": 17540, "loss": 0.8076, "learning_rate": 1.9621995677973827e-05, "epoch": 1.7898111863199144, "percentage": 17.9, "elapsed_time": "12:22:39", "remaining_time": "2 days, 8:45:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3150, "total_steps": 17540, "loss": 0.8129, "learning_rate": 1.9616556646598647e-05, "epoch": 1.7955112219451372, "percentage": 17.96, "elapsed_time": "12:25:01", "remaining_time": "2 days, 8:43:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3160, "total_steps": 17540, "loss": 0.7991, "learning_rate": 1.9611079528378395e-05, "epoch": 1.8012112575703598, "percentage": 18.02, "elapsed_time": "12:27:20", "remaining_time": "2 days, 8:40:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3170, "total_steps": 17540, "loss": 0.7973, "learning_rate": 1.9605564345005473e-05, "epoch": 1.8069112931955824, "percentage": 18.07, "elapsed_time": "12:29:49", "remaining_time": "2 days, 8:39:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3180, "total_steps": 17540, "loss": 0.7968, "learning_rate": 1.9600011118323034e-05, "epoch": 1.8126113288208052, "percentage": 18.13, "elapsed_time": "12:32:06", "remaining_time": "2 days, 8:36:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3190, "total_steps": 17540, "loss": 0.7988, "learning_rate": 1.9594419870324902e-05, "epoch": 1.8183113644460278, "percentage": 18.19, "elapsed_time": "12:34:29", "remaining_time": "2 days, 8:33:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3200, "total_steps": 17540, "loss": 0.8106, "learning_rate": 1.958879062315549e-05, "epoch": 1.8240114000712504, "percentage": 18.24, "elapsed_time": "12:36:54", "remaining_time": "2 days, 8:31:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3210, "total_steps": 17540, "loss": 0.806, "learning_rate": 1.958312339910971e-05, "epoch": 1.8297114356964732, "percentage": 18.3, "elapsed_time": "12:39:12", "remaining_time": "2 days, 8:29:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3220, "total_steps": 17540, "loss": 0.7976, "learning_rate": 1.957741822063288e-05, "epoch": 1.8354114713216958, "percentage": 18.36, "elapsed_time": "12:41:35", "remaining_time": "2 days, 8:26:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3230, "total_steps": 17540, "loss": 0.7943, "learning_rate": 1.9571675110320643e-05, "epoch": 1.8411115069469184, "percentage": 18.42, "elapsed_time": "12:43:56", "remaining_time": "2 days, 8:24:32", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3240, "total_steps": 17540, "loss": 0.8021, "learning_rate": 1.9565894090918865e-05, "epoch": 1.8468115425721412, "percentage": 18.47, "elapsed_time": "12:46:16", "remaining_time": "2 days, 8:22:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3250, "total_steps": 17540, "loss": 0.802, "learning_rate": 1.956007518532356e-05, "epoch": 1.8525115781973638, "percentage": 18.53, "elapsed_time": "12:48:39", "remaining_time": "2 days, 8:19:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3260, "total_steps": 17540, "loss": 0.8038, "learning_rate": 1.9554218416580787e-05, "epoch": 1.8582116138225864, "percentage": 18.59, "elapsed_time": "12:51:06", "remaining_time": "2 days, 8:17:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3270, "total_steps": 17540, "loss": 0.8009, "learning_rate": 1.9548323807886568e-05, "epoch": 1.8639116494478092, "percentage": 18.64, "elapsed_time": "12:53:32", "remaining_time": "2 days, 8:15:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3280, "total_steps": 17540, "loss": 0.7997, "learning_rate": 1.954239138258679e-05, "epoch": 1.8696116850730315, "percentage": 18.7, "elapsed_time": "12:55:53", "remaining_time": "2 days, 8:13:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3290, "total_steps": 17540, "loss": 0.8007, "learning_rate": 1.9536421164177115e-05, "epoch": 1.8753117206982544, "percentage": 18.76, "elapsed_time": "12:58:16", "remaining_time": "2 days, 8:10:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3300, "total_steps": 17540, "loss": 0.8025, "learning_rate": 1.953041317630289e-05, "epoch": 1.8810117563234772, "percentage": 18.81, "elapsed_time": "13:00:39", "remaining_time": "2 days, 8:08:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3310, "total_steps": 17540, "loss": 0.7985, "learning_rate": 1.9524367442759038e-05, "epoch": 1.8867117919486995, "percentage": 18.87, "elapsed_time": "13:03:01", "remaining_time": "2 days, 8:06:16", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3320, "total_steps": 17540, "loss": 0.7947, "learning_rate": 1.951828398748999e-05, "epoch": 1.8924118275739223, "percentage": 18.93, "elapsed_time": "13:05:24", "remaining_time": "2 days, 8:03:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3330, "total_steps": 17540, "loss": 0.7969, "learning_rate": 1.951216283458957e-05, "epoch": 1.8981118631991452, "percentage": 18.99, "elapsed_time": "13:07:42", "remaining_time": "2 days, 8:01:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3340, "total_steps": 17540, "loss": 0.7985, "learning_rate": 1.95060040083009e-05, "epoch": 1.9038118988243675, "percentage": 19.04, "elapsed_time": "13:10:01", "remaining_time": "2 days, 7:58:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3350, "total_steps": 17540, "loss": 0.795, "learning_rate": 1.9499807533016314e-05, "epoch": 1.9095119344495903, "percentage": 19.1, "elapsed_time": "13:12:19", "remaining_time": "2 days, 7:56:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3360, "total_steps": 17540, "loss": 0.7978, "learning_rate": 1.9493573433277263e-05, "epoch": 1.915211970074813, "percentage": 19.16, "elapsed_time": "13:14:38", "remaining_time": "2 days, 7:53:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3370, "total_steps": 17540, "loss": 0.8048, "learning_rate": 1.9487301733774205e-05, "epoch": 1.9209120057000355, "percentage": 19.21, "elapsed_time": "13:17:00", "remaining_time": "2 days, 7:51:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3380, "total_steps": 17540, "loss": 0.8002, "learning_rate": 1.9480992459346506e-05, "epoch": 1.9266120413252583, "percentage": 19.27, "elapsed_time": "13:19:17", "remaining_time": "2 days, 7:48:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3390, "total_steps": 17540, "loss": 0.8063, "learning_rate": 1.9474645634982363e-05, "epoch": 1.932312076950481, "percentage": 19.33, "elapsed_time": "13:21:36", "remaining_time": "2 days, 7:45:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3400, "total_steps": 17540, "loss": 0.8002, "learning_rate": 1.9468261285818686e-05, "epoch": 1.9380121125757035, "percentage": 19.38, "elapsed_time": "13:24:01", "remaining_time": "2 days, 7:43:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3410, "total_steps": 17540, "loss": 0.7874, "learning_rate": 1.9461839437141003e-05, "epoch": 1.9437121482009263, "percentage": 19.44, "elapsed_time": "13:26:23", "remaining_time": "2 days, 7:41:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3420, "total_steps": 17540, "loss": 0.7924, "learning_rate": 1.945538011438336e-05, "epoch": 1.949412183826149, "percentage": 19.5, "elapsed_time": "13:28:48", "remaining_time": "2 days, 7:39:18", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3430, "total_steps": 17540, "loss": 0.8058, "learning_rate": 1.9448883343128222e-05, "epoch": 1.9551122194513715, "percentage": 19.56, "elapsed_time": "13:31:09", "remaining_time": "2 days, 7:36:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3440, "total_steps": 17540, "loss": 0.7957, "learning_rate": 1.944234914910637e-05, "epoch": 1.9608122550765943, "percentage": 19.61, "elapsed_time": "13:33:37", "remaining_time": "2 days, 7:34:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3450, "total_steps": 17540, "loss": 0.7956, "learning_rate": 1.9435777558196804e-05, "epoch": 1.9665122907018169, "percentage": 19.67, "elapsed_time": "13:35:57", "remaining_time": "2 days, 7:32:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3460, "total_steps": 17540, "loss": 0.8089, "learning_rate": 1.9429168596426635e-05, "epoch": 1.9722123263270395, "percentage": 19.73, "elapsed_time": "13:38:21", "remaining_time": "2 days, 7:30:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3470, "total_steps": 17540, "loss": 0.7965, "learning_rate": 1.9422522289970968e-05, "epoch": 1.9779123619522623, "percentage": 19.78, "elapsed_time": "13:40:45", "remaining_time": "2 days, 7:27:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3480, "total_steps": 17540, "loss": 0.793, "learning_rate": 1.9415838665152837e-05, "epoch": 1.9836123975774849, "percentage": 19.84, "elapsed_time": "13:43:04", "remaining_time": "2 days, 7:25:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3490, "total_steps": 17540, "loss": 0.806, "learning_rate": 1.940911774844307e-05, "epoch": 1.9893124332027075, "percentage": 19.9, "elapsed_time": "13:45:26", "remaining_time": "2 days, 7:23:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3500, "total_steps": 17540, "loss": 0.803, "learning_rate": 1.9402359566460175e-05, "epoch": 1.9950124688279303, "percentage": 19.95, "elapsed_time": "13:47:45", "remaining_time": "2 days, 7:20:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3510, "total_steps": 17540, "loss": 0.7912, "learning_rate": 1.9395564145970275e-05, "epoch": 2.0007125044531526, "percentage": 20.01, "elapsed_time": "13:50:07", "remaining_time": "2 days, 7:18:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3520, "total_steps": 17540, "loss": 0.772, "learning_rate": 1.9388731513886962e-05, "epoch": 2.0064125400783754, "percentage": 20.07, "elapsed_time": "13:52:28", "remaining_time": "2 days, 7:15:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3530, "total_steps": 17540, "loss": 0.7845, "learning_rate": 1.9381861697271208e-05, "epoch": 2.0121125757035982, "percentage": 20.13, "elapsed_time": "13:54:51", "remaining_time": "2 days, 7:13:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3540, "total_steps": 17540, "loss": 0.7835, "learning_rate": 1.9374954723331267e-05, "epoch": 2.0178126113288206, "percentage": 20.18, "elapsed_time": "13:57:13", "remaining_time": "2 days, 7:11:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3550, "total_steps": 17540, "loss": 0.7776, "learning_rate": 1.9368010619422542e-05, "epoch": 2.0235126469540434, "percentage": 20.24, "elapsed_time": "13:59:31", "remaining_time": "2 days, 7:08:25", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3560, "total_steps": 17540, "loss": 0.7837, "learning_rate": 1.93610294130475e-05, "epoch": 2.0292126825792662, "percentage": 20.3, "elapsed_time": "14:01:53", "remaining_time": "2 days, 7:06:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3570, "total_steps": 17540, "loss": 0.7818, "learning_rate": 1.9354011131855554e-05, "epoch": 2.0349127182044886, "percentage": 20.35, "elapsed_time": "14:04:13", "remaining_time": "2 days, 7:03:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3580, "total_steps": 17540, "loss": 0.779, "learning_rate": 1.934695580364295e-05, "epoch": 2.0406127538297114, "percentage": 20.41, "elapsed_time": "14:06:34", "remaining_time": "2 days, 7:01:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3590, "total_steps": 17540, "loss": 0.7794, "learning_rate": 1.9339863456352658e-05, "epoch": 2.0463127894549342, "percentage": 20.47, "elapsed_time": "14:08:47", "remaining_time": "2 days, 6:58:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3600, "total_steps": 17540, "loss": 0.7741, "learning_rate": 1.9332734118074274e-05, "epoch": 2.0520128250801566, "percentage": 20.52, "elapsed_time": "14:11:08", "remaining_time": "2 days, 6:55:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3610, "total_steps": 17540, "loss": 0.7891, "learning_rate": 1.9325567817043888e-05, "epoch": 2.0577128607053794, "percentage": 20.58, "elapsed_time": "14:13:32", "remaining_time": "2 days, 6:53:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3620, "total_steps": 17540, "loss": 0.7745, "learning_rate": 1.931836458164399e-05, "epoch": 2.063412896330602, "percentage": 20.64, "elapsed_time": "14:15:51", "remaining_time": "2 days, 6:51:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3630, "total_steps": 17540, "loss": 0.7744, "learning_rate": 1.9311124440403347e-05, "epoch": 2.0691129319558246, "percentage": 20.7, "elapsed_time": "14:18:14", "remaining_time": "2 days, 6:48:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3640, "total_steps": 17540, "loss": 0.7846, "learning_rate": 1.9303847421996895e-05, "epoch": 2.0748129675810474, "percentage": 20.75, "elapsed_time": "14:20:40", "remaining_time": "2 days, 6:46:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3650, "total_steps": 17540, "loss": 0.7767, "learning_rate": 1.929653355524562e-05, "epoch": 2.08051300320627, "percentage": 20.81, "elapsed_time": "14:23:01", "remaining_time": "2 days, 6:44:12", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3660, "total_steps": 17540, "loss": 0.7786, "learning_rate": 1.928918286911645e-05, "epoch": 2.0862130388314926, "percentage": 20.87, "elapsed_time": "14:25:21", "remaining_time": "2 days, 6:41:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3670, "total_steps": 17540, "loss": 0.788, "learning_rate": 1.9281795392722146e-05, "epoch": 2.0919130744567154, "percentage": 20.92, "elapsed_time": "14:27:43", "remaining_time": "2 days, 6:39:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3680, "total_steps": 17540, "loss": 0.7828, "learning_rate": 1.9274371155321167e-05, "epoch": 2.097613110081938, "percentage": 20.98, "elapsed_time": "14:30:08", "remaining_time": "2 days, 6:37:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3690, "total_steps": 17540, "loss": 0.784, "learning_rate": 1.9266910186317566e-05, "epoch": 2.1033131457071605, "percentage": 21.04, "elapsed_time": "14:32:31", "remaining_time": "2 days, 6:34:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3700, "total_steps": 17540, "loss": 0.7681, "learning_rate": 1.925941251526088e-05, "epoch": 2.1090131813323834, "percentage": 21.09, "elapsed_time": "14:34:54", "remaining_time": "2 days, 6:32:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3710, "total_steps": 17540, "loss": 0.7695, "learning_rate": 1.9251878171846008e-05, "epoch": 2.114713216957606, "percentage": 21.15, "elapsed_time": "14:37:16", "remaining_time": "2 days, 6:30:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3720, "total_steps": 17540, "loss": 0.7841, "learning_rate": 1.924430718591308e-05, "epoch": 2.1204132525828285, "percentage": 21.21, "elapsed_time": "14:39:43", "remaining_time": "2 days, 6:28:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3730, "total_steps": 17540, "loss": 0.7768, "learning_rate": 1.9236699587447363e-05, "epoch": 2.1261132882080513, "percentage": 21.27, "elapsed_time": "14:42:07", "remaining_time": "2 days, 6:25:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3740, "total_steps": 17540, "loss": 0.7785, "learning_rate": 1.922905540657912e-05, "epoch": 2.131813323833274, "percentage": 21.32, "elapsed_time": "14:44:40", "remaining_time": "2 days, 6:24:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3750, "total_steps": 17540, "loss": 0.7761, "learning_rate": 1.922137467358351e-05, "epoch": 2.1375133594584965, "percentage": 21.38, "elapsed_time": "14:46:56", "remaining_time": "2 days, 6:21:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3760, "total_steps": 17540, "loss": 0.7856, "learning_rate": 1.921365741888045e-05, "epoch": 2.1432133950837193, "percentage": 21.44, "elapsed_time": "14:49:19", "remaining_time": "2 days, 6:19:16", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3770, "total_steps": 17540, "loss": 0.7807, "learning_rate": 1.920590367303451e-05, "epoch": 2.1489134307089417, "percentage": 21.49, "elapsed_time": "14:51:41", "remaining_time": "2 days, 6:16:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3780, "total_steps": 17540, "loss": 0.7772, "learning_rate": 1.9198113466754775e-05, "epoch": 2.1546134663341645, "percentage": 21.55, "elapsed_time": "14:54:01", "remaining_time": "2 days, 6:14:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3790, "total_steps": 17540, "loss": 0.7753, "learning_rate": 1.9190286830894744e-05, "epoch": 2.1603135019593873, "percentage": 21.61, "elapsed_time": "14:56:22", "remaining_time": "2 days, 6:12:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3800, "total_steps": 17540, "loss": 0.782, "learning_rate": 1.9182423796452196e-05, "epoch": 2.16601353758461, "percentage": 21.66, "elapsed_time": "14:58:41", "remaining_time": "2 days, 6:09:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3810, "total_steps": 17540, "loss": 0.7792, "learning_rate": 1.9174524394569058e-05, "epoch": 2.1717135732098325, "percentage": 21.72, "elapsed_time": "15:01:02", "remaining_time": "2 days, 6:07:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3820, "total_steps": 17540, "loss": 0.7726, "learning_rate": 1.9166588656531305e-05, "epoch": 2.1774136088350553, "percentage": 21.78, "elapsed_time": "15:03:23", "remaining_time": "2 days, 6:04:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3830, "total_steps": 17540, "loss": 0.7743, "learning_rate": 1.9158616613768812e-05, "epoch": 2.1831136444602777, "percentage": 21.84, "elapsed_time": "15:05:45", "remaining_time": "2 days, 6:02:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3840, "total_steps": 17540, "loss": 0.7771, "learning_rate": 1.915060829785525e-05, "epoch": 2.1888136800855005, "percentage": 21.89, "elapsed_time": "15:08:09", "remaining_time": "2 days, 6:00:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3850, "total_steps": 17540, "loss": 0.778, "learning_rate": 1.914256374050795e-05, "epoch": 2.1945137157107233, "percentage": 21.95, "elapsed_time": "15:10:31", "remaining_time": "2 days, 5:57:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3860, "total_steps": 17540, "loss": 0.7782, "learning_rate": 1.9134482973587773e-05, "epoch": 2.2002137513359457, "percentage": 22.01, "elapsed_time": "15:12:55", "remaining_time": "2 days, 5:55:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3870, "total_steps": 17540, "loss": 0.7771, "learning_rate": 1.912636602909899e-05, "epoch": 2.2059137869611685, "percentage": 22.06, "elapsed_time": "15:15:13", "remaining_time": "2 days, 5:52:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3880, "total_steps": 17540, "loss": 0.7839, "learning_rate": 1.9118212939189165e-05, "epoch": 2.2116138225863913, "percentage": 22.12, "elapsed_time": "15:17:38", "remaining_time": "2 days, 5:50:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3890, "total_steps": 17540, "loss": 0.7681, "learning_rate": 1.9110023736149007e-05, "epoch": 2.2173138582116136, "percentage": 22.18, "elapsed_time": "15:20:00", "remaining_time": "2 days, 5:48:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3900, "total_steps": 17540, "loss": 0.779, "learning_rate": 1.910179845241226e-05, "epoch": 2.2230138938368365, "percentage": 22.23, "elapsed_time": "15:22:17", "remaining_time": "2 days, 5:45:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3910, "total_steps": 17540, "loss": 0.7811, "learning_rate": 1.9093537120555564e-05, "epoch": 2.2287139294620593, "percentage": 22.29, "elapsed_time": "15:24:34", "remaining_time": "2 days, 5:42:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3920, "total_steps": 17540, "loss": 0.7859, "learning_rate": 1.9085239773298324e-05, "epoch": 2.2344139650872816, "percentage": 22.35, "elapsed_time": "15:26:56", "remaining_time": "2 days, 5:40:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3930, "total_steps": 17540, "loss": 0.7673, "learning_rate": 1.9076906443502602e-05, "epoch": 2.2401140007125044, "percentage": 22.41, "elapsed_time": "15:29:20", "remaining_time": "2 days, 5:38:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3940, "total_steps": 17540, "loss": 0.7844, "learning_rate": 1.906853716417295e-05, "epoch": 2.2458140363377272, "percentage": 22.46, "elapsed_time": "15:31:41", "remaining_time": "2 days, 5:35:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3950, "total_steps": 17540, "loss": 0.7751, "learning_rate": 1.906013196845631e-05, "epoch": 2.2515140719629496, "percentage": 22.52, "elapsed_time": "15:34:01", "remaining_time": "2 days, 5:33:32", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3960, "total_steps": 17540, "loss": 0.7792, "learning_rate": 1.9051690889641884e-05, "epoch": 2.2572141075881724, "percentage": 22.58, "elapsed_time": "15:36:24", "remaining_time": "2 days, 5:31:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3970, "total_steps": 17540, "loss": 0.7707, "learning_rate": 1.904321396116097e-05, "epoch": 2.2629141432133952, "percentage": 22.63, "elapsed_time": "15:38:41", "remaining_time": "2 days, 5:28:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3980, "total_steps": 17540, "loss": 0.7848, "learning_rate": 1.903470121658686e-05, "epoch": 2.2686141788386176, "percentage": 22.69, "elapsed_time": "15:40:58", "remaining_time": "2 days, 5:25:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 3990, "total_steps": 17540, "loss": 0.7766, "learning_rate": 1.90261526896347e-05, "epoch": 2.2743142144638404, "percentage": 22.75, "elapsed_time": "15:43:24", "remaining_time": "2 days, 5:23:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4000, "total_steps": 17540, "loss": 0.7793, "learning_rate": 1.901756841416135e-05, "epoch": 2.280014250089063, "percentage": 22.81, "elapsed_time": "15:45:47", "remaining_time": "2 days, 5:21:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4010, "total_steps": 17540, "loss": 0.7686, "learning_rate": 1.900894842416525e-05, "epoch": 2.2857142857142856, "percentage": 22.86, "elapsed_time": "15:48:08", "remaining_time": "2 days, 5:19:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4020, "total_steps": 17540, "loss": 0.7725, "learning_rate": 1.9000292753786305e-05, "epoch": 2.2914143213395084, "percentage": 22.92, "elapsed_time": "15:50:28", "remaining_time": "2 days, 5:16:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4030, "total_steps": 17540, "loss": 0.7773, "learning_rate": 1.8991601437305715e-05, "epoch": 2.297114356964731, "percentage": 22.98, "elapsed_time": "15:52:52", "remaining_time": "2 days, 5:14:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4040, "total_steps": 17540, "loss": 0.7754, "learning_rate": 1.8982874509145866e-05, "epoch": 2.3028143925899536, "percentage": 23.03, "elapsed_time": "15:55:18", "remaining_time": "2 days, 5:12:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4050, "total_steps": 17540, "loss": 0.7761, "learning_rate": 1.8974112003870186e-05, "epoch": 2.3085144282151764, "percentage": 23.09, "elapsed_time": "15:57:39", "remaining_time": "2 days, 5:09:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4060, "total_steps": 17540, "loss": 0.7704, "learning_rate": 1.896531395618301e-05, "epoch": 2.314214463840399, "percentage": 23.15, "elapsed_time": "16:00:06", "remaining_time": "2 days, 5:07:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4070, "total_steps": 17540, "loss": 0.7787, "learning_rate": 1.8956480400929438e-05, "epoch": 2.3199144994656216, "percentage": 23.2, "elapsed_time": "16:02:32", "remaining_time": "2 days, 5:05:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4080, "total_steps": 17540, "loss": 0.7753, "learning_rate": 1.8947611373095196e-05, "epoch": 2.3256145350908444, "percentage": 23.26, "elapsed_time": "16:04:51", "remaining_time": "2 days, 5:03:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4090, "total_steps": 17540, "loss": 0.7809, "learning_rate": 1.893870690780651e-05, "epoch": 2.331314570716067, "percentage": 23.32, "elapsed_time": "16:07:10", "remaining_time": "2 days, 5:00:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4100, "total_steps": 17540, "loss": 0.7716, "learning_rate": 1.892976704032994e-05, "epoch": 2.3370146063412895, "percentage": 23.38, "elapsed_time": "16:09:36", "remaining_time": "2 days, 4:58:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4110, "total_steps": 17540, "loss": 0.7754, "learning_rate": 1.892079180607229e-05, "epoch": 2.3427146419665124, "percentage": 23.43, "elapsed_time": "16:12:03", "remaining_time": "2 days, 4:56:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4120, "total_steps": 17540, "loss": 0.7761, "learning_rate": 1.8911781240580402e-05, "epoch": 2.3484146775917347, "percentage": 23.49, "elapsed_time": "16:14:20", "remaining_time": "2 days, 4:53:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4130, "total_steps": 17540, "loss": 0.7685, "learning_rate": 1.8902735379541064e-05, "epoch": 2.3541147132169575, "percentage": 23.55, "elapsed_time": "16:16:44", "remaining_time": "2 days, 4:51:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4140, "total_steps": 17540, "loss": 0.7799, "learning_rate": 1.889365425878086e-05, "epoch": 2.3598147488421803, "percentage": 23.6, "elapsed_time": "16:19:03", "remaining_time": "2 days, 4:48:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4150, "total_steps": 17540, "loss": 0.7735, "learning_rate": 1.888453791426601e-05, "epoch": 2.365514784467403, "percentage": 23.66, "elapsed_time": "16:21:25", "remaining_time": "2 days, 4:46:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4160, "total_steps": 17540, "loss": 0.7718, "learning_rate": 1.8875386382102245e-05, "epoch": 2.3712148200926255, "percentage": 23.72, "elapsed_time": "16:23:44", "remaining_time": "2 days, 4:44:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4170, "total_steps": 17540, "loss": 0.7788, "learning_rate": 1.8866199698534658e-05, "epoch": 2.3769148557178483, "percentage": 23.77, "elapsed_time": "16:26:03", "remaining_time": "2 days, 4:41:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4180, "total_steps": 17540, "loss": 0.7627, "learning_rate": 1.885697789994756e-05, "epoch": 2.3826148913430707, "percentage": 23.83, "elapsed_time": "16:28:27", "remaining_time": "2 days, 4:39:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4190, "total_steps": 17540, "loss": 0.7793, "learning_rate": 1.8847721022864336e-05, "epoch": 2.3883149269682935, "percentage": 23.89, "elapsed_time": "16:30:52", "remaining_time": "2 days, 4:37:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4200, "total_steps": 17540, "loss": 0.7683, "learning_rate": 1.883842910394731e-05, "epoch": 2.3940149625935163, "percentage": 23.95, "elapsed_time": "16:33:07", "remaining_time": "2 days, 4:34:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4210, "total_steps": 17540, "loss": 0.7831, "learning_rate": 1.8829102179997572e-05, "epoch": 2.3997149982187387, "percentage": 24.0, "elapsed_time": "16:35:32", "remaining_time": "2 days, 4:32:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4220, "total_steps": 17540, "loss": 0.7695, "learning_rate": 1.8819740287954876e-05, "epoch": 2.4054150338439615, "percentage": 24.06, "elapsed_time": "16:37:54", "remaining_time": "2 days, 4:29:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4230, "total_steps": 17540, "loss": 0.7665, "learning_rate": 1.881034346489744e-05, "epoch": 2.4111150694691843, "percentage": 24.12, "elapsed_time": "16:40:11", "remaining_time": "2 days, 4:27:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4240, "total_steps": 17540, "loss": 0.7612, "learning_rate": 1.880091174804186e-05, "epoch": 2.4168151050944067, "percentage": 24.17, "elapsed_time": "16:42:36", "remaining_time": "2 days, 4:24:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4250, "total_steps": 17540, "loss": 0.7766, "learning_rate": 1.8791445174742894e-05, "epoch": 2.4225151407196295, "percentage": 24.23, "elapsed_time": "16:44:58", "remaining_time": "2 days, 4:22:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4260, "total_steps": 17540, "loss": 0.7721, "learning_rate": 1.8781943782493392e-05, "epoch": 2.4282151763448523, "percentage": 24.29, "elapsed_time": "16:47:19", "remaining_time": "2 days, 4:20:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4270, "total_steps": 17540, "loss": 0.7741, "learning_rate": 1.8772407608924067e-05, "epoch": 2.4339152119700747, "percentage": 24.34, "elapsed_time": "16:49:39", "remaining_time": "2 days, 4:17:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4280, "total_steps": 17540, "loss": 0.7789, "learning_rate": 1.8762836691803417e-05, "epoch": 2.4396152475952975, "percentage": 24.4, "elapsed_time": "16:52:01", "remaining_time": "2 days, 4:15:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4290, "total_steps": 17540, "loss": 0.7741, "learning_rate": 1.8753231069037522e-05, "epoch": 2.4453152832205203, "percentage": 24.46, "elapsed_time": "16:54:25", "remaining_time": "2 days, 4:13:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4300, "total_steps": 17540, "loss": 0.7697, "learning_rate": 1.874359077866992e-05, "epoch": 2.4510153188457426, "percentage": 24.52, "elapsed_time": "16:56:50", "remaining_time": "2 days, 4:10:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4310, "total_steps": 17540, "loss": 0.7724, "learning_rate": 1.8733915858881462e-05, "epoch": 2.4567153544709655, "percentage": 24.57, "elapsed_time": "16:59:16", "remaining_time": "2 days, 4:08:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4320, "total_steps": 17540, "loss": 0.7733, "learning_rate": 1.872420634799014e-05, "epoch": 2.4624153900961883, "percentage": 24.63, "elapsed_time": "17:01:38", "remaining_time": "2 days, 4:06:25", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4330, "total_steps": 17540, "loss": 0.7668, "learning_rate": 1.8714462284450948e-05, "epoch": 2.4681154257214106, "percentage": 24.69, "elapsed_time": "17:04:04", "remaining_time": "2 days, 4:04:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4340, "total_steps": 17540, "loss": 0.7758, "learning_rate": 1.8704683706855728e-05, "epoch": 2.4738154613466334, "percentage": 24.74, "elapsed_time": "17:06:28", "remaining_time": "2 days, 4:01:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4350, "total_steps": 17540, "loss": 0.7719, "learning_rate": 1.869487065393302e-05, "epoch": 2.4795154969718562, "percentage": 24.8, "elapsed_time": "17:08:49", "remaining_time": "2 days, 3:59:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4360, "total_steps": 17540, "loss": 0.7751, "learning_rate": 1.86850231645479e-05, "epoch": 2.4852155325970786, "percentage": 24.86, "elapsed_time": "17:11:12", "remaining_time": "2 days, 3:57:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4370, "total_steps": 17540, "loss": 0.7736, "learning_rate": 1.8675141277701834e-05, "epoch": 2.4909155682223014, "percentage": 24.91, "elapsed_time": "17:13:30", "remaining_time": "2 days, 3:54:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4380, "total_steps": 17540, "loss": 0.7672, "learning_rate": 1.866522503253252e-05, "epoch": 2.4966156038475242, "percentage": 24.97, "elapsed_time": "17:15:57", "remaining_time": "2 days, 3:52:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4390, "total_steps": 17540, "loss": 0.7691, "learning_rate": 1.8655274468313732e-05, "epoch": 2.5023156394727466, "percentage": 25.03, "elapsed_time": "17:18:19", "remaining_time": "2 days, 3:50:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4400, "total_steps": 17540, "loss": 0.7696, "learning_rate": 1.8645289624455175e-05, "epoch": 2.5080156750979694, "percentage": 25.09, "elapsed_time": "17:20:43", "remaining_time": "2 days, 3:47:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4410, "total_steps": 17540, "loss": 0.7646, "learning_rate": 1.8635270540502307e-05, "epoch": 2.5137157107231918, "percentage": 25.14, "elapsed_time": "17:23:07", "remaining_time": "2 days, 3:45:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4420, "total_steps": 17540, "loss": 0.7711, "learning_rate": 1.8625217256136206e-05, "epoch": 2.5194157463484146, "percentage": 25.2, "elapsed_time": "17:25:30", "remaining_time": "2 days, 3:43:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4430, "total_steps": 17540, "loss": 0.7805, "learning_rate": 1.8615129811173398e-05, "epoch": 2.5251157819736374, "percentage": 25.26, "elapsed_time": "17:27:49", "remaining_time": "2 days, 3:40:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4440, "total_steps": 17540, "loss": 0.7732, "learning_rate": 1.8605008245565704e-05, "epoch": 2.53081581759886, "percentage": 25.31, "elapsed_time": "17:30:08", "remaining_time": "2 days, 3:38:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4450, "total_steps": 17540, "loss": 0.7645, "learning_rate": 1.8594852599400083e-05, "epoch": 2.5365158532240826, "percentage": 25.37, "elapsed_time": "17:32:27", "remaining_time": "2 days, 3:35:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4460, "total_steps": 17540, "loss": 0.7618, "learning_rate": 1.8584662912898464e-05, "epoch": 2.5422158888493054, "percentage": 25.43, "elapsed_time": "17:34:49", "remaining_time": "2 days, 3:33:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4470, "total_steps": 17540, "loss": 0.7721, "learning_rate": 1.857443922641761e-05, "epoch": 2.5479159244745277, "percentage": 25.48, "elapsed_time": "17:37:16", "remaining_time": "2 days, 3:31:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4480, "total_steps": 17540, "loss": 0.7761, "learning_rate": 1.856418158044893e-05, "epoch": 2.5536159600997506, "percentage": 25.54, "elapsed_time": "17:39:39", "remaining_time": "2 days, 3:29:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4490, "total_steps": 17540, "loss": 0.7617, "learning_rate": 1.8553890015618333e-05, "epoch": 2.5593159957249734, "percentage": 25.6, "elapsed_time": "17:41:58", "remaining_time": "2 days, 3:26:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4500, "total_steps": 17540, "loss": 0.7691, "learning_rate": 1.8543564572686072e-05, "epoch": 2.565016031350196, "percentage": 25.66, "elapsed_time": "17:44:23", "remaining_time": "2 days, 3:24:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4510, "total_steps": 17540, "loss": 0.7651, "learning_rate": 1.8533205292546567e-05, "epoch": 2.5707160669754185, "percentage": 25.71, "elapsed_time": "17:46:47", "remaining_time": "2 days, 3:22:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4520, "total_steps": 17540, "loss": 0.7706, "learning_rate": 1.8522812216228254e-05, "epoch": 2.5764161026006414, "percentage": 25.77, "elapsed_time": "17:49:13", "remaining_time": "2 days, 3:19:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4530, "total_steps": 17540, "loss": 0.7778, "learning_rate": 1.851238538489343e-05, "epoch": 2.5821161382258637, "percentage": 25.83, "elapsed_time": "17:51:31", "remaining_time": "2 days, 3:17:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4540, "total_steps": 17540, "loss": 0.7698, "learning_rate": 1.8501924839838062e-05, "epoch": 2.5878161738510865, "percentage": 25.88, "elapsed_time": "17:53:57", "remaining_time": "2 days, 3:15:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4550, "total_steps": 17540, "loss": 0.7605, "learning_rate": 1.8491430622491665e-05, "epoch": 2.5935162094763093, "percentage": 25.94, "elapsed_time": "17:56:19", "remaining_time": "2 days, 3:12:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4560, "total_steps": 17540, "loss": 0.7661, "learning_rate": 1.8480902774417094e-05, "epoch": 2.599216245101532, "percentage": 26.0, "elapsed_time": "17:58:44", "remaining_time": "2 days, 3:10:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4570, "total_steps": 17540, "loss": 0.7619, "learning_rate": 1.8470341337310407e-05, "epoch": 2.6049162807267545, "percentage": 26.05, "elapsed_time": "18:01:08", "remaining_time": "2 days, 3:08:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4580, "total_steps": 17540, "loss": 0.7615, "learning_rate": 1.8459746353000704e-05, "epoch": 2.6106163163519773, "percentage": 26.11, "elapsed_time": "18:03:26", "remaining_time": "2 days, 3:05:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4590, "total_steps": 17540, "loss": 0.7688, "learning_rate": 1.8449117863449932e-05, "epoch": 2.6163163519771997, "percentage": 26.17, "elapsed_time": "18:05:52", "remaining_time": "2 days, 3:03:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4600, "total_steps": 17540, "loss": 0.7682, "learning_rate": 1.843845591075275e-05, "epoch": 2.6220163876024225, "percentage": 26.23, "elapsed_time": "18:08:12", "remaining_time": "2 days, 3:01:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4610, "total_steps": 17540, "loss": 0.7576, "learning_rate": 1.8427760537136342e-05, "epoch": 2.6277164232276453, "percentage": 26.28, "elapsed_time": "18:10:32", "remaining_time": "2 days, 2:58:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4620, "total_steps": 17540, "loss": 0.7655, "learning_rate": 1.8417031784960267e-05, "epoch": 2.6334164588528677, "percentage": 26.34, "elapsed_time": "18:12:56", "remaining_time": "2 days, 2:56:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4630, "total_steps": 17540, "loss": 0.7752, "learning_rate": 1.840626969671627e-05, "epoch": 2.6391164944780905, "percentage": 26.4, "elapsed_time": "18:15:16", "remaining_time": "2 days, 2:53:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4640, "total_steps": 17540, "loss": 0.774, "learning_rate": 1.8395474315028134e-05, "epoch": 2.6448165301033133, "percentage": 26.45, "elapsed_time": "18:17:38", "remaining_time": "2 days, 2:51:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4650, "total_steps": 17540, "loss": 0.7722, "learning_rate": 1.838464568265149e-05, "epoch": 2.6505165657285357, "percentage": 26.51, "elapsed_time": "18:19:58", "remaining_time": "2 days, 2:49:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4660, "total_steps": 17540, "loss": 0.7705, "learning_rate": 1.837378384247368e-05, "epoch": 2.6562166013537585, "percentage": 26.57, "elapsed_time": "18:22:21", "remaining_time": "2 days, 2:46:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4670, "total_steps": 17540, "loss": 0.7633, "learning_rate": 1.8362888837513548e-05, "epoch": 2.6619166369789813, "percentage": 26.62, "elapsed_time": "18:24:42", "remaining_time": "2 days, 2:44:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4680, "total_steps": 17540, "loss": 0.7612, "learning_rate": 1.83519607109213e-05, "epoch": 2.6676166726042037, "percentage": 26.68, "elapsed_time": "18:27:07", "remaining_time": "2 days, 2:42:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4690, "total_steps": 17540, "loss": 0.7627, "learning_rate": 1.834099950597832e-05, "epoch": 2.6733167082294265, "percentage": 26.74, "elapsed_time": "18:29:29", "remaining_time": "2 days, 2:39:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4700, "total_steps": 17540, "loss": 0.7661, "learning_rate": 1.8330005266096992e-05, "epoch": 2.679016743854649, "percentage": 26.8, "elapsed_time": "18:31:50", "remaining_time": "2 days, 2:37:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4710, "total_steps": 17540, "loss": 0.7581, "learning_rate": 1.8318978034820544e-05, "epoch": 2.6847167794798716, "percentage": 26.85, "elapsed_time": "18:34:08", "remaining_time": "2 days, 2:34:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4720, "total_steps": 17540, "loss": 0.7629, "learning_rate": 1.830791785582288e-05, "epoch": 2.6904168151050945, "percentage": 26.91, "elapsed_time": "18:36:30", "remaining_time": "2 days, 2:32:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4730, "total_steps": 17540, "loss": 0.7625, "learning_rate": 1.8296824772908365e-05, "epoch": 2.6961168507303173, "percentage": 26.97, "elapsed_time": "18:38:45", "remaining_time": "2 days, 2:29:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4740, "total_steps": 17540, "loss": 0.7667, "learning_rate": 1.828569883001171e-05, "epoch": 2.7018168863555396, "percentage": 27.02, "elapsed_time": "18:41:08", "remaining_time": "2 days, 2:27:32", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4750, "total_steps": 17540, "loss": 0.7657, "learning_rate": 1.827454007119775e-05, "epoch": 2.7075169219807624, "percentage": 27.08, "elapsed_time": "18:43:34", "remaining_time": "2 days, 2:25:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4760, "total_steps": 17540, "loss": 0.7691, "learning_rate": 1.8263348540661306e-05, "epoch": 2.713216957605985, "percentage": 27.14, "elapsed_time": "18:45:53", "remaining_time": "2 days, 2:22:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4770, "total_steps": 17540, "loss": 0.7635, "learning_rate": 1.8252124282726984e-05, "epoch": 2.7189169932312076, "percentage": 27.19, "elapsed_time": "18:48:14", "remaining_time": "2 days, 2:20:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4780, "total_steps": 17540, "loss": 0.7581, "learning_rate": 1.8240867341849e-05, "epoch": 2.7246170288564304, "percentage": 27.25, "elapsed_time": "18:50:40", "remaining_time": "2 days, 2:18:16", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4790, "total_steps": 17540, "loss": 0.7689, "learning_rate": 1.8229577762611033e-05, "epoch": 2.7303170644816532, "percentage": 27.31, "elapsed_time": "18:53:00", "remaining_time": "2 days, 2:15:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4800, "total_steps": 17540, "loss": 0.7546, "learning_rate": 1.8218255589726007e-05, "epoch": 2.7360171001068756, "percentage": 27.37, "elapsed_time": "18:55:23", "remaining_time": "2 days, 2:13:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4810, "total_steps": 17540, "loss": 0.7674, "learning_rate": 1.820690086803595e-05, "epoch": 2.7417171357320984, "percentage": 27.42, "elapsed_time": "18:57:44", "remaining_time": "2 days, 2:11:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4820, "total_steps": 17540, "loss": 0.7622, "learning_rate": 1.819551364251179e-05, "epoch": 2.7474171713573208, "percentage": 27.48, "elapsed_time": "19:00:05", "remaining_time": "2 days, 2:08:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4830, "total_steps": 17540, "loss": 0.7542, "learning_rate": 1.81840939582532e-05, "epoch": 2.7531172069825436, "percentage": 27.54, "elapsed_time": "19:02:29", "remaining_time": "2 days, 2:06:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4840, "total_steps": 17540, "loss": 0.7626, "learning_rate": 1.8172641860488393e-05, "epoch": 2.7588172426077664, "percentage": 27.59, "elapsed_time": "19:04:53", "remaining_time": "2 days, 2:04:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4850, "total_steps": 17540, "loss": 0.7671, "learning_rate": 1.816115739457397e-05, "epoch": 2.764517278232989, "percentage": 27.65, "elapsed_time": "19:07:12", "remaining_time": "2 days, 2:01:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4860, "total_steps": 17540, "loss": 0.7722, "learning_rate": 1.8149640605994722e-05, "epoch": 2.7702173138582116, "percentage": 27.71, "elapsed_time": "19:09:35", "remaining_time": "2 days, 1:59:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4870, "total_steps": 17540, "loss": 0.7666, "learning_rate": 1.8138091540363453e-05, "epoch": 2.7759173494834344, "percentage": 27.77, "elapsed_time": "19:11:55", "remaining_time": "2 days, 1:56:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4880, "total_steps": 17540, "loss": 0.7553, "learning_rate": 1.8126510243420807e-05, "epoch": 2.7816173851086567, "percentage": 27.82, "elapsed_time": "19:14:10", "remaining_time": "2 days, 1:54:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4890, "total_steps": 17540, "loss": 0.7649, "learning_rate": 1.811489676103508e-05, "epoch": 2.7873174207338796, "percentage": 27.88, "elapsed_time": "19:16:30", "remaining_time": "2 days, 1:51:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4900, "total_steps": 17540, "loss": 0.7632, "learning_rate": 1.8103251139202038e-05, "epoch": 2.7930174563591024, "percentage": 27.94, "elapsed_time": "19:18:52", "remaining_time": "2 days, 1:49:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4910, "total_steps": 17540, "loss": 0.7661, "learning_rate": 1.8091573424044742e-05, "epoch": 2.798717491984325, "percentage": 27.99, "elapsed_time": "19:21:11", "remaining_time": "2 days, 1:46:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4920, "total_steps": 17540, "loss": 0.7709, "learning_rate": 1.8079863661813352e-05, "epoch": 2.8044175276095475, "percentage": 28.05, "elapsed_time": "19:23:31", "remaining_time": "2 days, 1:44:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4930, "total_steps": 17540, "loss": 0.756, "learning_rate": 1.8068121898884955e-05, "epoch": 2.8101175632347704, "percentage": 28.11, "elapsed_time": "19:25:51", "remaining_time": "2 days, 1:42:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4940, "total_steps": 17540, "loss": 0.7537, "learning_rate": 1.8056348181763387e-05, "epoch": 2.8158175988599927, "percentage": 28.16, "elapsed_time": "19:28:13", "remaining_time": "2 days, 1:39:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4950, "total_steps": 17540, "loss": 0.763, "learning_rate": 1.8044542557079032e-05, "epoch": 2.8215176344852155, "percentage": 28.22, "elapsed_time": "19:30:33", "remaining_time": "2 days, 1:37:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4960, "total_steps": 17540, "loss": 0.7667, "learning_rate": 1.8032705071588638e-05, "epoch": 2.8272176701104383, "percentage": 28.28, "elapsed_time": "19:32:58", "remaining_time": "2 days, 1:35:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4970, "total_steps": 17540, "loss": 0.7632, "learning_rate": 1.8020835772175158e-05, "epoch": 2.8329177057356607, "percentage": 28.34, "elapsed_time": "19:35:17", "remaining_time": "2 days, 1:32:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4980, "total_steps": 17540, "loss": 0.7636, "learning_rate": 1.8008934705847533e-05, "epoch": 2.8386177413608835, "percentage": 28.39, "elapsed_time": "19:37:43", "remaining_time": "2 days, 1:30:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 4990, "total_steps": 17540, "loss": 0.7606, "learning_rate": 1.7997001919740514e-05, "epoch": 2.8443177769861063, "percentage": 28.45, "elapsed_time": "19:40:12", "remaining_time": "2 days, 1:28:16", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5000, "total_steps": 17540, "loss": 0.7615, "learning_rate": 1.7985037461114497e-05, "epoch": 2.8500178126113287, "percentage": 28.51, "elapsed_time": "19:42:37", "remaining_time": "2 days, 1:26:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5010, "total_steps": 17540, "loss": 0.7549, "learning_rate": 1.7973041377355303e-05, "epoch": 2.8557178482365515, "percentage": 28.56, "elapsed_time": "19:45:06", "remaining_time": "2 days, 1:23:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5020, "total_steps": 17540, "loss": 0.7661, "learning_rate": 1.7961013715974008e-05, "epoch": 2.8614178838617743, "percentage": 28.62, "elapsed_time": "19:47:27", "remaining_time": "2 days, 1:21:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5030, "total_steps": 17540, "loss": 0.756, "learning_rate": 1.7948954524606764e-05, "epoch": 2.8671179194869967, "percentage": 28.68, "elapsed_time": "19:49:44", "remaining_time": "2 days, 1:18:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5040, "total_steps": 17540, "loss": 0.7624, "learning_rate": 1.7936863851014585e-05, "epoch": 2.8728179551122195, "percentage": 28.73, "elapsed_time": "19:52:07", "remaining_time": "2 days, 1:16:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5050, "total_steps": 17540, "loss": 0.7731, "learning_rate": 1.7924741743083177e-05, "epoch": 2.878517990737442, "percentage": 28.79, "elapsed_time": "19:54:29", "remaining_time": "2 days, 1:14:18", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5060, "total_steps": 17540, "loss": 0.7478, "learning_rate": 1.7912588248822744e-05, "epoch": 2.8842180263626647, "percentage": 28.85, "elapsed_time": "19:56:52", "remaining_time": "2 days, 1:11:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5070, "total_steps": 17540, "loss": 0.7632, "learning_rate": 1.79004034163678e-05, "epoch": 2.8899180619878875, "percentage": 28.91, "elapsed_time": "19:59:21", "remaining_time": "2 days, 1:09:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5080, "total_steps": 17540, "loss": 0.7634, "learning_rate": 1.7888187293976974e-05, "epoch": 2.8956180976131103, "percentage": 28.96, "elapsed_time": "20:01:40", "remaining_time": "2 days, 1:07:25", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5090, "total_steps": 17540, "loss": 0.7689, "learning_rate": 1.7875939930032817e-05, "epoch": 2.9013181332383327, "percentage": 29.02, "elapsed_time": "20:03:59", "remaining_time": "2 days, 1:04:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5100, "total_steps": 17540, "loss": 0.7721, "learning_rate": 1.786366137304161e-05, "epoch": 2.9070181688635555, "percentage": 29.08, "elapsed_time": "20:06:22", "remaining_time": "2 days, 1:02:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5110, "total_steps": 17540, "loss": 0.7583, "learning_rate": 1.7851351671633192e-05, "epoch": 2.912718204488778, "percentage": 29.13, "elapsed_time": "20:08:47", "remaining_time": "2 days, 1:00:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5120, "total_steps": 17540, "loss": 0.7587, "learning_rate": 1.7839010874560732e-05, "epoch": 2.9184182401140006, "percentage": 29.19, "elapsed_time": "20:11:08", "remaining_time": "2 days, 0:57:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5130, "total_steps": 17540, "loss": 0.7571, "learning_rate": 1.782663903070057e-05, "epoch": 2.9241182757392234, "percentage": 29.25, "elapsed_time": "20:13:32", "remaining_time": "2 days, 0:55:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5140, "total_steps": 17540, "loss": 0.7591, "learning_rate": 1.7814236189051995e-05, "epoch": 2.9298183113644463, "percentage": 29.3, "elapsed_time": "20:15:57", "remaining_time": "2 days, 0:53:25", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5150, "total_steps": 17540, "loss": 0.7583, "learning_rate": 1.780180239873707e-05, "epoch": 2.9355183469896686, "percentage": 29.36, "elapsed_time": "20:18:15", "remaining_time": "2 days, 0:50:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5160, "total_steps": 17540, "loss": 0.7664, "learning_rate": 1.7789337709000435e-05, "epoch": 2.9412183826148914, "percentage": 29.42, "elapsed_time": "20:20:38", "remaining_time": "2 days, 0:48:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5170, "total_steps": 17540, "loss": 0.7551, "learning_rate": 1.777684216920911e-05, "epoch": 2.946918418240114, "percentage": 29.48, "elapsed_time": "20:23:01", "remaining_time": "2 days, 0:46:16", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5180, "total_steps": 17540, "loss": 0.7574, "learning_rate": 1.776431582885229e-05, "epoch": 2.9526184538653366, "percentage": 29.53, "elapsed_time": "20:25:27", "remaining_time": "2 days, 0:44:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5190, "total_steps": 17540, "loss": 0.7648, "learning_rate": 1.775175873754116e-05, "epoch": 2.9583184894905594, "percentage": 29.59, "elapsed_time": "20:27:51", "remaining_time": "2 days, 0:41:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5200, "total_steps": 17540, "loss": 0.7638, "learning_rate": 1.77391709450087e-05, "epoch": 2.9640185251157822, "percentage": 29.65, "elapsed_time": "20:30:10", "remaining_time": "2 days, 0:39:18", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5210, "total_steps": 17540, "loss": 0.7627, "learning_rate": 1.772655250110948e-05, "epoch": 2.9697185607410046, "percentage": 29.7, "elapsed_time": "20:32:34", "remaining_time": "2 days, 0:37:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5220, "total_steps": 17540, "loss": 0.7736, "learning_rate": 1.771390345581947e-05, "epoch": 2.9754185963662274, "percentage": 29.76, "elapsed_time": "20:34:57", "remaining_time": "2 days, 0:34:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5230, "total_steps": 17540, "loss": 0.7565, "learning_rate": 1.7701223859235828e-05, "epoch": 2.9811186319914498, "percentage": 29.82, "elapsed_time": "20:37:21", "remaining_time": "2 days, 0:32:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5240, "total_steps": 17540, "loss": 0.7582, "learning_rate": 1.7688513761576726e-05, "epoch": 2.9868186676166726, "percentage": 29.87, "elapsed_time": "20:39:48", "remaining_time": "2 days, 0:30:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5250, "total_steps": 17540, "loss": 0.7639, "learning_rate": 1.7675773213181124e-05, "epoch": 2.9925187032418954, "percentage": 29.93, "elapsed_time": "20:42:10", "remaining_time": "2 days, 0:27:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5260, "total_steps": 17540, "loss": 0.7658, "learning_rate": 1.7663002264508598e-05, "epoch": 2.9982187388671178, "percentage": 29.99, "elapsed_time": "20:44:32", "remaining_time": "2 days, 0:25:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5270, "total_steps": 17540, "loss": 0.7438, "learning_rate": 1.765020096613911e-05, "epoch": 3.0039187744923406, "percentage": 30.05, "elapsed_time": "20:46:50", "remaining_time": "2 days, 0:22:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5280, "total_steps": 17540, "loss": 0.7439, "learning_rate": 1.763736936877284e-05, "epoch": 3.0096188101175634, "percentage": 30.1, "elapsed_time": "20:49:07", "remaining_time": "2 days, 0:20:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5290, "total_steps": 17540, "loss": 0.7484, "learning_rate": 1.762450752322995e-05, "epoch": 3.0153188457427857, "percentage": 30.16, "elapsed_time": "20:51:33", "remaining_time": "2 days, 0:18:12", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5300, "total_steps": 17540, "loss": 0.7481, "learning_rate": 1.7611615480450413e-05, "epoch": 3.0210188813680086, "percentage": 30.22, "elapsed_time": "20:53:49", "remaining_time": "2 days, 0:15:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5310, "total_steps": 17540, "loss": 0.7517, "learning_rate": 1.7598693291493804e-05, "epoch": 3.0267189169932314, "percentage": 30.27, "elapsed_time": "20:56:08", "remaining_time": "2 days, 0:13:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5320, "total_steps": 17540, "loss": 0.7393, "learning_rate": 1.7585741007539083e-05, "epoch": 3.0324189526184537, "percentage": 30.33, "elapsed_time": "20:58:31", "remaining_time": "2 days, 0:10:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5330, "total_steps": 17540, "loss": 0.7366, "learning_rate": 1.7572758679884406e-05, "epoch": 3.0381189882436765, "percentage": 30.39, "elapsed_time": "21:00:59", "remaining_time": "2 days, 0:08:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5340, "total_steps": 17540, "loss": 0.7449, "learning_rate": 1.7559746359946925e-05, "epoch": 3.0438190238688994, "percentage": 30.44, "elapsed_time": "21:03:24", "remaining_time": "2 days, 0:06:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5350, "total_steps": 17540, "loss": 0.7397, "learning_rate": 1.7546704099262565e-05, "epoch": 3.0495190594941217, "percentage": 30.5, "elapsed_time": "21:05:48", "remaining_time": "2 days, 0:04:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5360, "total_steps": 17540, "loss": 0.7436, "learning_rate": 1.7533631949485847e-05, "epoch": 3.0552190951193445, "percentage": 30.56, "elapsed_time": "21:08:14", "remaining_time": "2 days, 0:01:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5370, "total_steps": 17540, "loss": 0.741, "learning_rate": 1.7520529962389655e-05, "epoch": 3.0609191307445673, "percentage": 30.62, "elapsed_time": "21:10:42", "remaining_time": "1 day, 23:59:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5380, "total_steps": 17540, "loss": 0.7421, "learning_rate": 1.7507398189865057e-05, "epoch": 3.0666191663697897, "percentage": 30.67, "elapsed_time": "21:13:03", "remaining_time": "1 day, 23:57:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5390, "total_steps": 17540, "loss": 0.7399, "learning_rate": 1.7494236683921084e-05, "epoch": 3.0723192019950125, "percentage": 30.73, "elapsed_time": "21:15:29", "remaining_time": "1 day, 23:55:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5400, "total_steps": 17540, "loss": 0.7425, "learning_rate": 1.7481045496684525e-05, "epoch": 3.0780192376202353, "percentage": 30.79, "elapsed_time": "21:17:55", "remaining_time": "1 day, 23:52:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5410, "total_steps": 17540, "loss": 0.7397, "learning_rate": 1.7467824680399728e-05, "epoch": 3.0837192732454577, "percentage": 30.84, "elapsed_time": "21:20:11", "remaining_time": "1 day, 23:50:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5420, "total_steps": 17540, "loss": 0.7357, "learning_rate": 1.7454574287428382e-05, "epoch": 3.0894193088706805, "percentage": 30.9, "elapsed_time": "21:22:35", "remaining_time": "1 day, 23:48:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5430, "total_steps": 17540, "loss": 0.7505, "learning_rate": 1.744129437024932e-05, "epoch": 3.0951193444959033, "percentage": 30.96, "elapsed_time": "21:24:57", "remaining_time": "1 day, 23:45:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5440, "total_steps": 17540, "loss": 0.7419, "learning_rate": 1.7427984981458305e-05, "epoch": 3.1008193801211257, "percentage": 31.01, "elapsed_time": "21:27:16", "remaining_time": "1 day, 23:43:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5450, "total_steps": 17540, "loss": 0.7298, "learning_rate": 1.7414646173767833e-05, "epoch": 3.1065194157463485, "percentage": 31.07, "elapsed_time": "21:29:34", "remaining_time": "1 day, 23:40:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5460, "total_steps": 17540, "loss": 0.748, "learning_rate": 1.74012780000069e-05, "epoch": 3.112219451371571, "percentage": 31.13, "elapsed_time": "21:31:56", "remaining_time": "1 day, 23:38:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5470, "total_steps": 17540, "loss": 0.7452, "learning_rate": 1.7387880513120815e-05, "epoch": 3.1179194869967937, "percentage": 31.19, "elapsed_time": "21:34:17", "remaining_time": "1 day, 23:35:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5480, "total_steps": 17540, "loss": 0.7436, "learning_rate": 1.7374453766170987e-05, "epoch": 3.1236195226220165, "percentage": 31.24, "elapsed_time": "21:36:40", "remaining_time": "1 day, 23:33:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5490, "total_steps": 17540, "loss": 0.7361, "learning_rate": 1.73609978123347e-05, "epoch": 3.129319558247239, "percentage": 31.3, "elapsed_time": "21:39:01", "remaining_time": "1 day, 23:31:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5500, "total_steps": 17540, "loss": 0.748, "learning_rate": 1.734751270490493e-05, "epoch": 3.1350195938724617, "percentage": 31.36, "elapsed_time": "21:41:19", "remaining_time": "1 day, 23:28:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5510, "total_steps": 17540, "loss": 0.7421, "learning_rate": 1.7333998497290097e-05, "epoch": 3.1407196294976845, "percentage": 31.41, "elapsed_time": "21:43:45", "remaining_time": "1 day, 23:26:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5520, "total_steps": 17540, "loss": 0.751, "learning_rate": 1.7320455243013896e-05, "epoch": 3.146419665122907, "percentage": 31.47, "elapsed_time": "21:46:00", "remaining_time": "1 day, 23:23:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5530, "total_steps": 17540, "loss": 0.7378, "learning_rate": 1.730688299571504e-05, "epoch": 3.1521197007481296, "percentage": 31.53, "elapsed_time": "21:48:20", "remaining_time": "1 day, 23:21:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5540, "total_steps": 17540, "loss": 0.7448, "learning_rate": 1.729328180914709e-05, "epoch": 3.1578197363733524, "percentage": 31.58, "elapsed_time": "21:50:39", "remaining_time": "1 day, 23:18:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5550, "total_steps": 17540, "loss": 0.7345, "learning_rate": 1.7279651737178204e-05, "epoch": 3.163519771998575, "percentage": 31.64, "elapsed_time": "21:53:00", "remaining_time": "1 day, 23:16:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5560, "total_steps": 17540, "loss": 0.73, "learning_rate": 1.726599283379096e-05, "epoch": 3.1692198076237976, "percentage": 31.7, "elapsed_time": "21:55:23", "remaining_time": "1 day, 23:14:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5570, "total_steps": 17540, "loss": 0.7304, "learning_rate": 1.7252305153082118e-05, "epoch": 3.1749198432490204, "percentage": 31.76, "elapsed_time": "21:57:40", "remaining_time": "1 day, 23:11:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5580, "total_steps": 17540, "loss": 0.7405, "learning_rate": 1.7238588749262396e-05, "epoch": 3.180619878874243, "percentage": 31.81, "elapsed_time": "22:00:06", "remaining_time": "1 day, 23:09:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5590, "total_steps": 17540, "loss": 0.7462, "learning_rate": 1.72248436766563e-05, "epoch": 3.1863199144994656, "percentage": 31.87, "elapsed_time": "22:02:31", "remaining_time": "1 day, 23:07:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5600, "total_steps": 17540, "loss": 0.7524, "learning_rate": 1.7211069989701855e-05, "epoch": 3.1920199501246884, "percentage": 31.93, "elapsed_time": "22:04:53", "remaining_time": "1 day, 23:04:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5610, "total_steps": 17540, "loss": 0.7562, "learning_rate": 1.7197267742950435e-05, "epoch": 3.197719985749911, "percentage": 31.98, "elapsed_time": "22:07:13", "remaining_time": "1 day, 23:02:25", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5620, "total_steps": 17540, "loss": 0.7341, "learning_rate": 1.718343699106651e-05, "epoch": 3.2034200213751336, "percentage": 32.04, "elapsed_time": "22:09:43", "remaining_time": "1 day, 23:00:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5630, "total_steps": 17540, "loss": 0.751, "learning_rate": 1.7169577788827448e-05, "epoch": 3.2091200570003564, "percentage": 32.1, "elapsed_time": "22:12:04", "remaining_time": "1 day, 22:57:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5640, "total_steps": 17540, "loss": 0.7317, "learning_rate": 1.7155690191123313e-05, "epoch": 3.2148200926255788, "percentage": 32.16, "elapsed_time": "22:14:22", "remaining_time": "1 day, 22:55:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5650, "total_steps": 17540, "loss": 0.7426, "learning_rate": 1.7141774252956606e-05, "epoch": 3.2205201282508016, "percentage": 32.21, "elapsed_time": "22:16:48", "remaining_time": "1 day, 22:53:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5660, "total_steps": 17540, "loss": 0.7472, "learning_rate": 1.712783002944209e-05, "epoch": 3.2262201638760244, "percentage": 32.27, "elapsed_time": "22:19:15", "remaining_time": "1 day, 22:51:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5670, "total_steps": 17540, "loss": 0.7368, "learning_rate": 1.7113857575806544e-05, "epoch": 3.2319201995012468, "percentage": 32.33, "elapsed_time": "22:21:36", "remaining_time": "1 day, 22:48:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5680, "total_steps": 17540, "loss": 0.7412, "learning_rate": 1.709985694738856e-05, "epoch": 3.2376202351264696, "percentage": 32.38, "elapsed_time": "22:24:02", "remaining_time": "1 day, 22:46:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5690, "total_steps": 17540, "loss": 0.7318, "learning_rate": 1.7085828199638315e-05, "epoch": 3.2433202707516924, "percentage": 32.44, "elapsed_time": "22:26:30", "remaining_time": "1 day, 22:44:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5700, "total_steps": 17540, "loss": 0.7388, "learning_rate": 1.707177138811735e-05, "epoch": 3.2490203063769147, "percentage": 32.5, "elapsed_time": "22:28:47", "remaining_time": "1 day, 22:41:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5710, "total_steps": 17540, "loss": 0.7369, "learning_rate": 1.7057686568498363e-05, "epoch": 3.2547203420021376, "percentage": 32.55, "elapsed_time": "22:31:12", "remaining_time": "1 day, 22:39:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5720, "total_steps": 17540, "loss": 0.74, "learning_rate": 1.7043573796564966e-05, "epoch": 3.2604203776273604, "percentage": 32.61, "elapsed_time": "22:33:41", "remaining_time": "1 day, 22:37:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5730, "total_steps": 17540, "loss": 0.7356, "learning_rate": 1.7029433128211495e-05, "epoch": 3.2661204132525827, "percentage": 32.67, "elapsed_time": "22:35:59", "remaining_time": "1 day, 22:34:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5740, "total_steps": 17540, "loss": 0.737, "learning_rate": 1.7015264619442758e-05, "epoch": 3.2718204488778055, "percentage": 32.73, "elapsed_time": "22:38:25", "remaining_time": "1 day, 22:32:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5750, "total_steps": 17540, "loss": 0.7352, "learning_rate": 1.7001068326373827e-05, "epoch": 3.277520484503028, "percentage": 32.78, "elapsed_time": "22:40:48", "remaining_time": "1 day, 22:30:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5760, "total_steps": 17540, "loss": 0.7485, "learning_rate": 1.698684430522982e-05, "epoch": 3.2832205201282507, "percentage": 32.84, "elapsed_time": "22:43:15", "remaining_time": "1 day, 22:28:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5770, "total_steps": 17540, "loss": 0.7428, "learning_rate": 1.6972592612345673e-05, "epoch": 3.2889205557534735, "percentage": 32.9, "elapsed_time": "22:45:33", "remaining_time": "1 day, 22:25:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5780, "total_steps": 17540, "loss": 0.7457, "learning_rate": 1.6958313304165915e-05, "epoch": 3.2946205913786963, "percentage": 32.95, "elapsed_time": "22:47:54", "remaining_time": "1 day, 22:23:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5790, "total_steps": 17540, "loss": 0.7288, "learning_rate": 1.694400643724445e-05, "epoch": 3.3003206270039187, "percentage": 33.01, "elapsed_time": "22:50:20", "remaining_time": "1 day, 22:20:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5800, "total_steps": 17540, "loss": 0.734, "learning_rate": 1.6929672068244325e-05, "epoch": 3.3060206626291415, "percentage": 33.07, "elapsed_time": "22:52:43", "remaining_time": "1 day, 22:18:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5810, "total_steps": 17540, "loss": 0.7428, "learning_rate": 1.691531025393751e-05, "epoch": 3.311720698254364, "percentage": 33.12, "elapsed_time": "22:55:03", "remaining_time": "1 day, 22:16:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5820, "total_steps": 17540, "loss": 0.7336, "learning_rate": 1.690092105120468e-05, "epoch": 3.3174207338795867, "percentage": 33.18, "elapsed_time": "22:57:27", "remaining_time": "1 day, 22:13:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5830, "total_steps": 17540, "loss": 0.735, "learning_rate": 1.688650451703498e-05, "epoch": 3.3231207695048095, "percentage": 33.24, "elapsed_time": "22:59:46", "remaining_time": "1 day, 22:11:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5840, "total_steps": 17540, "loss": 0.7478, "learning_rate": 1.68720607085258e-05, "epoch": 3.3288208051300323, "percentage": 33.3, "elapsed_time": "23:02:07", "remaining_time": "1 day, 22:08:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5850, "total_steps": 17540, "loss": 0.7364, "learning_rate": 1.685758968288255e-05, "epoch": 3.3345208407552547, "percentage": 33.35, "elapsed_time": "23:04:30", "remaining_time": "1 day, 22:06:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5860, "total_steps": 17540, "loss": 0.7459, "learning_rate": 1.684309149741845e-05, "epoch": 3.3402208763804775, "percentage": 33.41, "elapsed_time": "23:06:54", "remaining_time": "1 day, 22:04:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5870, "total_steps": 17540, "loss": 0.7293, "learning_rate": 1.6828566209554254e-05, "epoch": 3.3459209120057, "percentage": 33.47, "elapsed_time": "23:09:14", "remaining_time": "1 day, 22:01:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5880, "total_steps": 17540, "loss": 0.745, "learning_rate": 1.68140138768181e-05, "epoch": 3.3516209476309227, "percentage": 33.52, "elapsed_time": "23:11:31", "remaining_time": "1 day, 21:59:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5890, "total_steps": 17540, "loss": 0.74, "learning_rate": 1.6799434556845206e-05, "epoch": 3.3573209832561455, "percentage": 33.58, "elapsed_time": "23:13:54", "remaining_time": "1 day, 21:57:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5900, "total_steps": 17540, "loss": 0.7358, "learning_rate": 1.678482830737769e-05, "epoch": 3.363021018881368, "percentage": 33.64, "elapsed_time": "23:16:16", "remaining_time": "1 day, 21:54:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5910, "total_steps": 17540, "loss": 0.7481, "learning_rate": 1.6770195186264318e-05, "epoch": 3.3687210545065907, "percentage": 33.69, "elapsed_time": "23:18:36", "remaining_time": "1 day, 21:52:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5920, "total_steps": 17540, "loss": 0.7356, "learning_rate": 1.6755535251460282e-05, "epoch": 3.3744210901318135, "percentage": 33.75, "elapsed_time": "23:21:02", "remaining_time": "1 day, 21:50:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5930, "total_steps": 17540, "loss": 0.7369, "learning_rate": 1.674084856102698e-05, "epoch": 3.380121125757036, "percentage": 33.81, "elapsed_time": "23:23:30", "remaining_time": "1 day, 21:47:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5940, "total_steps": 17540, "loss": 0.7502, "learning_rate": 1.6726135173131767e-05, "epoch": 3.3858211613822586, "percentage": 33.87, "elapsed_time": "23:25:54", "remaining_time": "1 day, 21:45:32", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5950, "total_steps": 17540, "loss": 0.743, "learning_rate": 1.671139514604774e-05, "epoch": 3.3915211970074814, "percentage": 33.92, "elapsed_time": "23:28:21", "remaining_time": "1 day, 21:43:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5960, "total_steps": 17540, "loss": 0.7507, "learning_rate": 1.6696628538153498e-05, "epoch": 3.397221232632704, "percentage": 33.98, "elapsed_time": "23:30:42", "remaining_time": "1 day, 21:40:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5970, "total_steps": 17540, "loss": 0.7361, "learning_rate": 1.668183540793292e-05, "epoch": 3.4029212682579266, "percentage": 34.04, "elapsed_time": "23:33:00", "remaining_time": "1 day, 21:38:25", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5980, "total_steps": 17540, "loss": 0.7401, "learning_rate": 1.6667015813974928e-05, "epoch": 3.4086213038831494, "percentage": 34.09, "elapsed_time": "23:35:23", "remaining_time": "1 day, 21:36:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 5990, "total_steps": 17540, "loss": 0.7407, "learning_rate": 1.6652169814973246e-05, "epoch": 3.414321339508372, "percentage": 34.15, "elapsed_time": "23:37:41", "remaining_time": "1 day, 21:33:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6000, "total_steps": 17540, "loss": 0.745, "learning_rate": 1.6637297469726182e-05, "epoch": 3.4200213751335946, "percentage": 34.21, "elapsed_time": "23:40:00", "remaining_time": "1 day, 21:31:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6010, "total_steps": 17540, "loss": 0.7443, "learning_rate": 1.6622398837136397e-05, "epoch": 3.4257214107588174, "percentage": 34.26, "elapsed_time": "23:42:20", "remaining_time": "1 day, 21:28:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6020, "total_steps": 17540, "loss": 0.7441, "learning_rate": 1.660747397621065e-05, "epoch": 3.43142144638404, "percentage": 34.32, "elapsed_time": "23:44:44", "remaining_time": "1 day, 21:26:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6030, "total_steps": 17540, "loss": 0.7358, "learning_rate": 1.6592522946059594e-05, "epoch": 3.4371214820092626, "percentage": 34.38, "elapsed_time": "23:47:06", "remaining_time": "1 day, 21:24:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6040, "total_steps": 17540, "loss": 0.735, "learning_rate": 1.657754580589751e-05, "epoch": 3.4428215176344854, "percentage": 34.44, "elapsed_time": "23:49:28", "remaining_time": "1 day, 21:21:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6050, "total_steps": 17540, "loss": 0.7528, "learning_rate": 1.65625426150421e-05, "epoch": 3.4485215532597078, "percentage": 34.49, "elapsed_time": "23:51:47", "remaining_time": "1 day, 21:19:12", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6060, "total_steps": 17540, "loss": 0.7418, "learning_rate": 1.6547513432914242e-05, "epoch": 3.4542215888849306, "percentage": 34.55, "elapsed_time": "23:54:10", "remaining_time": "1 day, 21:16:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6070, "total_steps": 17540, "loss": 0.7453, "learning_rate": 1.6532458319037748e-05, "epoch": 3.4599216245101534, "percentage": 34.61, "elapsed_time": "23:56:36", "remaining_time": "1 day, 21:14:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6080, "total_steps": 17540, "loss": 0.7355, "learning_rate": 1.6517377333039134e-05, "epoch": 3.4656216601353758, "percentage": 34.66, "elapsed_time": "23:58:57", "remaining_time": "1 day, 21:12:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6090, "total_steps": 17540, "loss": 0.7311, "learning_rate": 1.650227053464739e-05, "epoch": 3.4713216957605986, "percentage": 34.72, "elapsed_time": "1 day, 0:01:18", "remaining_time": "1 day, 21:09:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6100, "total_steps": 17540, "loss": 0.7416, "learning_rate": 1.6487137983693732e-05, "epoch": 3.477021731385821, "percentage": 34.78, "elapsed_time": "1 day, 0:03:36", "remaining_time": "1 day, 21:07:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6110, "total_steps": 17540, "loss": 0.7424, "learning_rate": 1.647197974011137e-05, "epoch": 3.4827217670110437, "percentage": 34.83, "elapsed_time": "1 day, 0:05:58", "remaining_time": "1 day, 21:04:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6120, "total_steps": 17540, "loss": 0.7387, "learning_rate": 1.645679586393527e-05, "epoch": 3.4884218026362666, "percentage": 34.89, "elapsed_time": "1 day, 0:08:17", "remaining_time": "1 day, 21:02:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6130, "total_steps": 17540, "loss": 0.7331, "learning_rate": 1.6441586415301928e-05, "epoch": 3.4941218382614894, "percentage": 34.95, "elapsed_time": "1 day, 0:10:39", "remaining_time": "1 day, 21:00:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6140, "total_steps": 17540, "loss": 0.7382, "learning_rate": 1.6426351454449102e-05, "epoch": 3.4998218738867117, "percentage": 35.01, "elapsed_time": "1 day, 0:13:04", "remaining_time": "1 day, 20:57:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6150, "total_steps": 17540, "loss": 0.7386, "learning_rate": 1.641109104171561e-05, "epoch": 3.5055219095119345, "percentage": 35.06, "elapsed_time": "1 day, 0:15:32", "remaining_time": "1 day, 20:55:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6160, "total_steps": 17540, "loss": 0.7434, "learning_rate": 1.6395805237541066e-05, "epoch": 3.511221945137157, "percentage": 35.12, "elapsed_time": "1 day, 0:17:52", "remaining_time": "1 day, 20:53:16", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6170, "total_steps": 17540, "loss": 0.7403, "learning_rate": 1.6380494102465644e-05, "epoch": 3.5169219807623797, "percentage": 35.18, "elapsed_time": "1 day, 0:20:14", "remaining_time": "1 day, 20:50:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6180, "total_steps": 17540, "loss": 0.7295, "learning_rate": 1.6365157697129853e-05, "epoch": 3.5226220163876025, "percentage": 35.23, "elapsed_time": "1 day, 0:22:39", "remaining_time": "1 day, 20:48:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6190, "total_steps": 17540, "loss": 0.7342, "learning_rate": 1.6349796082274275e-05, "epoch": 3.5283220520128253, "percentage": 35.29, "elapsed_time": "1 day, 0:25:03", "remaining_time": "1 day, 20:46:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6200, "total_steps": 17540, "loss": 0.737, "learning_rate": 1.6334409318739344e-05, "epoch": 3.5340220876380477, "percentage": 35.35, "elapsed_time": "1 day, 0:27:24", "remaining_time": "1 day, 20:43:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6210, "total_steps": 17540, "loss": 0.747, "learning_rate": 1.631899746746509e-05, "epoch": 3.5397221232632705, "percentage": 35.4, "elapsed_time": "1 day, 0:29:42", "remaining_time": "1 day, 20:41:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6220, "total_steps": 17540, "loss": 0.7344, "learning_rate": 1.630356058949091e-05, "epoch": 3.545422158888493, "percentage": 35.46, "elapsed_time": "1 day, 0:31:58", "remaining_time": "1 day, 20:38:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6230, "total_steps": 17540, "loss": 0.7371, "learning_rate": 1.628809874595531e-05, "epoch": 3.5511221945137157, "percentage": 35.52, "elapsed_time": "1 day, 0:34:17", "remaining_time": "1 day, 20:36:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6240, "total_steps": 17540, "loss": 0.733, "learning_rate": 1.6272611998095694e-05, "epoch": 3.5568222301389385, "percentage": 35.58, "elapsed_time": "1 day, 0:36:35", "remaining_time": "1 day, 20:33:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6250, "total_steps": 17540, "loss": 0.741, "learning_rate": 1.6257100407248075e-05, "epoch": 3.562522265764161, "percentage": 35.63, "elapsed_time": "1 day, 0:38:57", "remaining_time": "1 day, 20:31:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6260, "total_steps": 17540, "loss": 0.7364, "learning_rate": 1.6241564034846883e-05, "epoch": 3.5682223013893837, "percentage": 35.69, "elapsed_time": "1 day, 0:41:20", "remaining_time": "1 day, 20:29:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6270, "total_steps": 17540, "loss": 0.7358, "learning_rate": 1.622600294242467e-05, "epoch": 3.5739223370146065, "percentage": 35.75, "elapsed_time": "1 day, 0:43:39", "remaining_time": "1 day, 20:26:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6280, "total_steps": 17540, "loss": 0.7519, "learning_rate": 1.6210417191611917e-05, "epoch": 3.579622372639829, "percentage": 35.8, "elapsed_time": "1 day, 0:46:02", "remaining_time": "1 day, 20:24:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6290, "total_steps": 17540, "loss": 0.7376, "learning_rate": 1.6194806844136755e-05, "epoch": 3.5853224082650517, "percentage": 35.86, "elapsed_time": "1 day, 0:48:26", "remaining_time": "1 day, 20:22:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6300, "total_steps": 17540, "loss": 0.7295, "learning_rate": 1.617917196182473e-05, "epoch": 3.5910224438902745, "percentage": 35.92, "elapsed_time": "1 day, 0:50:49", "remaining_time": "1 day, 20:19:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6310, "total_steps": 17540, "loss": 0.7433, "learning_rate": 1.616351260659856e-05, "epoch": 3.596722479515497, "percentage": 35.97, "elapsed_time": "1 day, 0:53:16", "remaining_time": "1 day, 20:17:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6320, "total_steps": 17540, "loss": 0.7385, "learning_rate": 1.6147828840477893e-05, "epoch": 3.6024225151407196, "percentage": 36.03, "elapsed_time": "1 day, 0:55:38", "remaining_time": "1 day, 20:15:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6330, "total_steps": 17540, "loss": 0.7346, "learning_rate": 1.6132120725579057e-05, "epoch": 3.608122550765942, "percentage": 36.09, "elapsed_time": "1 day, 0:58:07", "remaining_time": "1 day, 20:13:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6340, "total_steps": 17540, "loss": 0.7308, "learning_rate": 1.611638832411481e-05, "epoch": 3.613822586391165, "percentage": 36.15, "elapsed_time": "1 day, 1:00:24", "remaining_time": "1 day, 20:10:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6350, "total_steps": 17540, "loss": 0.7402, "learning_rate": 1.61006316983941e-05, "epoch": 3.6195226220163876, "percentage": 36.2, "elapsed_time": "1 day, 1:02:53", "remaining_time": "1 day, 20:08:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6360, "total_steps": 17540, "loss": 0.7434, "learning_rate": 1.6084850910821822e-05, "epoch": 3.6252226576416104, "percentage": 36.26, "elapsed_time": "1 day, 1:05:14", "remaining_time": "1 day, 20:06:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6370, "total_steps": 17540, "loss": 0.7377, "learning_rate": 1.6069046023898554e-05, "epoch": 3.630922693266833, "percentage": 36.32, "elapsed_time": "1 day, 1:07:33", "remaining_time": "1 day, 20:03:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6380, "total_steps": 17540, "loss": 0.7387, "learning_rate": 1.6053217100220332e-05, "epoch": 3.6366227288920556, "percentage": 36.37, "elapsed_time": "1 day, 1:09:53", "remaining_time": "1 day, 20:01:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6390, "total_steps": 17540, "loss": 0.7436, "learning_rate": 1.6037364202478386e-05, "epoch": 3.642322764517278, "percentage": 36.43, "elapsed_time": "1 day, 1:12:16", "remaining_time": "1 day, 19:58:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6400, "total_steps": 17540, "loss": 0.741, "learning_rate": 1.6021487393458893e-05, "epoch": 3.648022800142501, "percentage": 36.49, "elapsed_time": "1 day, 1:14:44", "remaining_time": "1 day, 19:56:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6410, "total_steps": 17540, "loss": 0.7274, "learning_rate": 1.600558673604274e-05, "epoch": 3.6537228357677236, "percentage": 36.55, "elapsed_time": "1 day, 1:17:05", "remaining_time": "1 day, 19:54:12", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6420, "total_steps": 17540, "loss": 0.7357, "learning_rate": 1.598966229320526e-05, "epoch": 3.6594228713929464, "percentage": 36.6, "elapsed_time": "1 day, 1:19:25", "remaining_time": "1 day, 19:51:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6430, "total_steps": 17540, "loss": 0.7361, "learning_rate": 1.5973714128015987e-05, "epoch": 3.665122907018169, "percentage": 36.66, "elapsed_time": "1 day, 1:21:50", "remaining_time": "1 day, 19:49:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6440, "total_steps": 17540, "loss": 0.7328, "learning_rate": 1.595774230363842e-05, "epoch": 3.6708229426433916, "percentage": 36.72, "elapsed_time": "1 day, 1:24:13", "remaining_time": "1 day, 19:47:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6450, "total_steps": 17540, "loss": 0.7342, "learning_rate": 1.5941746883329745e-05, "epoch": 3.676522978268614, "percentage": 36.77, "elapsed_time": "1 day, 1:26:32", "remaining_time": "1 day, 19:44:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6460, "total_steps": 17540, "loss": 0.7331, "learning_rate": 1.5925727930440617e-05, "epoch": 3.6822230138938368, "percentage": 36.83, "elapsed_time": "1 day, 1:28:51", "remaining_time": "1 day, 19:42:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6470, "total_steps": 17540, "loss": 0.7435, "learning_rate": 1.5909685508414884e-05, "epoch": 3.6879230495190596, "percentage": 36.89, "elapsed_time": "1 day, 1:31:09", "remaining_time": "1 day, 19:39:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6480, "total_steps": 17540, "loss": 0.738, "learning_rate": 1.589361968078935e-05, "epoch": 3.6936230851442824, "percentage": 36.94, "elapsed_time": "1 day, 1:33:27", "remaining_time": "1 day, 19:37:16", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6490, "total_steps": 17540, "loss": 0.744, "learning_rate": 1.587753051119351e-05, "epoch": 3.6993231207695048, "percentage": 37.0, "elapsed_time": "1 day, 1:35:44", "remaining_time": "1 day, 19:34:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6500, "total_steps": 17540, "loss": 0.7338, "learning_rate": 1.586141806334931e-05, "epoch": 3.7050231563947276, "percentage": 37.06, "elapsed_time": "1 day, 1:38:08", "remaining_time": "1 day, 19:32:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6510, "total_steps": 17540, "loss": 0.7381, "learning_rate": 1.5845282401070893e-05, "epoch": 3.71072319201995, "percentage": 37.12, "elapsed_time": "1 day, 1:40:31", "remaining_time": "1 day, 19:30:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6520, "total_steps": 17540, "loss": 0.7305, "learning_rate": 1.5829123588264348e-05, "epoch": 3.7164232276451727, "percentage": 37.17, "elapsed_time": "1 day, 1:42:50", "remaining_time": "1 day, 19:27:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6530, "total_steps": 17540, "loss": 0.732, "learning_rate": 1.5812941688927435e-05, "epoch": 3.7221232632703956, "percentage": 37.23, "elapsed_time": "1 day, 1:45:17", "remaining_time": "1 day, 19:25:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6540, "total_steps": 17540, "loss": 0.7357, "learning_rate": 1.579673676714937e-05, "epoch": 3.7278232988956184, "percentage": 37.29, "elapsed_time": "1 day, 1:47:40", "remaining_time": "1 day, 19:23:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6550, "total_steps": 17540, "loss": 0.7359, "learning_rate": 1.5780508887110543e-05, "epoch": 3.7335233345208407, "percentage": 37.34, "elapsed_time": "1 day, 1:50:03", "remaining_time": "1 day, 19:20:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6560, "total_steps": 17540, "loss": 0.733, "learning_rate": 1.5764258113082266e-05, "epoch": 3.7392233701460635, "percentage": 37.4, "elapsed_time": "1 day, 1:52:29", "remaining_time": "1 day, 19:18:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6570, "total_steps": 17540, "loss": 0.7177, "learning_rate": 1.5747984509426528e-05, "epoch": 3.744923405771286, "percentage": 37.46, "elapsed_time": "1 day, 1:54:53", "remaining_time": "1 day, 19:16:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6580, "total_steps": 17540, "loss": 0.7336, "learning_rate": 1.5731688140595737e-05, "epoch": 3.7506234413965087, "percentage": 37.51, "elapsed_time": "1 day, 1:57:11", "remaining_time": "1 day, 19:13:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6590, "total_steps": 17540, "loss": 0.7237, "learning_rate": 1.5715369071132462e-05, "epoch": 3.7563234770217315, "percentage": 37.57, "elapsed_time": "1 day, 1:59:32", "remaining_time": "1 day, 19:11:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6600, "total_steps": 17540, "loss": 0.7311, "learning_rate": 1.569902736566918e-05, "epoch": 3.762023512646954, "percentage": 37.63, "elapsed_time": "1 day, 2:01:55", "remaining_time": "1 day, 19:08:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6610, "total_steps": 17540, "loss": 0.7254, "learning_rate": 1.5682663088928017e-05, "epoch": 3.7677235482721767, "percentage": 37.69, "elapsed_time": "1 day, 2:04:19", "remaining_time": "1 day, 19:06:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6620, "total_steps": 17540, "loss": 0.7347, "learning_rate": 1.5666276305720497e-05, "epoch": 3.7734235838973995, "percentage": 37.74, "elapsed_time": "1 day, 2:06:42", "remaining_time": "1 day, 19:04:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6630, "total_steps": 17540, "loss": 0.7287, "learning_rate": 1.564986708094728e-05, "epoch": 3.779123619522622, "percentage": 37.8, "elapsed_time": "1 day, 2:09:02", "remaining_time": "1 day, 19:01:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6640, "total_steps": 17540, "loss": 0.7382, "learning_rate": 1.5633435479597906e-05, "epoch": 3.7848236551478447, "percentage": 37.86, "elapsed_time": "1 day, 2:11:22", "remaining_time": "1 day, 18:59:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6650, "total_steps": 17540, "loss": 0.7284, "learning_rate": 1.561698156675054e-05, "epoch": 3.7905236907730675, "percentage": 37.91, "elapsed_time": "1 day, 2:13:43", "remaining_time": "1 day, 18:57:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6660, "total_steps": 17540, "loss": 0.7428, "learning_rate": 1.5600505407571706e-05, "epoch": 3.79622372639829, "percentage": 37.97, "elapsed_time": "1 day, 2:16:03", "remaining_time": "1 day, 18:54:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6670, "total_steps": 17540, "loss": 0.7382, "learning_rate": 1.558400706731605e-05, "epoch": 3.8019237620235127, "percentage": 38.03, "elapsed_time": "1 day, 2:18:22", "remaining_time": "1 day, 18:52:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6680, "total_steps": 17540, "loss": 0.731, "learning_rate": 1.5567486611326058e-05, "epoch": 3.807623797648735, "percentage": 38.08, "elapsed_time": "1 day, 2:20:41", "remaining_time": "1 day, 18:49:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6690, "total_steps": 17540, "loss": 0.7333, "learning_rate": 1.555094410503181e-05, "epoch": 3.813323833273958, "percentage": 38.14, "elapsed_time": "1 day, 2:23:00", "remaining_time": "1 day, 18:47:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6700, "total_steps": 17540, "loss": 0.7327, "learning_rate": 1.5534379613950704e-05, "epoch": 3.8190238688991807, "percentage": 38.2, "elapsed_time": "1 day, 2:25:22", "remaining_time": "1 day, 18:45:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6710, "total_steps": 17540, "loss": 0.7411, "learning_rate": 1.5517793203687232e-05, "epoch": 3.8247239045244035, "percentage": 38.26, "elapsed_time": "1 day, 2:27:39", "remaining_time": "1 day, 18:42:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6720, "total_steps": 17540, "loss": 0.7392, "learning_rate": 1.5501184939932685e-05, "epoch": 3.830423940149626, "percentage": 38.31, "elapsed_time": "1 day, 2:30:02", "remaining_time": "1 day, 18:40:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6730, "total_steps": 17540, "loss": 0.7159, "learning_rate": 1.54845548884649e-05, "epoch": 3.8361239757748486, "percentage": 38.37, "elapsed_time": "1 day, 2:32:22", "remaining_time": "1 day, 18:37:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6740, "total_steps": 17540, "loss": 0.7358, "learning_rate": 1.5467903115148023e-05, "epoch": 3.841824011400071, "percentage": 38.43, "elapsed_time": "1 day, 2:34:41", "remaining_time": "1 day, 18:35:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6750, "total_steps": 17540, "loss": 0.732, "learning_rate": 1.5451229685932212e-05, "epoch": 3.847524047025294, "percentage": 38.48, "elapsed_time": "1 day, 2:37:07", "remaining_time": "1 day, 18:33:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6760, "total_steps": 17540, "loss": 0.7294, "learning_rate": 1.5434534666853406e-05, "epoch": 3.8532240826505166, "percentage": 38.54, "elapsed_time": "1 day, 2:39:33", "remaining_time": "1 day, 18:30:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6770, "total_steps": 17540, "loss": 0.7368, "learning_rate": 1.541781812403305e-05, "epoch": 3.8589241182757394, "percentage": 38.6, "elapsed_time": "1 day, 2:41:52", "remaining_time": "1 day, 18:28:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6780, "total_steps": 17540, "loss": 0.7359, "learning_rate": 1.540108012367783e-05, "epoch": 3.864624153900962, "percentage": 38.65, "elapsed_time": "1 day, 2:44:10", "remaining_time": "1 day, 18:25:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6790, "total_steps": 17540, "loss": 0.7237, "learning_rate": 1.538432073207942e-05, "epoch": 3.8703241895261846, "percentage": 38.71, "elapsed_time": "1 day, 2:46:30", "remaining_time": "1 day, 18:23:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6800, "total_steps": 17540, "loss": 0.7227, "learning_rate": 1.536754001561422e-05, "epoch": 3.876024225151407, "percentage": 38.77, "elapsed_time": "1 day, 2:48:52", "remaining_time": "1 day, 18:21:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6810, "total_steps": 17540, "loss": 0.7384, "learning_rate": 1.535073804074307e-05, "epoch": 3.88172426077663, "percentage": 38.83, "elapsed_time": "1 day, 2:51:12", "remaining_time": "1 day, 18:18:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6820, "total_steps": 17540, "loss": 0.7278, "learning_rate": 1.5333914874011025e-05, "epoch": 3.8874242964018526, "percentage": 38.88, "elapsed_time": "1 day, 2:53:34", "remaining_time": "1 day, 18:16:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6830, "total_steps": 17540, "loss": 0.7352, "learning_rate": 1.5317070582047066e-05, "epoch": 3.8931243320270754, "percentage": 38.94, "elapsed_time": "1 day, 2:55:59", "remaining_time": "1 day, 18:14:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6840, "total_steps": 17540, "loss": 0.7296, "learning_rate": 1.530020523156383e-05, "epoch": 3.898824367652298, "percentage": 39.0, "elapsed_time": "1 day, 2:58:23", "remaining_time": "1 day, 18:11:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6850, "total_steps": 17540, "loss": 0.72, "learning_rate": 1.5283318889357367e-05, "epoch": 3.9045244032775206, "percentage": 39.05, "elapsed_time": "1 day, 3:00:42", "remaining_time": "1 day, 18:09:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6860, "total_steps": 17540, "loss": 0.7379, "learning_rate": 1.5266411622306873e-05, "epoch": 3.910224438902743, "percentage": 39.11, "elapsed_time": "1 day, 3:03:02", "remaining_time": "1 day, 18:06:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6870, "total_steps": 17540, "loss": 0.7317, "learning_rate": 1.5249483497374403e-05, "epoch": 3.9159244745279658, "percentage": 39.17, "elapsed_time": "1 day, 3:05:23", "remaining_time": "1 day, 18:04:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6880, "total_steps": 17540, "loss": 0.74, "learning_rate": 1.5232534581604633e-05, "epoch": 3.9216245101531886, "percentage": 39.22, "elapsed_time": "1 day, 3:07:51", "remaining_time": "1 day, 18:02:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6890, "total_steps": 17540, "loss": 0.7305, "learning_rate": 1.5215564942124573e-05, "epoch": 3.9273245457784114, "percentage": 39.28, "elapsed_time": "1 day, 3:10:12", "remaining_time": "1 day, 17:59:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6900, "total_steps": 17540, "loss": 0.7415, "learning_rate": 1.5198574646143311e-05, "epoch": 3.9330245814036338, "percentage": 39.34, "elapsed_time": "1 day, 3:12:39", "remaining_time": "1 day, 17:57:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6910, "total_steps": 17540, "loss": 0.7343, "learning_rate": 1.5181563760951754e-05, "epoch": 3.9387246170288566, "percentage": 39.4, "elapsed_time": "1 day, 3:14:53", "remaining_time": "1 day, 17:55:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6920, "total_steps": 17540, "loss": 0.7305, "learning_rate": 1.516453235392235e-05, "epoch": 3.944424652654079, "percentage": 39.45, "elapsed_time": "1 day, 3:17:13", "remaining_time": "1 day, 17:52:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6930, "total_steps": 17540, "loss": 0.7301, "learning_rate": 1.5147480492508817e-05, "epoch": 3.9501246882793017, "percentage": 39.51, "elapsed_time": "1 day, 3:19:36", "remaining_time": "1 day, 17:50:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6940, "total_steps": 17540, "loss": 0.7441, "learning_rate": 1.5130408244245893e-05, "epoch": 3.9558247239045246, "percentage": 39.57, "elapsed_time": "1 day, 3:21:56", "remaining_time": "1 day, 17:47:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6950, "total_steps": 17540, "loss": 0.7335, "learning_rate": 1.5113315676749056e-05, "epoch": 3.961524759529747, "percentage": 39.62, "elapsed_time": "1 day, 3:24:16", "remaining_time": "1 day, 17:45:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6960, "total_steps": 17540, "loss": 0.736, "learning_rate": 1.5096202857714261e-05, "epoch": 3.9672247951549697, "percentage": 39.68, "elapsed_time": "1 day, 3:26:37", "remaining_time": "1 day, 17:43:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6970, "total_steps": 17540, "loss": 0.7306, "learning_rate": 1.5079069854917666e-05, "epoch": 3.9729248307801925, "percentage": 39.74, "elapsed_time": "1 day, 3:29:00", "remaining_time": "1 day, 17:40:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6980, "total_steps": 17540, "loss": 0.7335, "learning_rate": 1.5061916736215372e-05, "epoch": 3.978624866405415, "percentage": 39.79, "elapsed_time": "1 day, 3:31:22", "remaining_time": "1 day, 17:38:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 6990, "total_steps": 17540, "loss": 0.7261, "learning_rate": 1.5044743569543147e-05, "epoch": 3.9843249020306377, "percentage": 39.85, "elapsed_time": "1 day, 3:33:44", "remaining_time": "1 day, 17:35:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7000, "total_steps": 17540, "loss": 0.7319, "learning_rate": 1.5027550422916164e-05, "epoch": 3.9900249376558605, "percentage": 39.91, "elapsed_time": "1 day, 3:36:07", "remaining_time": "1 day, 17:33:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7010, "total_steps": 17540, "loss": 0.7394, "learning_rate": 1.5010337364428723e-05, "epoch": 3.995724973281083, "percentage": 39.97, "elapsed_time": "1 day, 3:38:29", "remaining_time": "1 day, 17:31:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7020, "total_steps": 17540, "loss": 0.7275, "learning_rate": 1.4993104462253987e-05, "epoch": 4.001425008906305, "percentage": 40.02, "elapsed_time": "1 day, 3:40:50", "remaining_time": "1 day, 17:28:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7030, "total_steps": 17540, "loss": 0.7152, "learning_rate": 1.4975851784643713e-05, "epoch": 4.007125044531528, "percentage": 40.08, "elapsed_time": "1 day, 3:43:08", "remaining_time": "1 day, 17:26:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7040, "total_steps": 17540, "loss": 0.7165, "learning_rate": 1.4958579399927977e-05, "epoch": 4.012825080156751, "percentage": 40.14, "elapsed_time": "1 day, 3:45:30", "remaining_time": "1 day, 17:24:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7050, "total_steps": 17540, "loss": 0.7102, "learning_rate": 1.4941287376514908e-05, "epoch": 4.018525115781974, "percentage": 40.19, "elapsed_time": "1 day, 3:47:54", "remaining_time": "1 day, 17:21:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7060, "total_steps": 17540, "loss": 0.7132, "learning_rate": 1.4923975782890415e-05, "epoch": 4.0242251514071965, "percentage": 40.25, "elapsed_time": "1 day, 3:50:24", "remaining_time": "1 day, 17:19:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7070, "total_steps": 17540, "loss": 0.7147, "learning_rate": 1.4906644687617915e-05, "epoch": 4.029925187032419, "percentage": 40.31, "elapsed_time": "1 day, 3:52:45", "remaining_time": "1 day, 17:17:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7080, "total_steps": 17540, "loss": 0.7158, "learning_rate": 1.4889294159338061e-05, "epoch": 4.035625222657641, "percentage": 40.36, "elapsed_time": "1 day, 3:55:08", "remaining_time": "1 day, 17:14:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7090, "total_steps": 17540, "loss": 0.7045, "learning_rate": 1.4871924266768474e-05, "epoch": 4.041325258282864, "percentage": 40.42, "elapsed_time": "1 day, 3:57:26", "remaining_time": "1 day, 17:12:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7100, "total_steps": 17540, "loss": 0.7176, "learning_rate": 1.4854535078703466e-05, "epoch": 4.047025293908087, "percentage": 40.48, "elapsed_time": "1 day, 3:59:50", "remaining_time": "1 day, 17:10:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7110, "total_steps": 17540, "loss": 0.7142, "learning_rate": 1.483712666401377e-05, "epoch": 4.05272532953331, "percentage": 40.54, "elapsed_time": "1 day, 4:02:14", "remaining_time": "1 day, 17:07:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7120, "total_steps": 17540, "loss": 0.7241, "learning_rate": 1.4819699091646272e-05, "epoch": 4.0584253651585325, "percentage": 40.59, "elapsed_time": "1 day, 4:04:35", "remaining_time": "1 day, 17:05:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7130, "total_steps": 17540, "loss": 0.7157, "learning_rate": 1.4802252430623725e-05, "epoch": 4.064125400783755, "percentage": 40.65, "elapsed_time": "1 day, 4:06:57", "remaining_time": "1 day, 17:03:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7140, "total_steps": 17540, "loss": 0.7154, "learning_rate": 1.4784786750044486e-05, "epoch": 4.069825436408977, "percentage": 40.71, "elapsed_time": "1 day, 4:09:22", "remaining_time": "1 day, 17:00:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7150, "total_steps": 17540, "loss": 0.7118, "learning_rate": 1.4767302119082243e-05, "epoch": 4.0755254720342, "percentage": 40.76, "elapsed_time": "1 day, 4:11:43", "remaining_time": "1 day, 16:58:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7160, "total_steps": 17540, "loss": 0.7051, "learning_rate": 1.4749798606985735e-05, "epoch": 4.081225507659423, "percentage": 40.82, "elapsed_time": "1 day, 4:14:04", "remaining_time": "1 day, 16:55:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7170, "total_steps": 17540, "loss": 0.7143, "learning_rate": 1.4732276283078484e-05, "epoch": 4.086925543284646, "percentage": 40.88, "elapsed_time": "1 day, 4:16:29", "remaining_time": "1 day, 16:53:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7180, "total_steps": 17540, "loss": 0.7151, "learning_rate": 1.4714735216758512e-05, "epoch": 4.0926255789098684, "percentage": 40.94, "elapsed_time": "1 day, 4:18:53", "remaining_time": "1 day, 16:51:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7190, "total_steps": 17540, "loss": 0.7058, "learning_rate": 1.4697175477498074e-05, "epoch": 4.098325614535091, "percentage": 40.99, "elapsed_time": "1 day, 4:21:11", "remaining_time": "1 day, 16:48:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7200, "total_steps": 17540, "loss": 0.7207, "learning_rate": 1.4679597134843382e-05, "epoch": 4.104025650160313, "percentage": 41.05, "elapsed_time": "1 day, 4:23:36", "remaining_time": "1 day, 16:46:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7210, "total_steps": 17540, "loss": 0.7229, "learning_rate": 1.4662000258414324e-05, "epoch": 4.109725685785536, "percentage": 41.11, "elapsed_time": "1 day, 4:25:57", "remaining_time": "1 day, 16:44:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7220, "total_steps": 17540, "loss": 0.7111, "learning_rate": 1.4644384917904195e-05, "epoch": 4.115425721410759, "percentage": 41.16, "elapsed_time": "1 day, 4:28:27", "remaining_time": "1 day, 16:41:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7230, "total_steps": 17540, "loss": 0.7205, "learning_rate": 1.4626751183079415e-05, "epoch": 4.121125757035982, "percentage": 41.22, "elapsed_time": "1 day, 4:30:50", "remaining_time": "1 day, 16:39:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7240, "total_steps": 17540, "loss": 0.7108, "learning_rate": 1.460909912377926e-05, "epoch": 4.126825792661204, "percentage": 41.28, "elapsed_time": "1 day, 4:33:17", "remaining_time": "1 day, 16:37:25", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7250, "total_steps": 17540, "loss": 0.7157, "learning_rate": 1.4591428809915573e-05, "epoch": 4.132525828286427, "percentage": 41.33, "elapsed_time": "1 day, 4:35:41", "remaining_time": "1 day, 16:35:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7260, "total_steps": 17540, "loss": 0.7122, "learning_rate": 1.4573740311472506e-05, "epoch": 4.138225863911649, "percentage": 41.39, "elapsed_time": "1 day, 4:38:05", "remaining_time": "1 day, 16:32:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7270, "total_steps": 17540, "loss": 0.7211, "learning_rate": 1.4556033698506224e-05, "epoch": 4.143925899536872, "percentage": 41.45, "elapsed_time": "1 day, 4:40:34", "remaining_time": "1 day, 16:30:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7280, "total_steps": 17540, "loss": 0.7222, "learning_rate": 1.4538309041144636e-05, "epoch": 4.149625935162095, "percentage": 41.51, "elapsed_time": "1 day, 4:42:51", "remaining_time": "1 day, 16:28:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7290, "total_steps": 17540, "loss": 0.7139, "learning_rate": 1.4520566409587118e-05, "epoch": 4.155325970787318, "percentage": 41.56, "elapsed_time": "1 day, 4:45:17", "remaining_time": "1 day, 16:25:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7300, "total_steps": 17540, "loss": 0.7097, "learning_rate": 1.4502805874104237e-05, "epoch": 4.16102600641254, "percentage": 41.62, "elapsed_time": "1 day, 4:47:36", "remaining_time": "1 day, 16:23:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7310, "total_steps": 17540, "loss": 0.7055, "learning_rate": 1.4485027505037464e-05, "epoch": 4.166726042037762, "percentage": 41.68, "elapsed_time": "1 day, 4:50:00", "remaining_time": "1 day, 16:21:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7320, "total_steps": 17540, "loss": 0.7246, "learning_rate": 1.4467231372798905e-05, "epoch": 4.172426077662985, "percentage": 41.73, "elapsed_time": "1 day, 4:52:22", "remaining_time": "1 day, 16:18:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7330, "total_steps": 17540, "loss": 0.7241, "learning_rate": 1.4449417547871014e-05, "epoch": 4.178126113288208, "percentage": 41.79, "elapsed_time": "1 day, 4:54:40", "remaining_time": "1 day, 16:16:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7340, "total_steps": 17540, "loss": 0.7273, "learning_rate": 1.443158610080632e-05, "epoch": 4.183826148913431, "percentage": 41.85, "elapsed_time": "1 day, 4:57:02", "remaining_time": "1 day, 16:13:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7350, "total_steps": 17540, "loss": 0.7065, "learning_rate": 1.441373710222715e-05, "epoch": 4.1895261845386536, "percentage": 41.9, "elapsed_time": "1 day, 4:59:23", "remaining_time": "1 day, 16:11:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7360, "total_steps": 17540, "loss": 0.7081, "learning_rate": 1.439587062282533e-05, "epoch": 4.195226220163876, "percentage": 41.96, "elapsed_time": "1 day, 5:01:49", "remaining_time": "1 day, 16:09:12", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7370, "total_steps": 17540, "loss": 0.7213, "learning_rate": 1.437798673336194e-05, "epoch": 4.200926255789098, "percentage": 42.02, "elapsed_time": "1 day, 5:04:06", "remaining_time": "1 day, 16:06:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7380, "total_steps": 17540, "loss": 0.7115, "learning_rate": 1.4360085504666994e-05, "epoch": 4.206626291414321, "percentage": 42.08, "elapsed_time": "1 day, 5:06:28", "remaining_time": "1 day, 16:04:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7390, "total_steps": 17540, "loss": 0.7073, "learning_rate": 1.4342167007639196e-05, "epoch": 4.212326327039544, "percentage": 42.13, "elapsed_time": "1 day, 5:08:48", "remaining_time": "1 day, 16:01:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7400, "total_steps": 17540, "loss": 0.7124, "learning_rate": 1.4324231313245629e-05, "epoch": 4.218026362664767, "percentage": 42.19, "elapsed_time": "1 day, 5:11:11", "remaining_time": "1 day, 15:59:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7410, "total_steps": 17540, "loss": 0.7051, "learning_rate": 1.430627849252149e-05, "epoch": 4.2237263982899895, "percentage": 42.25, "elapsed_time": "1 day, 5:13:30", "remaining_time": "1 day, 15:57:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7420, "total_steps": 17540, "loss": 0.7127, "learning_rate": 1.4288308616569811e-05, "epoch": 4.229426433915212, "percentage": 42.3, "elapsed_time": "1 day, 5:15:55", "remaining_time": "1 day, 15:54:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7430, "total_steps": 17540, "loss": 0.7189, "learning_rate": 1.4270321756561169e-05, "epoch": 4.235126469540434, "percentage": 42.36, "elapsed_time": "1 day, 5:18:17", "remaining_time": "1 day, 15:52:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7440, "total_steps": 17540, "loss": 0.7076, "learning_rate": 1.4252317983733406e-05, "epoch": 4.240826505165657, "percentage": 42.42, "elapsed_time": "1 day, 5:20:36", "remaining_time": "1 day, 15:50:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7450, "total_steps": 17540, "loss": 0.7144, "learning_rate": 1.4234297369391345e-05, "epoch": 4.24652654079088, "percentage": 42.47, "elapsed_time": "1 day, 5:22:58", "remaining_time": "1 day, 15:47:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7460, "total_steps": 17540, "loss": 0.7106, "learning_rate": 1.4216259984906522e-05, "epoch": 4.252226576416103, "percentage": 42.53, "elapsed_time": "1 day, 5:25:20", "remaining_time": "1 day, 15:45:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7470, "total_steps": 17540, "loss": 0.7251, "learning_rate": 1.4198205901716877e-05, "epoch": 4.2579266120413255, "percentage": 42.59, "elapsed_time": "1 day, 5:27:41", "remaining_time": "1 day, 15:42:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7480, "total_steps": 17540, "loss": 0.7147, "learning_rate": 1.4180135191326498e-05, "epoch": 4.263626647666548, "percentage": 42.65, "elapsed_time": "1 day, 5:29:59", "remaining_time": "1 day, 15:40:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7490, "total_steps": 17540, "loss": 0.7142, "learning_rate": 1.4162047925305318e-05, "epoch": 4.26932668329177, "percentage": 42.7, "elapsed_time": "1 day, 5:32:16", "remaining_time": "1 day, 15:38:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7500, "total_steps": 17540, "loss": 0.7152, "learning_rate": 1.4143944175288846e-05, "epoch": 4.275026718916993, "percentage": 42.76, "elapsed_time": "1 day, 5:34:32", "remaining_time": "1 day, 15:35:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7510, "total_steps": 17540, "loss": 0.7135, "learning_rate": 1.4125824012977871e-05, "epoch": 4.280726754542216, "percentage": 42.82, "elapsed_time": "1 day, 5:36:52", "remaining_time": "1 day, 15:33:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7520, "total_steps": 17540, "loss": 0.7124, "learning_rate": 1.4107687510138193e-05, "epoch": 4.286426790167439, "percentage": 42.87, "elapsed_time": "1 day, 5:39:11", "remaining_time": "1 day, 15:30:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7530, "total_steps": 17540, "loss": 0.719, "learning_rate": 1.408953473860031e-05, "epoch": 4.2921268257926615, "percentage": 42.93, "elapsed_time": "1 day, 5:41:34", "remaining_time": "1 day, 15:28:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7540, "total_steps": 17540, "loss": 0.7076, "learning_rate": 1.4071365770259175e-05, "epoch": 4.297826861417883, "percentage": 42.99, "elapsed_time": "1 day, 5:43:55", "remaining_time": "1 day, 15:25:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7550, "total_steps": 17540, "loss": 0.7181, "learning_rate": 1.4053180677073877e-05, "epoch": 4.303526897043106, "percentage": 43.04, "elapsed_time": "1 day, 5:46:15", "remaining_time": "1 day, 15:23:32", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7560, "total_steps": 17540, "loss": 0.7278, "learning_rate": 1.403497953106737e-05, "epoch": 4.309226932668329, "percentage": 43.1, "elapsed_time": "1 day, 5:48:34", "remaining_time": "1 day, 15:21:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7570, "total_steps": 17540, "loss": 0.7179, "learning_rate": 1.4016762404326189e-05, "epoch": 4.314926968293552, "percentage": 43.16, "elapsed_time": "1 day, 5:50:58", "remaining_time": "1 day, 15:18:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7580, "total_steps": 17540, "loss": 0.7209, "learning_rate": 1.399852936900016e-05, "epoch": 4.320627003918775, "percentage": 43.22, "elapsed_time": "1 day, 5:53:19", "remaining_time": "1 day, 15:16:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7590, "total_steps": 17540, "loss": 0.7174, "learning_rate": 1.3980280497302113e-05, "epoch": 4.326327039543997, "percentage": 43.27, "elapsed_time": "1 day, 5:55:37", "remaining_time": "1 day, 15:13:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7600, "total_steps": 17540, "loss": 0.7197, "learning_rate": 1.39620158615076e-05, "epoch": 4.33202707516922, "percentage": 43.33, "elapsed_time": "1 day, 5:58:01", "remaining_time": "1 day, 15:11:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7610, "total_steps": 17540, "loss": 0.7134, "learning_rate": 1.3943735533954612e-05, "epoch": 4.337727110794442, "percentage": 43.39, "elapsed_time": "1 day, 6:00:24", "remaining_time": "1 day, 15:09:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7620, "total_steps": 17540, "loss": 0.7173, "learning_rate": 1.392543958704328e-05, "epoch": 4.343427146419665, "percentage": 43.44, "elapsed_time": "1 day, 6:02:46", "remaining_time": "1 day, 15:06:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7630, "total_steps": 17540, "loss": 0.7125, "learning_rate": 1.3907128093235604e-05, "epoch": 4.349127182044888, "percentage": 43.5, "elapsed_time": "1 day, 6:05:10", "remaining_time": "1 day, 15:04:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7640, "total_steps": 17540, "loss": 0.7149, "learning_rate": 1.3888801125055156e-05, "epoch": 4.354827217670111, "percentage": 43.56, "elapsed_time": "1 day, 6:07:37", "remaining_time": "1 day, 15:02:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7650, "total_steps": 17540, "loss": 0.7023, "learning_rate": 1.3870458755086793e-05, "epoch": 4.360527253295333, "percentage": 43.61, "elapsed_time": "1 day, 6:09:57", "remaining_time": "1 day, 14:59:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7660, "total_steps": 17540, "loss": 0.7072, "learning_rate": 1.3852101055976367e-05, "epoch": 4.366227288920555, "percentage": 43.67, "elapsed_time": "1 day, 6:12:23", "remaining_time": "1 day, 14:57:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7670, "total_steps": 17540, "loss": 0.7185, "learning_rate": 1.3833728100430455e-05, "epoch": 4.371927324545778, "percentage": 43.73, "elapsed_time": "1 day, 6:14:42", "remaining_time": "1 day, 14:55:12", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7680, "total_steps": 17540, "loss": 0.7144, "learning_rate": 1.3815339961216046e-05, "epoch": 4.377627360171001, "percentage": 43.79, "elapsed_time": "1 day, 6:17:04", "remaining_time": "1 day, 14:52:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7690, "total_steps": 17540, "loss": 0.7162, "learning_rate": 1.3796936711160269e-05, "epoch": 4.383327395796224, "percentage": 43.84, "elapsed_time": "1 day, 6:19:29", "remaining_time": "1 day, 14:50:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7700, "total_steps": 17540, "loss": 0.7119, "learning_rate": 1.3778518423150101e-05, "epoch": 4.389027431421447, "percentage": 43.9, "elapsed_time": "1 day, 6:21:54", "remaining_time": "1 day, 14:48:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7710, "total_steps": 17540, "loss": 0.7098, "learning_rate": 1.3760085170132076e-05, "epoch": 4.394727467046669, "percentage": 43.96, "elapsed_time": "1 day, 6:24:16", "remaining_time": "1 day, 14:45:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7720, "total_steps": 17540, "loss": 0.7142, "learning_rate": 1.3741637025112e-05, "epoch": 4.400427502671891, "percentage": 44.01, "elapsed_time": "1 day, 6:26:36", "remaining_time": "1 day, 14:43:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7730, "total_steps": 17540, "loss": 0.7104, "learning_rate": 1.3723174061154652e-05, "epoch": 4.406127538297114, "percentage": 44.07, "elapsed_time": "1 day, 6:28:58", "remaining_time": "1 day, 14:41:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7740, "total_steps": 17540, "loss": 0.716, "learning_rate": 1.3704696351383516e-05, "epoch": 4.411827573922337, "percentage": 44.13, "elapsed_time": "1 day, 6:31:23", "remaining_time": "1 day, 14:38:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7750, "total_steps": 17540, "loss": 0.7295, "learning_rate": 1.3686203968980465e-05, "epoch": 4.41752760954756, "percentage": 44.18, "elapsed_time": "1 day, 6:33:52", "remaining_time": "1 day, 14:36:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7760, "total_steps": 17540, "loss": 0.7153, "learning_rate": 1.3667696987185486e-05, "epoch": 4.4232276451727826, "percentage": 44.24, "elapsed_time": "1 day, 6:36:08", "remaining_time": "1 day, 14:34:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7770, "total_steps": 17540, "loss": 0.7121, "learning_rate": 1.3649175479296393e-05, "epoch": 4.428927680798005, "percentage": 44.3, "elapsed_time": "1 day, 6:38:28", "remaining_time": "1 day, 14:31:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7780, "total_steps": 17540, "loss": 0.7179, "learning_rate": 1.3630639518668528e-05, "epoch": 4.434627716423227, "percentage": 44.36, "elapsed_time": "1 day, 6:40:52", "remaining_time": "1 day, 14:29:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7790, "total_steps": 17540, "loss": 0.7206, "learning_rate": 1.3612089178714473e-05, "epoch": 4.44032775204845, "percentage": 44.41, "elapsed_time": "1 day, 6:43:15", "remaining_time": "1 day, 14:27:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7800, "total_steps": 17540, "loss": 0.7262, "learning_rate": 1.3593524532903757e-05, "epoch": 4.446027787673673, "percentage": 44.47, "elapsed_time": "1 day, 6:45:40", "remaining_time": "1 day, 14:24:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7810, "total_steps": 17540, "loss": 0.7133, "learning_rate": 1.357494565476258e-05, "epoch": 4.451727823298896, "percentage": 44.53, "elapsed_time": "1 day, 6:48:06", "remaining_time": "1 day, 14:22:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7820, "total_steps": 17540, "loss": 0.7216, "learning_rate": 1.3556352617873492e-05, "epoch": 4.4574278589241185, "percentage": 44.58, "elapsed_time": "1 day, 6:50:27", "remaining_time": "1 day, 14:20:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7830, "total_steps": 17540, "loss": 0.7069, "learning_rate": 1.3537745495875138e-05, "epoch": 4.463127894549341, "percentage": 44.64, "elapsed_time": "1 day, 6:52:46", "remaining_time": "1 day, 14:17:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7840, "total_steps": 17540, "loss": 0.7175, "learning_rate": 1.3519124362461937e-05, "epoch": 4.468827930174563, "percentage": 44.7, "elapsed_time": "1 day, 6:55:04", "remaining_time": "1 day, 14:15:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7850, "total_steps": 17540, "loss": 0.7019, "learning_rate": 1.3500489291383798e-05, "epoch": 4.474527965799786, "percentage": 44.75, "elapsed_time": "1 day, 6:57:23", "remaining_time": "1 day, 14:12:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7860, "total_steps": 17540, "loss": 0.7056, "learning_rate": 1.348184035644584e-05, "epoch": 4.480228001425009, "percentage": 44.81, "elapsed_time": "1 day, 6:59:48", "remaining_time": "1 day, 14:10:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7870, "total_steps": 17540, "loss": 0.7065, "learning_rate": 1.3463177631508079e-05, "epoch": 4.485928037050232, "percentage": 44.87, "elapsed_time": "1 day, 7:02:09", "remaining_time": "1 day, 14:08:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7880, "total_steps": 17540, "loss": 0.7064, "learning_rate": 1.3444501190485164e-05, "epoch": 4.4916280726754545, "percentage": 44.93, "elapsed_time": "1 day, 7:04:32", "remaining_time": "1 day, 14:05:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7890, "total_steps": 17540, "loss": 0.7087, "learning_rate": 1.3425811107346052e-05, "epoch": 4.497328108300676, "percentage": 44.98, "elapsed_time": "1 day, 7:06:52", "remaining_time": "1 day, 14:03:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7900, "total_steps": 17540, "loss": 0.7087, "learning_rate": 1.3407107456113737e-05, "epoch": 4.503028143925899, "percentage": 45.04, "elapsed_time": "1 day, 7:09:09", "remaining_time": "1 day, 14:00:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7910, "total_steps": 17540, "loss": 0.7146, "learning_rate": 1.3388390310864945e-05, "epoch": 4.508728179551122, "percentage": 45.1, "elapsed_time": "1 day, 7:11:37", "remaining_time": "1 day, 13:58:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7920, "total_steps": 17540, "loss": 0.7129, "learning_rate": 1.3369659745729854e-05, "epoch": 4.514428215176345, "percentage": 45.15, "elapsed_time": "1 day, 7:13:58", "remaining_time": "1 day, 13:56:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7930, "total_steps": 17540, "loss": 0.7174, "learning_rate": 1.3350915834891786e-05, "epoch": 4.520128250801568, "percentage": 45.21, "elapsed_time": "1 day, 7:16:22", "remaining_time": "1 day, 13:53:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7940, "total_steps": 17540, "loss": 0.7129, "learning_rate": 1.333215865258692e-05, "epoch": 4.5258282864267905, "percentage": 45.27, "elapsed_time": "1 day, 7:18:43", "remaining_time": "1 day, 13:51:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7950, "total_steps": 17540, "loss": 0.7152, "learning_rate": 1.3313388273103999e-05, "epoch": 4.531528322052013, "percentage": 45.32, "elapsed_time": "1 day, 7:21:04", "remaining_time": "1 day, 13:49:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7960, "total_steps": 17540, "loss": 0.7132, "learning_rate": 1.3294604770784035e-05, "epoch": 4.537228357677235, "percentage": 45.38, "elapsed_time": "1 day, 7:23:28", "remaining_time": "1 day, 13:46:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7970, "total_steps": 17540, "loss": 0.7131, "learning_rate": 1.3275808220020006e-05, "epoch": 4.542928393302458, "percentage": 45.44, "elapsed_time": "1 day, 7:25:45", "remaining_time": "1 day, 13:44:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7980, "total_steps": 17540, "loss": 0.7175, "learning_rate": 1.3256998695256578e-05, "epoch": 4.548628428927681, "percentage": 45.5, "elapsed_time": "1 day, 7:28:06", "remaining_time": "1 day, 13:41:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 7990, "total_steps": 17540, "loss": 0.7203, "learning_rate": 1.32381762709898e-05, "epoch": 4.554328464552904, "percentage": 45.55, "elapsed_time": "1 day, 7:30:28", "remaining_time": "1 day, 13:39:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8000, "total_steps": 17540, "loss": 0.7064, "learning_rate": 1.3219341021766803e-05, "epoch": 4.560028500178126, "percentage": 45.61, "elapsed_time": "1 day, 7:32:48", "remaining_time": "1 day, 13:37:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8010, "total_steps": 17540, "loss": 0.7195, "learning_rate": 1.3200493022185525e-05, "epoch": 4.565728535803348, "percentage": 45.67, "elapsed_time": "1 day, 7:35:10", "remaining_time": "1 day, 13:34:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8020, "total_steps": 17540, "loss": 0.7171, "learning_rate": 1.3181632346894388e-05, "epoch": 4.571428571428571, "percentage": 45.72, "elapsed_time": "1 day, 7:37:32", "remaining_time": "1 day, 13:32:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8030, "total_steps": 17540, "loss": 0.7108, "learning_rate": 1.3162759070592024e-05, "epoch": 4.577128607053794, "percentage": 45.78, "elapsed_time": "1 day, 7:39:57", "remaining_time": "1 day, 13:30:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8040, "total_steps": 17540, "loss": 0.7104, "learning_rate": 1.314387326802697e-05, "epoch": 4.582828642679017, "percentage": 45.84, "elapsed_time": "1 day, 7:42:20", "remaining_time": "1 day, 13:27:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8050, "total_steps": 17540, "loss": 0.712, "learning_rate": 1.312497501399738e-05, "epoch": 4.58852867830424, "percentage": 45.9, "elapsed_time": "1 day, 7:44:40", "remaining_time": "1 day, 13:25:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8060, "total_steps": 17540, "loss": 0.7187, "learning_rate": 1.3106064383350715e-05, "epoch": 4.594228713929462, "percentage": 45.95, "elapsed_time": "1 day, 7:47:01", "remaining_time": "1 day, 13:23:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8070, "total_steps": 17540, "loss": 0.7225, "learning_rate": 1.308714145098345e-05, "epoch": 4.599928749554684, "percentage": 46.01, "elapsed_time": "1 day, 7:49:20", "remaining_time": "1 day, 13:20:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8080, "total_steps": 17540, "loss": 0.7096, "learning_rate": 1.3068206291840799e-05, "epoch": 4.605628785179907, "percentage": 46.07, "elapsed_time": "1 day, 7:51:40", "remaining_time": "1 day, 13:18:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8090, "total_steps": 17540, "loss": 0.717, "learning_rate": 1.3049258980916387e-05, "epoch": 4.61132882080513, "percentage": 46.12, "elapsed_time": "1 day, 7:54:05", "remaining_time": "1 day, 13:15:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8100, "total_steps": 17540, "loss": 0.7188, "learning_rate": 1.3030299593251964e-05, "epoch": 4.617028856430353, "percentage": 46.18, "elapsed_time": "1 day, 7:56:26", "remaining_time": "1 day, 13:13:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8110, "total_steps": 17540, "loss": 0.7071, "learning_rate": 1.3011328203937121e-05, "epoch": 4.622728892055576, "percentage": 46.24, "elapsed_time": "1 day, 7:58:47", "remaining_time": "1 day, 13:11:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8120, "total_steps": 17540, "loss": 0.7141, "learning_rate": 1.2992344888108981e-05, "epoch": 4.628428927680798, "percentage": 46.29, "elapsed_time": "1 day, 8:01:11", "remaining_time": "1 day, 13:08:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8130, "total_steps": 17540, "loss": 0.713, "learning_rate": 1.297334972095189e-05, "epoch": 4.63412896330602, "percentage": 46.35, "elapsed_time": "1 day, 8:03:32", "remaining_time": "1 day, 13:06:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8140, "total_steps": 17540, "loss": 0.7026, "learning_rate": 1.2954342777697152e-05, "epoch": 4.639828998931243, "percentage": 46.41, "elapsed_time": "1 day, 8:05:51", "remaining_time": "1 day, 13:03:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8150, "total_steps": 17540, "loss": 0.7108, "learning_rate": 1.2935324133622688e-05, "epoch": 4.645529034556466, "percentage": 46.47, "elapsed_time": "1 day, 8:08:12", "remaining_time": "1 day, 13:01:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8160, "total_steps": 17540, "loss": 0.7091, "learning_rate": 1.291629386405278e-05, "epoch": 4.651229070181689, "percentage": 46.52, "elapsed_time": "1 day, 8:10:34", "remaining_time": "1 day, 12:59:12", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8170, "total_steps": 17540, "loss": 0.7193, "learning_rate": 1.2897252044357745e-05, "epoch": 4.6569291058069116, "percentage": 46.58, "elapsed_time": "1 day, 8:13:00", "remaining_time": "1 day, 12:56:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8180, "total_steps": 17540, "loss": 0.7222, "learning_rate": 1.2878198749953642e-05, "epoch": 4.662629141432134, "percentage": 46.64, "elapsed_time": "1 day, 8:15:23", "remaining_time": "1 day, 12:54:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8190, "total_steps": 17540, "loss": 0.71, "learning_rate": 1.285913405630198e-05, "epoch": 4.668329177057356, "percentage": 46.69, "elapsed_time": "1 day, 8:17:44", "remaining_time": "1 day, 12:52:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8200, "total_steps": 17540, "loss": 0.7058, "learning_rate": 1.2840058038909415e-05, "epoch": 4.674029212682579, "percentage": 46.75, "elapsed_time": "1 day, 8:20:04", "remaining_time": "1 day, 12:49:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8210, "total_steps": 17540, "loss": 0.7139, "learning_rate": 1.2820970773327456e-05, "epoch": 4.679729248307802, "percentage": 46.81, "elapsed_time": "1 day, 8:22:23", "remaining_time": "1 day, 12:47:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8220, "total_steps": 17540, "loss": 0.7075, "learning_rate": 1.2801872335152152e-05, "epoch": 4.685429283933025, "percentage": 46.86, "elapsed_time": "1 day, 8:24:41", "remaining_time": "1 day, 12:44:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8230, "total_steps": 17540, "loss": 0.7069, "learning_rate": 1.2782762800023806e-05, "epoch": 4.6911293195582475, "percentage": 46.92, "elapsed_time": "1 day, 8:27:01", "remaining_time": "1 day, 12:42:32", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8240, "total_steps": 17540, "loss": 0.7087, "learning_rate": 1.2763642243626668e-05, "epoch": 4.6968293551834694, "percentage": 46.98, "elapsed_time": "1 day, 8:29:23", "remaining_time": "1 day, 12:40:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8250, "total_steps": 17540, "loss": 0.7047, "learning_rate": 1.2744510741688648e-05, "epoch": 4.702529390808692, "percentage": 47.04, "elapsed_time": "1 day, 8:31:39", "remaining_time": "1 day, 12:37:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8260, "total_steps": 17540, "loss": 0.7204, "learning_rate": 1.2725368369980996e-05, "epoch": 4.708229426433915, "percentage": 47.09, "elapsed_time": "1 day, 8:33:56", "remaining_time": "1 day, 12:35:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8270, "total_steps": 17540, "loss": 0.7111, "learning_rate": 1.270621520431801e-05, "epoch": 4.713929462059138, "percentage": 47.15, "elapsed_time": "1 day, 8:36:13", "remaining_time": "1 day, 12:32:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8280, "total_steps": 17540, "loss": 0.7067, "learning_rate": 1.2687051320556751e-05, "epoch": 4.719629497684361, "percentage": 47.21, "elapsed_time": "1 day, 8:38:35", "remaining_time": "1 day, 12:30:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8290, "total_steps": 17540, "loss": 0.7161, "learning_rate": 1.2667876794596721e-05, "epoch": 4.7253295333095835, "percentage": 47.26, "elapsed_time": "1 day, 8:40:57", "remaining_time": "1 day, 12:28:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8300, "total_steps": 17540, "loss": 0.7004, "learning_rate": 1.2648691702379568e-05, "epoch": 4.731029568934806, "percentage": 47.32, "elapsed_time": "1 day, 8:43:22", "remaining_time": "1 day, 12:25:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8310, "total_steps": 17540, "loss": 0.699, "learning_rate": 1.2629496119888795e-05, "epoch": 4.736729604560028, "percentage": 47.38, "elapsed_time": "1 day, 8:45:43", "remaining_time": "1 day, 12:23:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8320, "total_steps": 17540, "loss": 0.7087, "learning_rate": 1.2610290123149454e-05, "epoch": 4.742429640185251, "percentage": 47.43, "elapsed_time": "1 day, 8:48:04", "remaining_time": "1 day, 12:20:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8330, "total_steps": 17540, "loss": 0.7161, "learning_rate": 1.2591073788227827e-05, "epoch": 4.748129675810474, "percentage": 47.49, "elapsed_time": "1 day, 8:50:28", "remaining_time": "1 day, 12:18:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8340, "total_steps": 17540, "loss": 0.7142, "learning_rate": 1.257184719123117e-05, "epoch": 4.753829711435697, "percentage": 47.55, "elapsed_time": "1 day, 8:53:00", "remaining_time": "1 day, 12:16:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8350, "total_steps": 17540, "loss": 0.7126, "learning_rate": 1.2552610408307348e-05, "epoch": 4.7595297470609195, "percentage": 47.61, "elapsed_time": "1 day, 8:55:22", "remaining_time": "1 day, 12:14:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8360, "total_steps": 17540, "loss": 0.7135, "learning_rate": 1.2533363515644595e-05, "epoch": 4.765229782686141, "percentage": 47.66, "elapsed_time": "1 day, 8:57:43", "remaining_time": "1 day, 12:11:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8370, "total_steps": 17540, "loss": 0.7187, "learning_rate": 1.2514106589471169e-05, "epoch": 4.770929818311364, "percentage": 47.72, "elapsed_time": "1 day, 9:00:03", "remaining_time": "1 day, 12:09:18", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8380, "total_steps": 17540, "loss": 0.7017, "learning_rate": 1.2494839706055075e-05, "epoch": 4.776629853936587, "percentage": 47.78, "elapsed_time": "1 day, 9:02:26", "remaining_time": "1 day, 12:06:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8390, "total_steps": 17540, "loss": 0.7078, "learning_rate": 1.2475562941703755e-05, "epoch": 4.78232988956181, "percentage": 47.83, "elapsed_time": "1 day, 9:04:45", "remaining_time": "1 day, 12:04:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8400, "total_steps": 17540, "loss": 0.7135, "learning_rate": 1.2456276372763776e-05, "epoch": 4.788029925187033, "percentage": 47.89, "elapsed_time": "1 day, 9:07:11", "remaining_time": "1 day, 12:02:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8410, "total_steps": 17540, "loss": 0.7227, "learning_rate": 1.2436980075620543e-05, "epoch": 4.793729960812255, "percentage": 47.95, "elapsed_time": "1 day, 9:09:32", "remaining_time": "1 day, 11:59:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8420, "total_steps": 17540, "loss": 0.7125, "learning_rate": 1.2417674126697989e-05, "epoch": 4.799429996437477, "percentage": 48.0, "elapsed_time": "1 day, 9:11:55", "remaining_time": "1 day, 11:57:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8430, "total_steps": 17540, "loss": 0.7094, "learning_rate": 1.2398358602458275e-05, "epoch": 4.8051300320627, "percentage": 48.06, "elapsed_time": "1 day, 9:14:17", "remaining_time": "1 day, 11:55:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8440, "total_steps": 17540, "loss": 0.7029, "learning_rate": 1.2379033579401483e-05, "epoch": 4.810830067687923, "percentage": 48.12, "elapsed_time": "1 day, 9:16:37", "remaining_time": "1 day, 11:52:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8450, "total_steps": 17540, "loss": 0.7028, "learning_rate": 1.2359699134065316e-05, "epoch": 4.816530103313146, "percentage": 48.18, "elapsed_time": "1 day, 9:18:58", "remaining_time": "1 day, 11:50:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8460, "total_steps": 17540, "loss": 0.709, "learning_rate": 1.2340355343024793e-05, "epoch": 4.822230138938369, "percentage": 48.23, "elapsed_time": "1 day, 9:21:21", "remaining_time": "1 day, 11:48:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8470, "total_steps": 17540, "loss": 0.7006, "learning_rate": 1.2321002282891952e-05, "epoch": 4.8279301745635905, "percentage": 48.29, "elapsed_time": "1 day, 9:23:39", "remaining_time": "1 day, 11:45:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8480, "total_steps": 17540, "loss": 0.7033, "learning_rate": 1.2301640030315537e-05, "epoch": 4.833630210188813, "percentage": 48.35, "elapsed_time": "1 day, 9:26:08", "remaining_time": "1 day, 11:43:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8490, "total_steps": 17540, "loss": 0.7032, "learning_rate": 1.2282268661980697e-05, "epoch": 4.839330245814036, "percentage": 48.4, "elapsed_time": "1 day, 9:28:33", "remaining_time": "1 day, 11:41:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8500, "total_steps": 17540, "loss": 0.6981, "learning_rate": 1.2262888254608691e-05, "epoch": 4.845030281439259, "percentage": 48.46, "elapsed_time": "1 day, 9:30:48", "remaining_time": "1 day, 11:38:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8510, "total_steps": 17540, "loss": 0.7065, "learning_rate": 1.2243498884956578e-05, "epoch": 4.850730317064482, "percentage": 48.52, "elapsed_time": "1 day, 9:33:07", "remaining_time": "1 day, 11:36:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8520, "total_steps": 17540, "loss": 0.7143, "learning_rate": 1.2224100629816905e-05, "epoch": 4.856430352689705, "percentage": 48.57, "elapsed_time": "1 day, 9:35:29", "remaining_time": "1 day, 11:33:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8530, "total_steps": 17540, "loss": 0.7185, "learning_rate": 1.2204693566017417e-05, "epoch": 4.862130388314927, "percentage": 48.63, "elapsed_time": "1 day, 9:37:54", "remaining_time": "1 day, 11:31:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8540, "total_steps": 17540, "loss": 0.7134, "learning_rate": 1.2185277770420739e-05, "epoch": 4.867830423940149, "percentage": 48.69, "elapsed_time": "1 day, 9:40:16", "remaining_time": "1 day, 11:29:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8550, "total_steps": 17540, "loss": 0.7213, "learning_rate": 1.2165853319924088e-05, "epoch": 4.873530459565372, "percentage": 48.75, "elapsed_time": "1 day, 9:42:41", "remaining_time": "1 day, 11:26:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8560, "total_steps": 17540, "loss": 0.7084, "learning_rate": 1.2146420291458954e-05, "epoch": 4.879230495190595, "percentage": 48.8, "elapsed_time": "1 day, 9:45:00", "remaining_time": "1 day, 11:24:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8570, "total_steps": 17540, "loss": 0.7061, "learning_rate": 1.21269787619908e-05, "epoch": 4.884930530815818, "percentage": 48.86, "elapsed_time": "1 day, 9:47:27", "remaining_time": "1 day, 11:22:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8580, "total_steps": 17540, "loss": 0.7121, "learning_rate": 1.2107528808518756e-05, "epoch": 4.8906305664410405, "percentage": 48.92, "elapsed_time": "1 day, 9:49:50", "remaining_time": "1 day, 11:19:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8590, "total_steps": 17540, "loss": 0.7134, "learning_rate": 1.2088070508075325e-05, "epoch": 4.8963306020662625, "percentage": 48.97, "elapsed_time": "1 day, 9:52:14", "remaining_time": "1 day, 11:17:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8600, "total_steps": 17540, "loss": 0.7018, "learning_rate": 1.2068603937726057e-05, "epoch": 4.902030637691485, "percentage": 49.03, "elapsed_time": "1 day, 9:54:40", "remaining_time": "1 day, 11:15:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8610, "total_steps": 17540, "loss": 0.7129, "learning_rate": 1.2049129174569261e-05, "epoch": 4.907730673316708, "percentage": 49.09, "elapsed_time": "1 day, 9:56:55", "remaining_time": "1 day, 11:12:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8620, "total_steps": 17540, "loss": 0.7033, "learning_rate": 1.2029646295735694e-05, "epoch": 4.913430708941931, "percentage": 49.14, "elapsed_time": "1 day, 9:59:12", "remaining_time": "1 day, 11:10:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8630, "total_steps": 17540, "loss": 0.7102, "learning_rate": 1.2010155378388253e-05, "epoch": 4.919130744567154, "percentage": 49.2, "elapsed_time": "1 day, 10:01:32", "remaining_time": "1 day, 11:07:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8640, "total_steps": 17540, "loss": 0.7059, "learning_rate": 1.1990656499721673e-05, "epoch": 4.9248307801923765, "percentage": 49.26, "elapsed_time": "1 day, 10:03:55", "remaining_time": "1 day, 11:05:25", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8650, "total_steps": 17540, "loss": 0.7019, "learning_rate": 1.1971149736962229e-05, "epoch": 4.930530815817599, "percentage": 49.32, "elapsed_time": "1 day, 10:06:14", "remaining_time": "1 day, 11:03:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8660, "total_steps": 17540, "loss": 0.7094, "learning_rate": 1.1951635167367403e-05, "epoch": 4.936230851442821, "percentage": 49.37, "elapsed_time": "1 day, 10:08:39", "remaining_time": "1 day, 11:00:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8670, "total_steps": 17540, "loss": 0.7186, "learning_rate": 1.1932112868225613e-05, "epoch": 4.941930887068044, "percentage": 49.43, "elapsed_time": "1 day, 10:11:01", "remaining_time": "1 day, 10:58:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8680, "total_steps": 17540, "loss": 0.7129, "learning_rate": 1.1912582916855883e-05, "epoch": 4.947630922693267, "percentage": 49.49, "elapsed_time": "1 day, 10:13:22", "remaining_time": "1 day, 10:55:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8690, "total_steps": 17540, "loss": 0.7101, "learning_rate": 1.1893045390607542e-05, "epoch": 4.95333095831849, "percentage": 49.54, "elapsed_time": "1 day, 10:15:45", "remaining_time": "1 day, 10:53:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8700, "total_steps": 17540, "loss": 0.7117, "learning_rate": 1.1873500366859925e-05, "epoch": 4.9590309939437125, "percentage": 49.6, "elapsed_time": "1 day, 10:18:12", "remaining_time": "1 day, 10:51:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8710, "total_steps": 17540, "loss": 0.7124, "learning_rate": 1.1853947923022057e-05, "epoch": 4.964731029568934, "percentage": 49.66, "elapsed_time": "1 day, 10:20:35", "remaining_time": "1 day, 10:48:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8720, "total_steps": 17540, "loss": 0.7061, "learning_rate": 1.1834388136532358e-05, "epoch": 4.970431065194157, "percentage": 49.71, "elapsed_time": "1 day, 10:22:52", "remaining_time": "1 day, 10:46:32", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8730, "total_steps": 17540, "loss": 0.7056, "learning_rate": 1.1814821084858315e-05, "epoch": 4.97613110081938, "percentage": 49.77, "elapsed_time": "1 day, 10:25:12", "remaining_time": "1 day, 10:44:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8740, "total_steps": 17540, "loss": 0.6997, "learning_rate": 1.1795246845496205e-05, "epoch": 4.981831136444603, "percentage": 49.83, "elapsed_time": "1 day, 10:27:31", "remaining_time": "1 day, 10:41:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8750, "total_steps": 17540, "loss": 0.7088, "learning_rate": 1.1775665495970756e-05, "epoch": 4.987531172069826, "percentage": 49.89, "elapsed_time": "1 day, 10:29:56", "remaining_time": "1 day, 10:39:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8760, "total_steps": 17540, "loss": 0.705, "learning_rate": 1.1756077113834873e-05, "epoch": 4.9932312076950485, "percentage": 49.94, "elapsed_time": "1 day, 10:32:22", "remaining_time": "1 day, 10:37:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8770, "total_steps": 17540, "loss": 0.7137, "learning_rate": 1.1736481776669307e-05, "epoch": 4.99893124332027, "percentage": 50.0, "elapsed_time": "1 day, 10:34:48", "remaining_time": "1 day, 10:34:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8780, "total_steps": 17540, "loss": 0.6993, "learning_rate": 1.1716879562082343e-05, "epoch": 5.004631278945493, "percentage": 50.06, "elapsed_time": "1 day, 10:37:11", "remaining_time": "1 day, 10:32:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8790, "total_steps": 17540, "loss": 0.6859, "learning_rate": 1.1697270547709527e-05, "epoch": 5.010331314570716, "percentage": 50.11, "elapsed_time": "1 day, 10:39:33", "remaining_time": "1 day, 10:30:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8800, "total_steps": 17540, "loss": 0.6986, "learning_rate": 1.1677654811213316e-05, "epoch": 5.016031350195939, "percentage": 50.17, "elapsed_time": "1 day, 10:41:51", "remaining_time": "1 day, 10:27:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8810, "total_steps": 17540, "loss": 0.6982, "learning_rate": 1.16580324302828e-05, "epoch": 5.021731385821162, "percentage": 50.23, "elapsed_time": "1 day, 10:44:13", "remaining_time": "1 day, 10:25:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8820, "total_steps": 17540, "loss": 0.7033, "learning_rate": 1.1638403482633383e-05, "epoch": 5.027431421446384, "percentage": 50.29, "elapsed_time": "1 day, 10:46:33", "remaining_time": "1 day, 10:22:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8830, "total_steps": 17540, "loss": 0.673, "learning_rate": 1.1618768046006476e-05, "epoch": 5.033131457071606, "percentage": 50.34, "elapsed_time": "1 day, 10:48:53", "remaining_time": "1 day, 10:20:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8840, "total_steps": 17540, "loss": 0.6934, "learning_rate": 1.1599126198169196e-05, "epoch": 5.038831492696829, "percentage": 50.4, "elapsed_time": "1 day, 10:51:13", "remaining_time": "1 day, 10:18:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8850, "total_steps": 17540, "loss": 0.6989, "learning_rate": 1.1579478016914038e-05, "epoch": 5.044531528322052, "percentage": 50.46, "elapsed_time": "1 day, 10:53:38", "remaining_time": "1 day, 10:15:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8860, "total_steps": 17540, "loss": 0.6962, "learning_rate": 1.1559823580058591e-05, "epoch": 5.050231563947275, "percentage": 50.51, "elapsed_time": "1 day, 10:55:55", "remaining_time": "1 day, 10:13:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8870, "total_steps": 17540, "loss": 0.6789, "learning_rate": 1.1540162965445224e-05, "epoch": 5.055931599572498, "percentage": 50.57, "elapsed_time": "1 day, 10:58:15", "remaining_time": "1 day, 10:10:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8880, "total_steps": 17540, "loss": 0.6963, "learning_rate": 1.152049625094076e-05, "epoch": 5.06163163519772, "percentage": 50.63, "elapsed_time": "1 day, 11:00:38", "remaining_time": "1 day, 10:08:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8890, "total_steps": 17540, "loss": 0.6852, "learning_rate": 1.150082351443619e-05, "epoch": 5.067331670822942, "percentage": 50.68, "elapsed_time": "1 day, 11:02:57", "remaining_time": "1 day, 10:06:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8900, "total_steps": 17540, "loss": 0.6904, "learning_rate": 1.1481144833846358e-05, "epoch": 5.073031706448165, "percentage": 50.74, "elapsed_time": "1 day, 11:05:26", "remaining_time": "1 day, 10:03:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8910, "total_steps": 17540, "loss": 0.6896, "learning_rate": 1.146146028710964e-05, "epoch": 5.078731742073388, "percentage": 50.8, "elapsed_time": "1 day, 11:07:46", "remaining_time": "1 day, 10:01:32", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8920, "total_steps": 17540, "loss": 0.6951, "learning_rate": 1.144176995218765e-05, "epoch": 5.084431777698611, "percentage": 50.86, "elapsed_time": "1 day, 11:10:09", "remaining_time": "1 day, 9:59:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8930, "total_steps": 17540, "loss": 0.6918, "learning_rate": 1.1422073907064932e-05, "epoch": 5.090131813323834, "percentage": 50.91, "elapsed_time": "1 day, 11:12:32", "remaining_time": "1 day, 9:56:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8940, "total_steps": 17540, "loss": 0.6855, "learning_rate": 1.1402372229748635e-05, "epoch": 5.0958318489490555, "percentage": 50.97, "elapsed_time": "1 day, 11:14:53", "remaining_time": "1 day, 9:54:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8950, "total_steps": 17540, "loss": 0.6899, "learning_rate": 1.1382664998268222e-05, "epoch": 5.101531884574278, "percentage": 51.03, "elapsed_time": "1 day, 11:17:19", "remaining_time": "1 day, 9:52:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8960, "total_steps": 17540, "loss": 0.6946, "learning_rate": 1.1362952290675153e-05, "epoch": 5.107231920199501, "percentage": 51.08, "elapsed_time": "1 day, 11:19:41", "remaining_time": "1 day, 9:49:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8970, "total_steps": 17540, "loss": 0.69, "learning_rate": 1.1343234185042575e-05, "epoch": 5.112931955824724, "percentage": 51.14, "elapsed_time": "1 day, 11:21:58", "remaining_time": "1 day, 9:47:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8980, "total_steps": 17540, "loss": 0.6932, "learning_rate": 1.1323510759465012e-05, "epoch": 5.118631991449947, "percentage": 51.2, "elapsed_time": "1 day, 11:24:21", "remaining_time": "1 day, 9:45:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 8990, "total_steps": 17540, "loss": 0.695, "learning_rate": 1.1303782092058062e-05, "epoch": 5.1243320270751695, "percentage": 51.25, "elapsed_time": "1 day, 11:26:42", "remaining_time": "1 day, 9:42:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9000, "total_steps": 17540, "loss": 0.6916, "learning_rate": 1.1284048260958076e-05, "epoch": 5.1300320627003915, "percentage": 51.31, "elapsed_time": "1 day, 11:29:06", "remaining_time": "1 day, 9:40:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9010, "total_steps": 17540, "loss": 0.7005, "learning_rate": 1.126430934432187e-05, "epoch": 5.135732098325614, "percentage": 51.37, "elapsed_time": "1 day, 11:31:26", "remaining_time": "1 day, 9:37:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9020, "total_steps": 17540, "loss": 0.6972, "learning_rate": 1.1244565420326388e-05, "epoch": 5.141432133950837, "percentage": 51.43, "elapsed_time": "1 day, 11:33:46", "remaining_time": "1 day, 9:35:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9030, "total_steps": 17540, "loss": 0.6872, "learning_rate": 1.1224816567168413e-05, "epoch": 5.14713216957606, "percentage": 51.48, "elapsed_time": "1 day, 11:36:09", "remaining_time": "1 day, 9:33:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9040, "total_steps": 17540, "loss": 0.7017, "learning_rate": 1.1205062863064247e-05, "epoch": 5.152832205201283, "percentage": 51.54, "elapsed_time": "1 day, 11:38:32", "remaining_time": "1 day, 9:30:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9050, "total_steps": 17540, "loss": 0.6879, "learning_rate": 1.1185304386249405e-05, "epoch": 5.1585322408265055, "percentage": 51.6, "elapsed_time": "1 day, 11:40:52", "remaining_time": "1 day, 9:28:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9060, "total_steps": 17540, "loss": 0.6969, "learning_rate": 1.1165541214978306e-05, "epoch": 5.164232276451727, "percentage": 51.65, "elapsed_time": "1 day, 11:43:12", "remaining_time": "1 day, 9:26:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9070, "total_steps": 17540, "loss": 0.6879, "learning_rate": 1.1145773427523963e-05, "epoch": 5.16993231207695, "percentage": 51.71, "elapsed_time": "1 day, 11:45:33", "remaining_time": "1 day, 9:23:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9080, "total_steps": 17540, "loss": 0.7013, "learning_rate": 1.1126001102177667e-05, "epoch": 5.175632347702173, "percentage": 51.77, "elapsed_time": "1 day, 11:47:54", "remaining_time": "1 day, 9:21:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9090, "total_steps": 17540, "loss": 0.693, "learning_rate": 1.1106224317248682e-05, "epoch": 5.181332383327396, "percentage": 51.82, "elapsed_time": "1 day, 11:50:22", "remaining_time": "1 day, 9:18:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9100, "total_steps": 17540, "loss": 0.7021, "learning_rate": 1.108644315106394e-05, "epoch": 5.187032418952619, "percentage": 51.88, "elapsed_time": "1 day, 11:52:44", "remaining_time": "1 day, 9:16:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9110, "total_steps": 17540, "loss": 0.6828, "learning_rate": 1.1066657681967723e-05, "epoch": 5.1927324545778415, "percentage": 51.94, "elapsed_time": "1 day, 11:55:12", "remaining_time": "1 day, 9:14:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9120, "total_steps": 17540, "loss": 0.6917, "learning_rate": 1.1046867988321349e-05, "epoch": 5.198432490203063, "percentage": 52.0, "elapsed_time": "1 day, 11:57:29", "remaining_time": "1 day, 9:11:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9130, "total_steps": 17540, "loss": 0.7009, "learning_rate": 1.102707414850287e-05, "epoch": 5.204132525828286, "percentage": 52.05, "elapsed_time": "1 day, 11:59:51", "remaining_time": "1 day, 9:09:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9140, "total_steps": 17540, "loss": 0.6877, "learning_rate": 1.100727624090677e-05, "epoch": 5.209832561453509, "percentage": 52.11, "elapsed_time": "1 day, 12:02:16", "remaining_time": "1 day, 9:07:12", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9150, "total_steps": 17540, "loss": 0.6892, "learning_rate": 1.0987474343943625e-05, "epoch": 5.215532597078732, "percentage": 52.17, "elapsed_time": "1 day, 12:04:41", "remaining_time": "1 day, 9:04:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9160, "total_steps": 17540, "loss": 0.686, "learning_rate": 1.0967668536039828e-05, "epoch": 5.221232632703955, "percentage": 52.22, "elapsed_time": "1 day, 12:07:02", "remaining_time": "1 day, 9:02:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9170, "total_steps": 17540, "loss": 0.7028, "learning_rate": 1.0947858895637255e-05, "epoch": 5.2269326683291775, "percentage": 52.28, "elapsed_time": "1 day, 12:09:28", "remaining_time": "1 day, 9:00:12", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9180, "total_steps": 17540, "loss": 0.6941, "learning_rate": 1.0928045501192952e-05, "epoch": 5.232632703954399, "percentage": 52.34, "elapsed_time": "1 day, 12:11:48", "remaining_time": "1 day, 8:57:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9190, "total_steps": 17540, "loss": 0.7014, "learning_rate": 1.0908228431178847e-05, "epoch": 5.238332739579622, "percentage": 52.39, "elapsed_time": "1 day, 12:14:06", "remaining_time": "1 day, 8:55:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9200, "total_steps": 17540, "loss": 0.6871, "learning_rate": 1.0888407764081416e-05, "epoch": 5.244032775204845, "percentage": 52.45, "elapsed_time": "1 day, 12:16:30", "remaining_time": "1 day, 8:53:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9210, "total_steps": 17540, "loss": 0.6838, "learning_rate": 1.0868583578401391e-05, "epoch": 5.249732810830068, "percentage": 52.51, "elapsed_time": "1 day, 12:18:54", "remaining_time": "1 day, 8:50:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9220, "total_steps": 17540, "loss": 0.7054, "learning_rate": 1.0848755952653426e-05, "epoch": 5.255432846455291, "percentage": 52.57, "elapsed_time": "1 day, 12:21:17", "remaining_time": "1 day, 8:48:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9230, "total_steps": 17540, "loss": 0.6933, "learning_rate": 1.0828924965365814e-05, "epoch": 5.261132882080513, "percentage": 52.62, "elapsed_time": "1 day, 12:23:39", "remaining_time": "1 day, 8:46:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9240, "total_steps": 17540, "loss": 0.686, "learning_rate": 1.0809090695080148e-05, "epoch": 5.266832917705735, "percentage": 52.68, "elapsed_time": "1 day, 12:26:02", "remaining_time": "1 day, 8:43:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9250, "total_steps": 17540, "loss": 0.6979, "learning_rate": 1.0789253220351035e-05, "epoch": 5.272532953330958, "percentage": 52.74, "elapsed_time": "1 day, 12:28:22", "remaining_time": "1 day, 8:41:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9260, "total_steps": 17540, "loss": 0.6888, "learning_rate": 1.0769412619745762e-05, "epoch": 5.278232988956181, "percentage": 52.79, "elapsed_time": "1 day, 12:30:41", "remaining_time": "1 day, 8:38:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9270, "total_steps": 17540, "loss": 0.6962, "learning_rate": 1.0749568971844011e-05, "epoch": 5.283933024581404, "percentage": 52.85, "elapsed_time": "1 day, 12:33:03", "remaining_time": "1 day, 8:36:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9280, "total_steps": 17540, "loss": 0.6888, "learning_rate": 1.0729722355237519e-05, "epoch": 5.289633060206627, "percentage": 52.91, "elapsed_time": "1 day, 12:35:21", "remaining_time": "1 day, 8:34:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9290, "total_steps": 17540, "loss": 0.6942, "learning_rate": 1.0709872848529787e-05, "epoch": 5.2953330958318485, "percentage": 52.96, "elapsed_time": "1 day, 12:37:45", "remaining_time": "1 day, 8:31:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9300, "total_steps": 17540, "loss": 0.6944, "learning_rate": 1.0690020530335764e-05, "epoch": 5.301033131457071, "percentage": 53.02, "elapsed_time": "1 day, 12:40:09", "remaining_time": "1 day, 8:29:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9310, "total_steps": 17540, "loss": 0.6955, "learning_rate": 1.0670165479281522e-05, "epoch": 5.306733167082294, "percentage": 53.08, "elapsed_time": "1 day, 12:42:33", "remaining_time": "1 day, 8:27:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9320, "total_steps": 17540, "loss": 0.6836, "learning_rate": 1.065030777400398e-05, "epoch": 5.312433202707517, "percentage": 53.14, "elapsed_time": "1 day, 12:44:58", "remaining_time": "1 day, 8:24:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9330, "total_steps": 17540, "loss": 0.7044, "learning_rate": 1.0630447493150547e-05, "epoch": 5.31813323833274, "percentage": 53.19, "elapsed_time": "1 day, 12:47:16", "remaining_time": "1 day, 8:22:18", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9340, "total_steps": 17540, "loss": 0.6893, "learning_rate": 1.0610584715378843e-05, "epoch": 5.323833273957963, "percentage": 53.25, "elapsed_time": "1 day, 12:49:39", "remaining_time": "1 day, 8:19:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9350, "total_steps": 17540, "loss": 0.7029, "learning_rate": 1.0590719519356373e-05, "epoch": 5.3295333095831845, "percentage": 53.31, "elapsed_time": "1 day, 12:52:02", "remaining_time": "1 day, 8:17:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9360, "total_steps": 17540, "loss": 0.6918, "learning_rate": 1.0570851983760228e-05, "epoch": 5.335233345208407, "percentage": 53.36, "elapsed_time": "1 day, 12:54:20", "remaining_time": "1 day, 8:15:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9370, "total_steps": 17540, "loss": 0.6962, "learning_rate": 1.0550982187276752e-05, "epoch": 5.34093338083363, "percentage": 53.42, "elapsed_time": "1 day, 12:56:46", "remaining_time": "1 day, 8:12:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9380, "total_steps": 17540, "loss": 0.7039, "learning_rate": 1.0531110208601254e-05, "epoch": 5.346633416458853, "percentage": 53.48, "elapsed_time": "1 day, 12:59:05", "remaining_time": "1 day, 8:10:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9390, "total_steps": 17540, "loss": 0.6922, "learning_rate": 1.0511236126437682e-05, "epoch": 5.352333452084076, "percentage": 53.53, "elapsed_time": "1 day, 13:01:29", "remaining_time": "1 day, 8:08:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9400, "total_steps": 17540, "loss": 0.6929, "learning_rate": 1.0491360019498312e-05, "epoch": 5.3580334877092985, "percentage": 53.59, "elapsed_time": "1 day, 13:03:56", "remaining_time": "1 day, 8:05:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9410, "total_steps": 17540, "loss": 0.6905, "learning_rate": 1.0471481966503446e-05, "epoch": 5.3637335233345205, "percentage": 53.65, "elapsed_time": "1 day, 13:06:17", "remaining_time": "1 day, 8:03:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9420, "total_steps": 17540, "loss": 0.6809, "learning_rate": 1.0451602046181084e-05, "epoch": 5.369433558959743, "percentage": 53.71, "elapsed_time": "1 day, 13:08:40", "remaining_time": "1 day, 8:01:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9430, "total_steps": 17540, "loss": 0.6954, "learning_rate": 1.0431720337266632e-05, "epoch": 5.375133594584966, "percentage": 53.76, "elapsed_time": "1 day, 13:11:03", "remaining_time": "1 day, 7:58:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9440, "total_steps": 17540, "loss": 0.6869, "learning_rate": 1.0411836918502573e-05, "epoch": 5.380833630210189, "percentage": 53.82, "elapsed_time": "1 day, 13:13:23", "remaining_time": "1 day, 7:56:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9450, "total_steps": 17540, "loss": 0.6908, "learning_rate": 1.0391951868638167e-05, "epoch": 5.386533665835412, "percentage": 53.88, "elapsed_time": "1 day, 13:15:50", "remaining_time": "1 day, 7:54:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9460, "total_steps": 17540, "loss": 0.693, "learning_rate": 1.0372065266429124e-05, "epoch": 5.3922337014606345, "percentage": 53.93, "elapsed_time": "1 day, 13:18:09", "remaining_time": "1 day, 7:51:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9470, "total_steps": 17540, "loss": 0.6885, "learning_rate": 1.0352177190637315e-05, "epoch": 5.397933737085856, "percentage": 53.99, "elapsed_time": "1 day, 13:20:32", "remaining_time": "1 day, 7:49:18", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9480, "total_steps": 17540, "loss": 0.6905, "learning_rate": 1.0332287720030442e-05, "epoch": 5.403633772711079, "percentage": 54.05, "elapsed_time": "1 day, 13:22:48", "remaining_time": "1 day, 7:46:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9490, "total_steps": 17540, "loss": 0.6978, "learning_rate": 1.0312396933381728e-05, "epoch": 5.409333808336302, "percentage": 54.1, "elapsed_time": "1 day, 13:25:10", "remaining_time": "1 day, 7:44:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9500, "total_steps": 17540, "loss": 0.6881, "learning_rate": 1.0292504909469612e-05, "epoch": 5.415033843961525, "percentage": 54.16, "elapsed_time": "1 day, 13:27:37", "remaining_time": "1 day, 7:42:12", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9510, "total_steps": 17540, "loss": 0.691, "learning_rate": 1.0272611727077426e-05, "epoch": 5.420733879586748, "percentage": 54.22, "elapsed_time": "1 day, 13:29:57", "remaining_time": "1 day, 7:39:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9520, "total_steps": 17540, "loss": 0.6909, "learning_rate": 1.0252717464993105e-05, "epoch": 5.42643391521197, "percentage": 54.28, "elapsed_time": "1 day, 13:32:15", "remaining_time": "1 day, 7:37:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9530, "total_steps": 17540, "loss": 0.6877, "learning_rate": 1.0232822202008845e-05, "epoch": 5.432133950837192, "percentage": 54.33, "elapsed_time": "1 day, 13:34:37", "remaining_time": "1 day, 7:35:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9540, "total_steps": 17540, "loss": 0.6854, "learning_rate": 1.0212926016920816e-05, "epoch": 5.437833986462415, "percentage": 54.39, "elapsed_time": "1 day, 13:36:58", "remaining_time": "1 day, 7:32:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9550, "total_steps": 17540, "loss": 0.6834, "learning_rate": 1.019302898852884e-05, "epoch": 5.443534022087638, "percentage": 54.45, "elapsed_time": "1 day, 13:39:16", "remaining_time": "1 day, 7:30:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9560, "total_steps": 17540, "loss": 0.6935, "learning_rate": 1.0173131195636068e-05, "epoch": 5.449234057712861, "percentage": 54.5, "elapsed_time": "1 day, 13:41:41", "remaining_time": "1 day, 7:27:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9570, "total_steps": 17540, "loss": 0.6978, "learning_rate": 1.0153232717048686e-05, "epoch": 5.454934093338084, "percentage": 54.56, "elapsed_time": "1 day, 13:44:07", "remaining_time": "1 day, 7:25:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9580, "total_steps": 17540, "loss": 0.694, "learning_rate": 1.0133333631575606e-05, "epoch": 5.4606341289633065, "percentage": 54.62, "elapsed_time": "1 day, 13:46:21", "remaining_time": "1 day, 7:23:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9590, "total_steps": 17540, "loss": 0.6774, "learning_rate": 1.0113434018028124e-05, "epoch": 5.466334164588528, "percentage": 54.68, "elapsed_time": "1 day, 13:48:45", "remaining_time": "1 day, 7:20:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9600, "total_steps": 17540, "loss": 0.6924, "learning_rate": 1.0093533955219639e-05, "epoch": 5.472034200213751, "percentage": 54.73, "elapsed_time": "1 day, 13:51:07", "remaining_time": "1 day, 7:18:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9610, "total_steps": 17540, "loss": 0.6998, "learning_rate": 1.0073633521965334e-05, "epoch": 5.477734235838974, "percentage": 54.79, "elapsed_time": "1 day, 13:53:30", "remaining_time": "1 day, 7:16:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9620, "total_steps": 17540, "loss": 0.6927, "learning_rate": 1.0053732797081843e-05, "epoch": 5.483434271464197, "percentage": 54.85, "elapsed_time": "1 day, 13:55:51", "remaining_time": "1 day, 7:13:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9630, "total_steps": 17540, "loss": 0.6846, "learning_rate": 1.003383185938697e-05, "epoch": 5.48913430708942, "percentage": 54.9, "elapsed_time": "1 day, 13:58:19", "remaining_time": "1 day, 7:11:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9640, "total_steps": 17540, "loss": 0.6924, "learning_rate": 1.0013930787699358e-05, "epoch": 5.4948343427146416, "percentage": 54.96, "elapsed_time": "1 day, 14:00:44", "remaining_time": "1 day, 7:09:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9650, "total_steps": 17540, "loss": 0.6988, "learning_rate": 9.994029660838175e-06, "epoch": 5.500534378339864, "percentage": 55.02, "elapsed_time": "1 day, 14:03:11", "remaining_time": "1 day, 7:06:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9660, "total_steps": 17540, "loss": 0.6856, "learning_rate": 9.974128557622814e-06, "epoch": 5.506234413965087, "percentage": 55.07, "elapsed_time": "1 day, 14:05:34", "remaining_time": "1 day, 7:04:25", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9670, "total_steps": 17540, "loss": 0.6862, "learning_rate": 9.95422755687257e-06, "epoch": 5.51193444959031, "percentage": 55.13, "elapsed_time": "1 day, 14:07:57", "remaining_time": "1 day, 7:02:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9680, "total_steps": 17540, "loss": 0.6937, "learning_rate": 9.934326737406338e-06, "epoch": 5.517634485215533, "percentage": 55.19, "elapsed_time": "1 day, 14:10:17", "remaining_time": "1 day, 6:59:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9690, "total_steps": 17540, "loss": 0.6912, "learning_rate": 9.91442617804229e-06, "epoch": 5.523334520840756, "percentage": 55.25, "elapsed_time": "1 day, 14:12:45", "remaining_time": "1 day, 6:57:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9700, "total_steps": 17540, "loss": 0.703, "learning_rate": 9.894525957597566e-06, "epoch": 5.529034556465978, "percentage": 55.3, "elapsed_time": "1 day, 14:15:02", "remaining_time": "1 day, 6:54:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9710, "total_steps": 17540, "loss": 0.6823, "learning_rate": 9.87462615488797e-06, "epoch": 5.5347345920912, "percentage": 55.36, "elapsed_time": "1 day, 14:17:22", "remaining_time": "1 day, 6:52:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9720, "total_steps": 17540, "loss": 0.6936, "learning_rate": 9.854726848727645e-06, "epoch": 5.540434627716423, "percentage": 55.42, "elapsed_time": "1 day, 14:19:42", "remaining_time": "1 day, 6:50:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9730, "total_steps": 17540, "loss": 0.6909, "learning_rate": 9.834828117928776e-06, "epoch": 5.546134663341646, "percentage": 55.47, "elapsed_time": "1 day, 14:22:08", "remaining_time": "1 day, 6:47:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9740, "total_steps": 17540, "loss": 0.7087, "learning_rate": 9.81493004130126e-06, "epoch": 5.551834698966869, "percentage": 55.53, "elapsed_time": "1 day, 14:24:36", "remaining_time": "1 day, 6:45:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9750, "total_steps": 17540, "loss": 0.6869, "learning_rate": 9.795032697652408e-06, "epoch": 5.557534734592092, "percentage": 55.59, "elapsed_time": "1 day, 14:26:57", "remaining_time": "1 day, 6:43:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9760, "total_steps": 17540, "loss": 0.6975, "learning_rate": 9.775136165786626e-06, "epoch": 5.5632347702173135, "percentage": 55.64, "elapsed_time": "1 day, 14:29:16", "remaining_time": "1 day, 6:40:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9770, "total_steps": 17540, "loss": 0.7019, "learning_rate": 9.755240524505107e-06, "epoch": 5.568934805842536, "percentage": 55.7, "elapsed_time": "1 day, 14:31:38", "remaining_time": "1 day, 6:38:25", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9780, "total_steps": 17540, "loss": 0.6906, "learning_rate": 9.735345852605519e-06, "epoch": 5.574634841467759, "percentage": 55.76, "elapsed_time": "1 day, 14:34:03", "remaining_time": "1 day, 6:36:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9790, "total_steps": 17540, "loss": 0.7011, "learning_rate": 9.715452228881683e-06, "epoch": 5.580334877092982, "percentage": 55.82, "elapsed_time": "1 day, 14:36:28", "remaining_time": "1 day, 6:33:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9800, "total_steps": 17540, "loss": 0.6822, "learning_rate": 9.695559732123275e-06, "epoch": 5.586034912718205, "percentage": 55.87, "elapsed_time": "1 day, 14:38:49", "remaining_time": "1 day, 6:31:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9810, "total_steps": 17540, "loss": 0.6941, "learning_rate": 9.675668441115503e-06, "epoch": 5.5917349483434275, "percentage": 55.93, "elapsed_time": "1 day, 14:41:17", "remaining_time": "1 day, 6:29:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9820, "total_steps": 17540, "loss": 0.6934, "learning_rate": 9.655778434638807e-06, "epoch": 5.5974349839686495, "percentage": 55.99, "elapsed_time": "1 day, 14:43:37", "remaining_time": "1 day, 6:26:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9830, "total_steps": 17540, "loss": 0.6963, "learning_rate": 9.635889791468533e-06, "epoch": 5.603135019593872, "percentage": 56.04, "elapsed_time": "1 day, 14:46:00", "remaining_time": "1 day, 6:24:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9840, "total_steps": 17540, "loss": 0.6995, "learning_rate": 9.616002590374628e-06, "epoch": 5.608835055219095, "percentage": 56.1, "elapsed_time": "1 day, 14:48:18", "remaining_time": "1 day, 6:21:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9850, "total_steps": 17540, "loss": 0.6951, "learning_rate": 9.596116910121328e-06, "epoch": 5.614535090844318, "percentage": 56.16, "elapsed_time": "1 day, 14:50:33", "remaining_time": "1 day, 6:19:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9860, "total_steps": 17540, "loss": 0.6916, "learning_rate": 9.57623282946685e-06, "epoch": 5.620235126469541, "percentage": 56.21, "elapsed_time": "1 day, 14:52:56", "remaining_time": "1 day, 6:17:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9870, "total_steps": 17540, "loss": 0.6943, "learning_rate": 9.556350427163073e-06, "epoch": 5.625935162094763, "percentage": 56.27, "elapsed_time": "1 day, 14:55:17", "remaining_time": "1 day, 6:14:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9880, "total_steps": 17540, "loss": 0.6797, "learning_rate": 9.536469781955224e-06, "epoch": 5.631635197719985, "percentage": 56.33, "elapsed_time": "1 day, 14:57:42", "remaining_time": "1 day, 6:12:25", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9890, "total_steps": 17540, "loss": 0.6842, "learning_rate": 9.516590972581579e-06, "epoch": 5.637335233345208, "percentage": 56.39, "elapsed_time": "1 day, 14:59:59", "remaining_time": "1 day, 6:10:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9900, "total_steps": 17540, "loss": 0.703, "learning_rate": 9.496714077773132e-06, "epoch": 5.643035268970431, "percentage": 56.44, "elapsed_time": "1 day, 15:02:19", "remaining_time": "1 day, 6:07:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9910, "total_steps": 17540, "loss": 0.6915, "learning_rate": 9.476839176253311e-06, "epoch": 5.648735304595654, "percentage": 56.5, "elapsed_time": "1 day, 15:04:39", "remaining_time": "1 day, 6:05:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9920, "total_steps": 17540, "loss": 0.6946, "learning_rate": 9.456966346737638e-06, "epoch": 5.654435340220877, "percentage": 56.56, "elapsed_time": "1 day, 15:07:02", "remaining_time": "1 day, 6:02:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9930, "total_steps": 17540, "loss": 0.6936, "learning_rate": 9.437095667933427e-06, "epoch": 5.6601353758460995, "percentage": 56.61, "elapsed_time": "1 day, 15:09:27", "remaining_time": "1 day, 6:00:32", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9940, "total_steps": 17540, "loss": 0.6929, "learning_rate": 9.417227218539475e-06, "epoch": 5.665835411471321, "percentage": 56.67, "elapsed_time": "1 day, 15:11:49", "remaining_time": "1 day, 5:58:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9950, "total_steps": 17540, "loss": 0.6865, "learning_rate": 9.397361077245762e-06, "epoch": 5.671535447096544, "percentage": 56.73, "elapsed_time": "1 day, 15:14:11", "remaining_time": "1 day, 5:55:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9960, "total_steps": 17540, "loss": 0.6944, "learning_rate": 9.377497322733109e-06, "epoch": 5.677235482721767, "percentage": 56.78, "elapsed_time": "1 day, 15:16:32", "remaining_time": "1 day, 5:53:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9970, "total_steps": 17540, "loss": 0.7028, "learning_rate": 9.357636033672892e-06, "epoch": 5.68293551834699, "percentage": 56.84, "elapsed_time": "1 day, 15:18:56", "remaining_time": "1 day, 5:51:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9980, "total_steps": 17540, "loss": 0.6857, "learning_rate": 9.337777288726722e-06, "epoch": 5.688635553972213, "percentage": 56.9, "elapsed_time": "1 day, 15:21:21", "remaining_time": "1 day, 5:48:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 9990, "total_steps": 17540, "loss": 0.6923, "learning_rate": 9.317921166546139e-06, "epoch": 5.694335589597435, "percentage": 56.96, "elapsed_time": "1 day, 15:23:45", "remaining_time": "1 day, 5:46:25", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10000, "total_steps": 17540, "loss": 0.6904, "learning_rate": 9.298067745772286e-06, "epoch": 5.700035625222657, "percentage": 57.01, "elapsed_time": "1 day, 15:26:07", "remaining_time": "1 day, 5:44:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10010, "total_steps": 17540, "loss": 0.689, "learning_rate": 9.278217105035613e-06, "epoch": 5.70573566084788, "percentage": 57.07, "elapsed_time": "1 day, 15:28:35", "remaining_time": "1 day, 5:41:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10020, "total_steps": 17540, "loss": 0.6867, "learning_rate": 9.258369322955558e-06, "epoch": 5.711435696473103, "percentage": 57.13, "elapsed_time": "1 day, 15:30:53", "remaining_time": "1 day, 5:39:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10030, "total_steps": 17540, "loss": 0.6988, "learning_rate": 9.238524478140231e-06, "epoch": 5.717135732098326, "percentage": 57.18, "elapsed_time": "1 day, 15:33:16", "remaining_time": "1 day, 5:36:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10040, "total_steps": 17540, "loss": 0.6813, "learning_rate": 9.218682649186123e-06, "epoch": 5.722835767723549, "percentage": 57.24, "elapsed_time": "1 day, 15:35:36", "remaining_time": "1 day, 5:34:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10050, "total_steps": 17540, "loss": 0.6828, "learning_rate": 9.198843914677776e-06, "epoch": 5.7285358033487705, "percentage": 57.3, "elapsed_time": "1 day, 15:37:57", "remaining_time": "1 day, 5:32:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10060, "total_steps": 17540, "loss": 0.6947, "learning_rate": 9.17900835318746e-06, "epoch": 5.734235838973993, "percentage": 57.35, "elapsed_time": "1 day, 15:40:20", "remaining_time": "1 day, 5:29:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10070, "total_steps": 17540, "loss": 0.6869, "learning_rate": 9.159176043274896e-06, "epoch": 5.739935874599216, "percentage": 57.41, "elapsed_time": "1 day, 15:42:40", "remaining_time": "1 day, 5:27:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10080, "total_steps": 17540, "loss": 0.6807, "learning_rate": 9.139347063486926e-06, "epoch": 5.745635910224439, "percentage": 57.47, "elapsed_time": "1 day, 15:45:03", "remaining_time": "1 day, 5:25:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10090, "total_steps": 17540, "loss": 0.6905, "learning_rate": 9.119521492357196e-06, "epoch": 5.751335945849662, "percentage": 57.53, "elapsed_time": "1 day, 15:47:26", "remaining_time": "1 day, 5:22:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10100, "total_steps": 17540, "loss": 0.6914, "learning_rate": 9.099699408405854e-06, "epoch": 5.757035981474885, "percentage": 57.58, "elapsed_time": "1 day, 15:49:45", "remaining_time": "1 day, 5:20:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10110, "total_steps": 17540, "loss": 0.6947, "learning_rate": 9.079880890139238e-06, "epoch": 5.7627360171001065, "percentage": 57.64, "elapsed_time": "1 day, 15:52:07", "remaining_time": "1 day, 5:18:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10120, "total_steps": 17540, "loss": 0.6937, "learning_rate": 9.06006601604956e-06, "epoch": 5.768436052725329, "percentage": 57.7, "elapsed_time": "1 day, 15:54:24", "remaining_time": "1 day, 5:15:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10130, "total_steps": 17540, "loss": 0.7006, "learning_rate": 9.040254864614608e-06, "epoch": 5.774136088350552, "percentage": 57.75, "elapsed_time": "1 day, 15:56:53", "remaining_time": "1 day, 5:13:18", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10140, "total_steps": 17540, "loss": 0.6984, "learning_rate": 9.020447514297417e-06, "epoch": 5.779836123975775, "percentage": 57.81, "elapsed_time": "1 day, 15:59:19", "remaining_time": "1 day, 5:10:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10150, "total_steps": 17540, "loss": 0.6908, "learning_rate": 9.000644043545974e-06, "epoch": 5.785536159600998, "percentage": 57.87, "elapsed_time": "1 day, 16:01:47", "remaining_time": "1 day, 5:08:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10160, "total_steps": 17540, "loss": 0.6913, "learning_rate": 8.980844530792889e-06, "epoch": 5.791236195226221, "percentage": 57.92, "elapsed_time": "1 day, 16:04:09", "remaining_time": "1 day, 5:06:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10170, "total_steps": 17540, "loss": 0.6887, "learning_rate": 8.96104905445512e-06, "epoch": 5.7969362308514425, "percentage": 57.98, "elapsed_time": "1 day, 16:06:31", "remaining_time": "1 day, 5:03:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10180, "total_steps": 17540, "loss": 0.6937, "learning_rate": 8.941257692933613e-06, "epoch": 5.802636266476665, "percentage": 58.04, "elapsed_time": "1 day, 16:08:56", "remaining_time": "1 day, 5:01:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10190, "total_steps": 17540, "loss": 0.6893, "learning_rate": 8.92147052461303e-06, "epoch": 5.808336302101888, "percentage": 58.1, "elapsed_time": "1 day, 16:11:20", "remaining_time": "1 day, 4:59:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10200, "total_steps": 17540, "loss": 0.6976, "learning_rate": 8.901687627861423e-06, "epoch": 5.814036337727111, "percentage": 58.15, "elapsed_time": "1 day, 16:13:39", "remaining_time": "1 day, 4:56:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10210, "total_steps": 17540, "loss": 0.6935, "learning_rate": 8.881909081029923e-06, "epoch": 5.819736373352334, "percentage": 58.21, "elapsed_time": "1 day, 16:16:04", "remaining_time": "1 day, 4:54:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10220, "total_steps": 17540, "loss": 0.7015, "learning_rate": 8.862134962452444e-06, "epoch": 5.825436408977556, "percentage": 58.27, "elapsed_time": "1 day, 16:18:33", "remaining_time": "1 day, 4:52:16", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10230, "total_steps": 17540, "loss": 0.6956, "learning_rate": 8.84236535044535e-06, "epoch": 5.8311364446027785, "percentage": 58.32, "elapsed_time": "1 day, 16:20:53", "remaining_time": "1 day, 4:49:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10240, "total_steps": 17540, "loss": 0.6904, "learning_rate": 8.822600323307163e-06, "epoch": 5.836836480228001, "percentage": 58.38, "elapsed_time": "1 day, 16:23:13", "remaining_time": "1 day, 4:47:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10250, "total_steps": 17540, "loss": 0.6876, "learning_rate": 8.802839959318238e-06, "epoch": 5.842536515853224, "percentage": 58.44, "elapsed_time": "1 day, 16:25:37", "remaining_time": "1 day, 4:45:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10260, "total_steps": 17540, "loss": 0.6939, "learning_rate": 8.783084336740474e-06, "epoch": 5.848236551478447, "percentage": 58.49, "elapsed_time": "1 day, 16:28:01", "remaining_time": "1 day, 4:42:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10270, "total_steps": 17540, "loss": 0.6881, "learning_rate": 8.763333533816985e-06, "epoch": 5.85393658710367, "percentage": 58.55, "elapsed_time": "1 day, 16:30:23", "remaining_time": "1 day, 4:40:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10280, "total_steps": 17540, "loss": 0.6843, "learning_rate": 8.743587628771793e-06, "epoch": 5.8596366227288925, "percentage": 58.61, "elapsed_time": "1 day, 16:32:45", "remaining_time": "1 day, 4:38:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10290, "total_steps": 17540, "loss": 0.6834, "learning_rate": 8.723846699809522e-06, "epoch": 5.865336658354114, "percentage": 58.67, "elapsed_time": "1 day, 16:35:05", "remaining_time": "1 day, 4:35:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10300, "total_steps": 17540, "loss": 0.6918, "learning_rate": 8.704110825115098e-06, "epoch": 5.871036693979337, "percentage": 58.72, "elapsed_time": "1 day, 16:37:31", "remaining_time": "1 day, 4:33:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10310, "total_steps": 17540, "loss": 0.6928, "learning_rate": 8.68438008285342e-06, "epoch": 5.87673672960456, "percentage": 58.78, "elapsed_time": "1 day, 16:39:56", "remaining_time": "1 day, 4:31:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10320, "total_steps": 17540, "loss": 0.6844, "learning_rate": 8.664654551169061e-06, "epoch": 5.882436765229783, "percentage": 58.84, "elapsed_time": "1 day, 16:42:21", "remaining_time": "1 day, 4:28:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10330, "total_steps": 17540, "loss": 0.6915, "learning_rate": 8.644934308185959e-06, "epoch": 5.888136800855006, "percentage": 58.89, "elapsed_time": "1 day, 16:44:43", "remaining_time": "1 day, 4:26:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10340, "total_steps": 17540, "loss": 0.6826, "learning_rate": 8.6252194320071e-06, "epoch": 5.893836836480228, "percentage": 58.95, "elapsed_time": "1 day, 16:47:04", "remaining_time": "1 day, 4:23:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10350, "total_steps": 17540, "loss": 0.6871, "learning_rate": 8.605510000714228e-06, "epoch": 5.89953687210545, "percentage": 59.01, "elapsed_time": "1 day, 16:49:31", "remaining_time": "1 day, 4:21:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10360, "total_steps": 17540, "loss": 0.6926, "learning_rate": 8.585806092367513e-06, "epoch": 5.905236907730673, "percentage": 59.06, "elapsed_time": "1 day, 16:51:56", "remaining_time": "1 day, 4:19:18", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10370, "total_steps": 17540, "loss": 0.6819, "learning_rate": 8.566107785005251e-06, "epoch": 5.910936943355896, "percentage": 59.12, "elapsed_time": "1 day, 16:54:25", "remaining_time": "1 day, 4:17:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10380, "total_steps": 17540, "loss": 0.692, "learning_rate": 8.546415156643549e-06, "epoch": 5.916636978981119, "percentage": 59.18, "elapsed_time": "1 day, 16:56:48", "remaining_time": "1 day, 4:14:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10390, "total_steps": 17540, "loss": 0.6984, "learning_rate": 8.526728285276039e-06, "epoch": 5.922337014606342, "percentage": 59.24, "elapsed_time": "1 day, 16:59:08", "remaining_time": "1 day, 4:12:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10400, "total_steps": 17540, "loss": 0.686, "learning_rate": 8.507047248873539e-06, "epoch": 5.928037050231564, "percentage": 59.29, "elapsed_time": "1 day, 17:01:26", "remaining_time": "1 day, 4:09:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10410, "total_steps": 17540, "loss": 0.6824, "learning_rate": 8.487372125383757e-06, "epoch": 5.933737085856786, "percentage": 59.35, "elapsed_time": "1 day, 17:03:47", "remaining_time": "1 day, 4:07:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10420, "total_steps": 17540, "loss": 0.6952, "learning_rate": 8.467702992730992e-06, "epoch": 5.939437121482009, "percentage": 59.41, "elapsed_time": "1 day, 17:06:13", "remaining_time": "1 day, 4:05:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10430, "total_steps": 17540, "loss": 0.691, "learning_rate": 8.448039928815804e-06, "epoch": 5.945137157107232, "percentage": 59.46, "elapsed_time": "1 day, 17:08:39", "remaining_time": "1 day, 4:02:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10440, "total_steps": 17540, "loss": 0.6969, "learning_rate": 8.42838301151473e-06, "epoch": 5.950837192732455, "percentage": 59.52, "elapsed_time": "1 day, 17:11:04", "remaining_time": "1 day, 4:00:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10450, "total_steps": 17540, "loss": 0.711, "learning_rate": 8.408732318679953e-06, "epoch": 5.956537228357677, "percentage": 59.58, "elapsed_time": "1 day, 17:13:26", "remaining_time": "1 day, 3:58:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10460, "total_steps": 17540, "loss": 0.6955, "learning_rate": 8.389087928139008e-06, "epoch": 5.9622372639828995, "percentage": 59.64, "elapsed_time": "1 day, 17:15:49", "remaining_time": "1 day, 3:55:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10470, "total_steps": 17540, "loss": 0.6943, "learning_rate": 8.369449917694466e-06, "epoch": 5.967937299608122, "percentage": 59.69, "elapsed_time": "1 day, 17:18:06", "remaining_time": "1 day, 3:53:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10480, "total_steps": 17540, "loss": 0.6905, "learning_rate": 8.34981836512364e-06, "epoch": 5.973637335233345, "percentage": 59.75, "elapsed_time": "1 day, 17:20:26", "remaining_time": "1 day, 3:50:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10490, "total_steps": 17540, "loss": 0.703, "learning_rate": 8.330193348178254e-06, "epoch": 5.979337370858568, "percentage": 59.81, "elapsed_time": "1 day, 17:22:53", "remaining_time": "1 day, 3:48:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10500, "total_steps": 17540, "loss": 0.6957, "learning_rate": 8.310574944584151e-06, "epoch": 5.985037406483791, "percentage": 59.86, "elapsed_time": "1 day, 17:25:17", "remaining_time": "1 day, 3:46:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10510, "total_steps": 17540, "loss": 0.6918, "learning_rate": 8.290963232040984e-06, "epoch": 5.990737442109014, "percentage": 59.92, "elapsed_time": "1 day, 17:27:38", "remaining_time": "1 day, 3:43:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10520, "total_steps": 17540, "loss": 0.6945, "learning_rate": 8.271358288221897e-06, "epoch": 5.9964374777342355, "percentage": 59.98, "elapsed_time": "1 day, 17:29:58", "remaining_time": "1 day, 3:41:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10530, "total_steps": 17540, "loss": 0.6872, "learning_rate": 8.251760190773243e-06, "epoch": 6.002137513359458, "percentage": 60.03, "elapsed_time": "1 day, 17:32:30", "remaining_time": "1 day, 3:39:18", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10540, "total_steps": 17540, "loss": 0.6774, "learning_rate": 8.232169017314247e-06, "epoch": 6.007837548984681, "percentage": 60.09, "elapsed_time": "1 day, 17:34:48", "remaining_time": "1 day, 3:36:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10550, "total_steps": 17540, "loss": 0.6681, "learning_rate": 8.212584845436713e-06, "epoch": 6.013537584609904, "percentage": 60.15, "elapsed_time": "1 day, 17:37:08", "remaining_time": "1 day, 3:34:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10560, "total_steps": 17540, "loss": 0.6697, "learning_rate": 8.193007752704714e-06, "epoch": 6.019237620235127, "percentage": 60.21, "elapsed_time": "1 day, 17:39:30", "remaining_time": "1 day, 3:32:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10570, "total_steps": 17540, "loss": 0.6725, "learning_rate": 8.173437816654292e-06, "epoch": 6.024937655860349, "percentage": 60.26, "elapsed_time": "1 day, 17:41:48", "remaining_time": "1 day, 3:29:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10580, "total_steps": 17540, "loss": 0.6894, "learning_rate": 8.153875114793137e-06, "epoch": 6.0306376914855715, "percentage": 60.32, "elapsed_time": "1 day, 17:44:12", "remaining_time": "1 day, 3:27:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10590, "total_steps": 17540, "loss": 0.6775, "learning_rate": 8.13431972460029e-06, "epoch": 6.036337727110794, "percentage": 60.38, "elapsed_time": "1 day, 17:46:37", "remaining_time": "1 day, 3:25:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10600, "total_steps": 17540, "loss": 0.6709, "learning_rate": 8.11477172352584e-06, "epoch": 6.042037762736017, "percentage": 60.43, "elapsed_time": "1 day, 17:48:52", "remaining_time": "1 day, 3:22:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10610, "total_steps": 17540, "loss": 0.6823, "learning_rate": 8.095231188990597e-06, "epoch": 6.04773779836124, "percentage": 60.49, "elapsed_time": "1 day, 17:51:13", "remaining_time": "1 day, 3:20:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10620, "total_steps": 17540, "loss": 0.681, "learning_rate": 8.075698198385817e-06, "epoch": 6.053437833986463, "percentage": 60.55, "elapsed_time": "1 day, 17:53:33", "remaining_time": "1 day, 3:17:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10630, "total_steps": 17540, "loss": 0.6738, "learning_rate": 8.056172829072863e-06, "epoch": 6.059137869611685, "percentage": 60.6, "elapsed_time": "1 day, 17:55:58", "remaining_time": "1 day, 3:15:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10640, "total_steps": 17540, "loss": 0.6846, "learning_rate": 8.036655158382922e-06, "epoch": 6.0648379052369075, "percentage": 60.66, "elapsed_time": "1 day, 17:58:23", "remaining_time": "1 day, 3:13:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10650, "total_steps": 17540, "loss": 0.674, "learning_rate": 8.017145263616683e-06, "epoch": 6.07053794086213, "percentage": 60.72, "elapsed_time": "1 day, 18:00:45", "remaining_time": "1 day, 3:10:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10660, "total_steps": 17540, "loss": 0.6852, "learning_rate": 7.997643222044051e-06, "epoch": 6.076237976487353, "percentage": 60.78, "elapsed_time": "1 day, 18:03:10", "remaining_time": "1 day, 3:08:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10670, "total_steps": 17540, "loss": 0.6688, "learning_rate": 7.978149110903816e-06, "epoch": 6.081938012112576, "percentage": 60.83, "elapsed_time": "1 day, 18:05:33", "remaining_time": "1 day, 3:06:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10680, "total_steps": 17540, "loss": 0.6797, "learning_rate": 7.958663007403362e-06, "epoch": 6.087638047737799, "percentage": 60.89, "elapsed_time": "1 day, 18:07:56", "remaining_time": "1 day, 3:03:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10690, "total_steps": 17540, "loss": 0.6658, "learning_rate": 7.939184988718359e-06, "epoch": 6.093338083363021, "percentage": 60.95, "elapsed_time": "1 day, 18:10:18", "remaining_time": "1 day, 3:01:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10700, "total_steps": 17540, "loss": 0.676, "learning_rate": 7.919715131992459e-06, "epoch": 6.099038118988243, "percentage": 61.0, "elapsed_time": "1 day, 18:12:44", "remaining_time": "1 day, 2:59:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10710, "total_steps": 17540, "loss": 0.6753, "learning_rate": 7.900253514336985e-06, "epoch": 6.104738154613466, "percentage": 61.06, "elapsed_time": "1 day, 18:15:04", "remaining_time": "1 day, 2:56:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10720, "total_steps": 17540, "loss": 0.667, "learning_rate": 7.88080021283063e-06, "epoch": 6.110438190238689, "percentage": 61.12, "elapsed_time": "1 day, 18:17:25", "remaining_time": "1 day, 2:54:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10730, "total_steps": 17540, "loss": 0.6666, "learning_rate": 7.86135530451915e-06, "epoch": 6.116138225863912, "percentage": 61.17, "elapsed_time": "1 day, 18:19:45", "remaining_time": "1 day, 2:51:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10740, "total_steps": 17540, "loss": 0.6774, "learning_rate": 7.84191886641506e-06, "epoch": 6.121838261489135, "percentage": 61.23, "elapsed_time": "1 day, 18:22:06", "remaining_time": "1 day, 2:49:32", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10750, "total_steps": 17540, "loss": 0.6766, "learning_rate": 7.822490975497326e-06, "epoch": 6.127538297114357, "percentage": 61.29, "elapsed_time": "1 day, 18:24:29", "remaining_time": "1 day, 2:47:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10760, "total_steps": 17540, "loss": 0.6845, "learning_rate": 7.80307170871107e-06, "epoch": 6.133238332739579, "percentage": 61.35, "elapsed_time": "1 day, 18:26:55", "remaining_time": "1 day, 2:44:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10770, "total_steps": 17540, "loss": 0.682, "learning_rate": 7.783661142967247e-06, "epoch": 6.138938368364802, "percentage": 61.4, "elapsed_time": "1 day, 18:29:18", "remaining_time": "1 day, 2:42:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10780, "total_steps": 17540, "loss": 0.6716, "learning_rate": 7.764259355142354e-06, "epoch": 6.144638403990025, "percentage": 61.46, "elapsed_time": "1 day, 18:31:38", "remaining_time": "1 day, 2:40:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10790, "total_steps": 17540, "loss": 0.6846, "learning_rate": 7.744866422078133e-06, "epoch": 6.150338439615248, "percentage": 61.52, "elapsed_time": "1 day, 18:34:06", "remaining_time": "1 day, 2:37:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10800, "total_steps": 17540, "loss": 0.6793, "learning_rate": 7.725482420581245e-06, "epoch": 6.156038475240471, "percentage": 61.57, "elapsed_time": "1 day, 18:36:24", "remaining_time": "1 day, 2:35:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10810, "total_steps": 17540, "loss": 0.6787, "learning_rate": 7.70610742742298e-06, "epoch": 6.161738510865693, "percentage": 61.63, "elapsed_time": "1 day, 18:38:45", "remaining_time": "1 day, 2:33:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10820, "total_steps": 17540, "loss": 0.6801, "learning_rate": 7.686741519338949e-06, "epoch": 6.167438546490915, "percentage": 61.69, "elapsed_time": "1 day, 18:41:06", "remaining_time": "1 day, 2:30:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10830, "total_steps": 17540, "loss": 0.6813, "learning_rate": 7.667384773028778e-06, "epoch": 6.173138582116138, "percentage": 61.74, "elapsed_time": "1 day, 18:43:30", "remaining_time": "1 day, 2:28:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10840, "total_steps": 17540, "loss": 0.6784, "learning_rate": 7.64803726515582e-06, "epoch": 6.178838617741361, "percentage": 61.8, "elapsed_time": "1 day, 18:45:54", "remaining_time": "1 day, 2:25:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10850, "total_steps": 17540, "loss": 0.6873, "learning_rate": 7.62869907234683e-06, "epoch": 6.184538653366584, "percentage": 61.86, "elapsed_time": "1 day, 18:48:11", "remaining_time": "1 day, 2:23:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10860, "total_steps": 17540, "loss": 0.6816, "learning_rate": 7.609370271191667e-06, "epoch": 6.190238688991807, "percentage": 61.92, "elapsed_time": "1 day, 18:50:29", "remaining_time": "1 day, 2:21:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10870, "total_steps": 17540, "loss": 0.6745, "learning_rate": 7.590050938242997e-06, "epoch": 6.1959387246170285, "percentage": 61.97, "elapsed_time": "1 day, 18:52:51", "remaining_time": "1 day, 2:18:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10880, "total_steps": 17540, "loss": 0.6805, "learning_rate": 7.57074115001599e-06, "epoch": 6.201638760242251, "percentage": 62.03, "elapsed_time": "1 day, 18:55:09", "remaining_time": "1 day, 2:16:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10890, "total_steps": 17540, "loss": 0.6695, "learning_rate": 7.551440982988011e-06, "epoch": 6.207338795867474, "percentage": 62.09, "elapsed_time": "1 day, 18:57:33", "remaining_time": "1 day, 2:13:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10900, "total_steps": 17540, "loss": 0.671, "learning_rate": 7.532150513598318e-06, "epoch": 6.213038831492697, "percentage": 62.14, "elapsed_time": "1 day, 18:59:57", "remaining_time": "1 day, 2:11:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10910, "total_steps": 17540, "loss": 0.6755, "learning_rate": 7.512869818247763e-06, "epoch": 6.21873886711792, "percentage": 62.2, "elapsed_time": "1 day, 19:02:23", "remaining_time": "1 day, 2:09:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10920, "total_steps": 17540, "loss": 0.6838, "learning_rate": 7.493598973298485e-06, "epoch": 6.224438902743142, "percentage": 62.26, "elapsed_time": "1 day, 19:04:52", "remaining_time": "1 day, 2:07:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10930, "total_steps": 17540, "loss": 0.6861, "learning_rate": 7.47433805507362e-06, "epoch": 6.2301389383683645, "percentage": 62.31, "elapsed_time": "1 day, 19:07:16", "remaining_time": "1 day, 2:04:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10940, "total_steps": 17540, "loss": 0.6751, "learning_rate": 7.4550871398569755e-06, "epoch": 6.235838973993587, "percentage": 62.37, "elapsed_time": "1 day, 19:09:41", "remaining_time": "1 day, 2:02:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10950, "total_steps": 17540, "loss": 0.6846, "learning_rate": 7.4358463038927464e-06, "epoch": 6.24153900961881, "percentage": 62.43, "elapsed_time": "1 day, 19:12:02", "remaining_time": "1 day, 1:59:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10960, "total_steps": 17540, "loss": 0.6689, "learning_rate": 7.416615623385205e-06, "epoch": 6.247239045244033, "percentage": 62.49, "elapsed_time": "1 day, 19:14:23", "remaining_time": "1 day, 1:57:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10970, "total_steps": 17540, "loss": 0.6758, "learning_rate": 7.397395174498416e-06, "epoch": 6.252939080869256, "percentage": 62.54, "elapsed_time": "1 day, 19:16:44", "remaining_time": "1 day, 1:55:12", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10980, "total_steps": 17540, "loss": 0.6769, "learning_rate": 7.3781850333559065e-06, "epoch": 6.258639116494478, "percentage": 62.6, "elapsed_time": "1 day, 19:19:03", "remaining_time": "1 day, 1:52:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 10990, "total_steps": 17540, "loss": 0.672, "learning_rate": 7.3589852760403845e-06, "epoch": 6.2643391521197005, "percentage": 62.66, "elapsed_time": "1 day, 19:21:29", "remaining_time": "1 day, 1:50:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11000, "total_steps": 17540, "loss": 0.6762, "learning_rate": 7.3397959785934305e-06, "epoch": 6.270039187744923, "percentage": 62.71, "elapsed_time": "1 day, 19:23:54", "remaining_time": "1 day, 1:48:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11010, "total_steps": 17540, "loss": 0.6711, "learning_rate": 7.3206172170152025e-06, "epoch": 6.275739223370146, "percentage": 62.77, "elapsed_time": "1 day, 19:26:20", "remaining_time": "1 day, 1:45:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11020, "total_steps": 17540, "loss": 0.6748, "learning_rate": 7.301449067264128e-06, "epoch": 6.281439258995369, "percentage": 62.83, "elapsed_time": "1 day, 19:28:41", "remaining_time": "1 day, 1:43:25", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11030, "total_steps": 17540, "loss": 0.673, "learning_rate": 7.282291605256604e-06, "epoch": 6.287139294620592, "percentage": 62.88, "elapsed_time": "1 day, 19:31:03", "remaining_time": "1 day, 1:41:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11040, "total_steps": 17540, "loss": 0.6695, "learning_rate": 7.263144906866701e-06, "epoch": 6.292839330245814, "percentage": 62.94, "elapsed_time": "1 day, 19:33:26", "remaining_time": "1 day, 1:38:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11050, "total_steps": 17540, "loss": 0.6782, "learning_rate": 7.244009047925858e-06, "epoch": 6.2985393658710365, "percentage": 63.0, "elapsed_time": "1 day, 19:35:47", "remaining_time": "1 day, 1:36:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11060, "total_steps": 17540, "loss": 0.6746, "learning_rate": 7.224884104222585e-06, "epoch": 6.304239401496259, "percentage": 63.06, "elapsed_time": "1 day, 19:38:08", "remaining_time": "1 day, 1:33:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11070, "total_steps": 17540, "loss": 0.6846, "learning_rate": 7.205770151502163e-06, "epoch": 6.309939437121482, "percentage": 63.11, "elapsed_time": "1 day, 19:40:30", "remaining_time": "1 day, 1:31:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11080, "total_steps": 17540, "loss": 0.668, "learning_rate": 7.186667265466337e-06, "epoch": 6.315639472746705, "percentage": 63.17, "elapsed_time": "1 day, 19:42:49", "remaining_time": "1 day, 1:29:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11090, "total_steps": 17540, "loss": 0.6764, "learning_rate": 7.1675755217730245e-06, "epoch": 6.321339508371928, "percentage": 63.23, "elapsed_time": "1 day, 19:45:13", "remaining_time": "1 day, 1:26:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11100, "total_steps": 17540, "loss": 0.6776, "learning_rate": 7.148494996036022e-06, "epoch": 6.32703954399715, "percentage": 63.28, "elapsed_time": "1 day, 19:47:35", "remaining_time": "1 day, 1:24:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11110, "total_steps": 17540, "loss": 0.6749, "learning_rate": 7.129425763824683e-06, "epoch": 6.332739579622372, "percentage": 63.34, "elapsed_time": "1 day, 19:49:55", "remaining_time": "1 day, 1:22:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11120, "total_steps": 17540, "loss": 0.6732, "learning_rate": 7.110367900663642e-06, "epoch": 6.338439615247595, "percentage": 63.4, "elapsed_time": "1 day, 19:52:21", "remaining_time": "1 day, 1:19:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11130, "total_steps": 17540, "loss": 0.6766, "learning_rate": 7.091321482032501e-06, "epoch": 6.344139650872818, "percentage": 63.45, "elapsed_time": "1 day, 19:54:46", "remaining_time": "1 day, 1:17:25", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11140, "total_steps": 17540, "loss": 0.6753, "learning_rate": 7.072286583365533e-06, "epoch": 6.349839686498041, "percentage": 63.51, "elapsed_time": "1 day, 19:57:06", "remaining_time": "1 day, 1:15:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11150, "total_steps": 17540, "loss": 0.6821, "learning_rate": 7.053263280051394e-06, "epoch": 6.355539722123264, "percentage": 63.57, "elapsed_time": "1 day, 19:59:29", "remaining_time": "1 day, 1:12:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11160, "total_steps": 17540, "loss": 0.6628, "learning_rate": 7.034251647432811e-06, "epoch": 6.361239757748486, "percentage": 63.63, "elapsed_time": "1 day, 20:01:51", "remaining_time": "1 day, 1:10:18", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11170, "total_steps": 17540, "loss": 0.6708, "learning_rate": 7.01525176080629e-06, "epoch": 6.366939793373708, "percentage": 63.68, "elapsed_time": "1 day, 20:04:17", "remaining_time": "1 day, 1:07:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11180, "total_steps": 17540, "loss": 0.6746, "learning_rate": 6.99626369542181e-06, "epoch": 6.372639828998931, "percentage": 63.74, "elapsed_time": "1 day, 20:06:40", "remaining_time": "1 day, 1:05:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11190, "total_steps": 17540, "loss": 0.6877, "learning_rate": 6.977287526482541e-06, "epoch": 6.378339864624154, "percentage": 63.8, "elapsed_time": "1 day, 20:09:00", "remaining_time": "1 day, 1:03:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11200, "total_steps": 17540, "loss": 0.6732, "learning_rate": 6.958323329144534e-06, "epoch": 6.384039900249377, "percentage": 63.85, "elapsed_time": "1 day, 20:11:22", "remaining_time": "1 day, 1:00:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11210, "total_steps": 17540, "loss": 0.677, "learning_rate": 6.939371178516423e-06, "epoch": 6.3897399358746, "percentage": 63.91, "elapsed_time": "1 day, 20:13:41", "remaining_time": "1 day, 0:58:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11220, "total_steps": 17540, "loss": 0.6673, "learning_rate": 6.920431149659128e-06, "epoch": 6.395439971499822, "percentage": 63.97, "elapsed_time": "1 day, 20:16:05", "remaining_time": "1 day, 0:56:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11230, "total_steps": 17540, "loss": 0.6773, "learning_rate": 6.901503317585565e-06, "epoch": 6.401140007125044, "percentage": 64.03, "elapsed_time": "1 day, 20:18:26", "remaining_time": "1 day, 0:53:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11240, "total_steps": 17540, "loss": 0.6767, "learning_rate": 6.882587757260349e-06, "epoch": 6.406840042750267, "percentage": 64.08, "elapsed_time": "1 day, 20:20:51", "remaining_time": "1 day, 0:51:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11250, "total_steps": 17540, "loss": 0.6848, "learning_rate": 6.86368454359948e-06, "epoch": 6.41254007837549, "percentage": 64.14, "elapsed_time": "1 day, 20:23:16", "remaining_time": "1 day, 0:49:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11260, "total_steps": 17540, "loss": 0.6827, "learning_rate": 6.844793751470069e-06, "epoch": 6.418240114000713, "percentage": 64.2, "elapsed_time": "1 day, 20:25:37", "remaining_time": "1 day, 0:46:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11270, "total_steps": 17540, "loss": 0.6712, "learning_rate": 6.825915455690015e-06, "epoch": 6.423940149625935, "percentage": 64.25, "elapsed_time": "1 day, 20:27:57", "remaining_time": "1 day, 0:44:18", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11280, "total_steps": 17540, "loss": 0.6856, "learning_rate": 6.807049731027751e-06, "epoch": 6.4296401852511575, "percentage": 64.31, "elapsed_time": "1 day, 20:30:19", "remaining_time": "1 day, 0:41:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11290, "total_steps": 17540, "loss": 0.6775, "learning_rate": 6.788196652201899e-06, "epoch": 6.43534022087638, "percentage": 64.37, "elapsed_time": "1 day, 20:32:43", "remaining_time": "1 day, 0:39:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11300, "total_steps": 17540, "loss": 0.6784, "learning_rate": 6.769356293881005e-06, "epoch": 6.441040256501603, "percentage": 64.42, "elapsed_time": "1 day, 20:35:06", "remaining_time": "1 day, 0:37:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11310, "total_steps": 17540, "loss": 0.6781, "learning_rate": 6.750528730683231e-06, "epoch": 6.446740292126826, "percentage": 64.48, "elapsed_time": "1 day, 20:37:25", "remaining_time": "1 day, 0:34:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11320, "total_steps": 17540, "loss": 0.6872, "learning_rate": 6.731714037176071e-06, "epoch": 6.452440327752049, "percentage": 64.54, "elapsed_time": "1 day, 20:39:47", "remaining_time": "1 day, 0:32:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11330, "total_steps": 17540, "loss": 0.6746, "learning_rate": 6.712912287876041e-06, "epoch": 6.458140363377271, "percentage": 64.6, "elapsed_time": "1 day, 20:42:05", "remaining_time": "1 day, 0:30:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11340, "total_steps": 17540, "loss": 0.6717, "learning_rate": 6.6941235572483905e-06, "epoch": 6.4638403990024935, "percentage": 64.65, "elapsed_time": "1 day, 20:44:25", "remaining_time": "1 day, 0:27:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11350, "total_steps": 17540, "loss": 0.6888, "learning_rate": 6.6753479197068136e-06, "epoch": 6.469540434627716, "percentage": 64.71, "elapsed_time": "1 day, 20:46:51", "remaining_time": "1 day, 0:25:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11360, "total_steps": 17540, "loss": 0.6704, "learning_rate": 6.65658544961314e-06, "epoch": 6.475240470252939, "percentage": 64.77, "elapsed_time": "1 day, 20:49:13", "remaining_time": "1 day, 0:22:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11370, "total_steps": 17540, "loss": 0.681, "learning_rate": 6.637836221277063e-06, "epoch": 6.480940505878162, "percentage": 64.82, "elapsed_time": "1 day, 20:51:42", "remaining_time": "1 day, 0:20:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11380, "total_steps": 17540, "loss": 0.68, "learning_rate": 6.619100308955817e-06, "epoch": 6.486640541503385, "percentage": 64.88, "elapsed_time": "1 day, 20:54:05", "remaining_time": "1 day, 0:18:18", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11390, "total_steps": 17540, "loss": 0.6787, "learning_rate": 6.600377786853903e-06, "epoch": 6.492340577128607, "percentage": 64.94, "elapsed_time": "1 day, 20:56:28", "remaining_time": "1 day, 0:15:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11400, "total_steps": 17540, "loss": 0.6819, "learning_rate": 6.581668729122788e-06, "epoch": 6.4980406127538295, "percentage": 64.99, "elapsed_time": "1 day, 20:58:49", "remaining_time": "1 day, 0:13:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11410, "total_steps": 17540, "loss": 0.6799, "learning_rate": 6.562973209860619e-06, "epoch": 6.503740648379052, "percentage": 65.05, "elapsed_time": "1 day, 21:01:08", "remaining_time": "1 day, 0:11:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11420, "total_steps": 17540, "loss": 0.6789, "learning_rate": 6.544291303111918e-06, "epoch": 6.509440684004275, "percentage": 65.11, "elapsed_time": "1 day, 21:03:32", "remaining_time": "1 day, 0:08:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11430, "total_steps": 17540, "loss": 0.6779, "learning_rate": 6.525623082867292e-06, "epoch": 6.515140719629498, "percentage": 65.17, "elapsed_time": "1 day, 21:05:55", "remaining_time": "1 day, 0:06:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11440, "total_steps": 17540, "loss": 0.6828, "learning_rate": 6.506968623063145e-06, "epoch": 6.520840755254721, "percentage": 65.22, "elapsed_time": "1 day, 21:08:15", "remaining_time": "1 day, 0:04:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11450, "total_steps": 17540, "loss": 0.6665, "learning_rate": 6.488327997581383e-06, "epoch": 6.526540790879943, "percentage": 65.28, "elapsed_time": "1 day, 21:10:35", "remaining_time": "1 day, 0:01:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11460, "total_steps": 17540, "loss": 0.675, "learning_rate": 6.469701280249118e-06, "epoch": 6.5322408265051655, "percentage": 65.34, "elapsed_time": "1 day, 21:12:55", "remaining_time": "23:59:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11470, "total_steps": 17540, "loss": 0.681, "learning_rate": 6.4510885448383796e-06, "epoch": 6.537940862130388, "percentage": 65.39, "elapsed_time": "1 day, 21:15:19", "remaining_time": "23:56:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11480, "total_steps": 17540, "loss": 0.6743, "learning_rate": 6.432489865065821e-06, "epoch": 6.543640897755611, "percentage": 65.45, "elapsed_time": "1 day, 21:17:40", "remaining_time": "23:54:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11490, "total_steps": 17540, "loss": 0.6714, "learning_rate": 6.4139053145924234e-06, "epoch": 6.549340933380834, "percentage": 65.51, "elapsed_time": "1 day, 21:20:03", "remaining_time": "23:52:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11500, "total_steps": 17540, "loss": 0.6763, "learning_rate": 6.395334967023219e-06, "epoch": 6.555040969006056, "percentage": 65.56, "elapsed_time": "1 day, 21:22:23", "remaining_time": "23:49:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11510, "total_steps": 17540, "loss": 0.6829, "learning_rate": 6.3767788959069765e-06, "epoch": 6.560741004631279, "percentage": 65.62, "elapsed_time": "1 day, 21:24:45", "remaining_time": "23:47:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11520, "total_steps": 17540, "loss": 0.6764, "learning_rate": 6.358237174735931e-06, "epoch": 6.566441040256501, "percentage": 65.68, "elapsed_time": "1 day, 21:27:08", "remaining_time": "23:45:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11530, "total_steps": 17540, "loss": 0.6869, "learning_rate": 6.339709876945475e-06, "epoch": 6.572141075881724, "percentage": 65.74, "elapsed_time": "1 day, 21:29:32", "remaining_time": "23:42:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11540, "total_steps": 17540, "loss": 0.6776, "learning_rate": 6.321197075913883e-06, "epoch": 6.577841111506947, "percentage": 65.79, "elapsed_time": "1 day, 21:31:56", "remaining_time": "23:40:25", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11550, "total_steps": 17540, "loss": 0.6768, "learning_rate": 6.302698844962019e-06, "epoch": 6.58354114713217, "percentage": 65.85, "elapsed_time": "1 day, 21:34:20", "remaining_time": "23:38:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11560, "total_steps": 17540, "loss": 0.6839, "learning_rate": 6.2842152573530294e-06, "epoch": 6.589241182757393, "percentage": 65.91, "elapsed_time": "1 day, 21:36:43", "remaining_time": "23:35:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11570, "total_steps": 17540, "loss": 0.6822, "learning_rate": 6.265746386292073e-06, "epoch": 6.594941218382615, "percentage": 65.96, "elapsed_time": "1 day, 21:39:06", "remaining_time": "23:33:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11580, "total_steps": 17540, "loss": 0.6687, "learning_rate": 6.24729230492602e-06, "epoch": 6.600641254007837, "percentage": 66.02, "elapsed_time": "1 day, 21:41:35", "remaining_time": "23:31:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11590, "total_steps": 17540, "loss": 0.6845, "learning_rate": 6.228853086343169e-06, "epoch": 6.60634128963306, "percentage": 66.08, "elapsed_time": "1 day, 21:43:54", "remaining_time": "23:28:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11600, "total_steps": 17540, "loss": 0.675, "learning_rate": 6.210428803572949e-06, "epoch": 6.612041325258283, "percentage": 66.13, "elapsed_time": "1 day, 21:46:14", "remaining_time": "23:26:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11610, "total_steps": 17540, "loss": 0.6877, "learning_rate": 6.192019529585638e-06, "epoch": 6.617741360883506, "percentage": 66.19, "elapsed_time": "1 day, 21:48:39", "remaining_time": "23:23:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11620, "total_steps": 17540, "loss": 0.6703, "learning_rate": 6.173625337292068e-06, "epoch": 6.623441396508728, "percentage": 66.25, "elapsed_time": "1 day, 21:51:04", "remaining_time": "23:21:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11630, "total_steps": 17540, "loss": 0.6641, "learning_rate": 6.155246299543342e-06, "epoch": 6.629141432133951, "percentage": 66.31, "elapsed_time": "1 day, 21:53:27", "remaining_time": "23:19:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11640, "total_steps": 17540, "loss": 0.6715, "learning_rate": 6.136882489130545e-06, "epoch": 6.634841467759173, "percentage": 66.36, "elapsed_time": "1 day, 21:55:46", "remaining_time": "23:16:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11650, "total_steps": 17540, "loss": 0.6773, "learning_rate": 6.1185339787844475e-06, "epoch": 6.640541503384396, "percentage": 66.42, "elapsed_time": "1 day, 21:58:12", "remaining_time": "23:14:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11660, "total_steps": 17540, "loss": 0.67, "learning_rate": 6.100200841175228e-06, "epoch": 6.646241539009619, "percentage": 66.48, "elapsed_time": "1 day, 22:00:40", "remaining_time": "23:12:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11670, "total_steps": 17540, "loss": 0.6761, "learning_rate": 6.081883148912174e-06, "epoch": 6.651941574634842, "percentage": 66.53, "elapsed_time": "1 day, 22:02:57", "remaining_time": "23:09:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11680, "total_steps": 17540, "loss": 0.6764, "learning_rate": 6.06358097454341e-06, "epoch": 6.657641610260065, "percentage": 66.59, "elapsed_time": "1 day, 22:05:14", "remaining_time": "23:07:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11690, "total_steps": 17540, "loss": 0.6778, "learning_rate": 6.045294390555598e-06, "epoch": 6.6633416458852865, "percentage": 66.65, "elapsed_time": "1 day, 22:07:40", "remaining_time": "23:05:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11700, "total_steps": 17540, "loss": 0.6683, "learning_rate": 6.027023469373654e-06, "epoch": 6.669041681510509, "percentage": 66.7, "elapsed_time": "1 day, 22:10:06", "remaining_time": "23:02:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11710, "total_steps": 17540, "loss": 0.6883, "learning_rate": 6.0087682833604475e-06, "epoch": 6.674741717135732, "percentage": 66.76, "elapsed_time": "1 day, 22:12:26", "remaining_time": "23:00:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11720, "total_steps": 17540, "loss": 0.6803, "learning_rate": 5.990528904816553e-06, "epoch": 6.680441752760955, "percentage": 66.82, "elapsed_time": "1 day, 22:14:51", "remaining_time": "22:57:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11730, "total_steps": 17540, "loss": 0.6711, "learning_rate": 5.972305405979919e-06, "epoch": 6.686141788386178, "percentage": 66.88, "elapsed_time": "1 day, 22:17:15", "remaining_time": "22:55:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11740, "total_steps": 17540, "loss": 0.6813, "learning_rate": 5.954097859025609e-06, "epoch": 6.6918418240114, "percentage": 66.93, "elapsed_time": "1 day, 22:19:34", "remaining_time": "22:53:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11750, "total_steps": 17540, "loss": 0.6802, "learning_rate": 5.9359063360655065e-06, "epoch": 6.6975418596366225, "percentage": 66.99, "elapsed_time": "1 day, 22:21:54", "remaining_time": "22:50:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11760, "total_steps": 17540, "loss": 0.6762, "learning_rate": 5.9177309091480295e-06, "epoch": 6.703241895261845, "percentage": 67.05, "elapsed_time": "1 day, 22:24:16", "remaining_time": "22:48:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11770, "total_steps": 17540, "loss": 0.674, "learning_rate": 5.899571650257856e-06, "epoch": 6.708941930887068, "percentage": 67.1, "elapsed_time": "1 day, 22:26:41", "remaining_time": "22:46:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11780, "total_steps": 17540, "loss": 0.6759, "learning_rate": 5.88142863131562e-06, "epoch": 6.714641966512291, "percentage": 67.16, "elapsed_time": "1 day, 22:29:01", "remaining_time": "22:43:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11790, "total_steps": 17540, "loss": 0.6806, "learning_rate": 5.863301924177638e-06, "epoch": 6.720342002137514, "percentage": 67.22, "elapsed_time": "1 day, 22:31:27", "remaining_time": "22:41:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11800, "total_steps": 17540, "loss": 0.6889, "learning_rate": 5.84519160063562e-06, "epoch": 6.726042037762736, "percentage": 67.27, "elapsed_time": "1 day, 22:33:48", "remaining_time": "22:39:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11810, "total_steps": 17540, "loss": 0.6768, "learning_rate": 5.827097732416404e-06, "epoch": 6.7317420733879585, "percentage": 67.33, "elapsed_time": "1 day, 22:36:05", "remaining_time": "22:36:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11820, "total_steps": 17540, "loss": 0.67, "learning_rate": 5.809020391181635e-06, "epoch": 6.737442109013181, "percentage": 67.39, "elapsed_time": "1 day, 22:38:29", "remaining_time": "22:34:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11830, "total_steps": 17540, "loss": 0.6825, "learning_rate": 5.790959648527513e-06, "epoch": 6.743142144638404, "percentage": 67.45, "elapsed_time": "1 day, 22:40:55", "remaining_time": "22:31:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11840, "total_steps": 17540, "loss": 0.6653, "learning_rate": 5.772915575984497e-06, "epoch": 6.748842180263627, "percentage": 67.5, "elapsed_time": "1 day, 22:43:13", "remaining_time": "22:29:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11850, "total_steps": 17540, "loss": 0.6715, "learning_rate": 5.754888245017019e-06, "epoch": 6.754542215888849, "percentage": 67.56, "elapsed_time": "1 day, 22:45:40", "remaining_time": "22:27:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11860, "total_steps": 17540, "loss": 0.6687, "learning_rate": 5.736877727023217e-06, "epoch": 6.760242251514072, "percentage": 67.62, "elapsed_time": "1 day, 22:48:03", "remaining_time": "22:24:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11870, "total_steps": 17540, "loss": 0.676, "learning_rate": 5.7188840933346265e-06, "epoch": 6.7659422871392945, "percentage": 67.67, "elapsed_time": "1 day, 22:50:26", "remaining_time": "22:22:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11880, "total_steps": 17540, "loss": 0.6783, "learning_rate": 5.700907415215922e-06, "epoch": 6.771642322764517, "percentage": 67.73, "elapsed_time": "1 day, 22:52:53", "remaining_time": "22:20:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11890, "total_steps": 17540, "loss": 0.6734, "learning_rate": 5.682947763864612e-06, "epoch": 6.77734235838974, "percentage": 67.79, "elapsed_time": "1 day, 22:55:16", "remaining_time": "22:17:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11900, "total_steps": 17540, "loss": 0.6719, "learning_rate": 5.665005210410788e-06, "epoch": 6.783042394014963, "percentage": 67.84, "elapsed_time": "1 day, 22:57:36", "remaining_time": "22:15:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11910, "total_steps": 17540, "loss": 0.6756, "learning_rate": 5.64707982591681e-06, "epoch": 6.788742429640186, "percentage": 67.9, "elapsed_time": "1 day, 23:00:00", "remaining_time": "22:13:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11920, "total_steps": 17540, "loss": 0.6682, "learning_rate": 5.629171681377049e-06, "epoch": 6.794442465265408, "percentage": 67.96, "elapsed_time": "1 day, 23:02:21", "remaining_time": "22:10:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11930, "total_steps": 17540, "loss": 0.6729, "learning_rate": 5.611280847717581e-06, "epoch": 6.80014250089063, "percentage": 68.02, "elapsed_time": "1 day, 23:04:40", "remaining_time": "22:08:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11940, "total_steps": 17540, "loss": 0.6746, "learning_rate": 5.593407395795936e-06, "epoch": 6.805842536515853, "percentage": 68.07, "elapsed_time": "1 day, 23:07:00", "remaining_time": "22:05:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11950, "total_steps": 17540, "loss": 0.6637, "learning_rate": 5.575551396400802e-06, "epoch": 6.811542572141076, "percentage": 68.13, "elapsed_time": "1 day, 23:09:22", "remaining_time": "22:03:32", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11960, "total_steps": 17540, "loss": 0.6861, "learning_rate": 5.557712920251741e-06, "epoch": 6.817242607766299, "percentage": 68.19, "elapsed_time": "1 day, 23:11:44", "remaining_time": "22:01:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11970, "total_steps": 17540, "loss": 0.6742, "learning_rate": 5.539892037998911e-06, "epoch": 6.822942643391521, "percentage": 68.24, "elapsed_time": "1 day, 23:14:15", "remaining_time": "21:58:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11980, "total_steps": 17540, "loss": 0.6707, "learning_rate": 5.5220888202227906e-06, "epoch": 6.828642679016744, "percentage": 68.3, "elapsed_time": "1 day, 23:16:39", "remaining_time": "21:56:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 11990, "total_steps": 17540, "loss": 0.6833, "learning_rate": 5.504303337433905e-06, "epoch": 6.834342714641966, "percentage": 68.36, "elapsed_time": "1 day, 23:19:01", "remaining_time": "21:54:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12000, "total_steps": 17540, "loss": 0.682, "learning_rate": 5.48653566007253e-06, "epoch": 6.840042750267189, "percentage": 68.42, "elapsed_time": "1 day, 23:21:29", "remaining_time": "21:51:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12010, "total_steps": 17540, "loss": 0.6661, "learning_rate": 5.468785858508423e-06, "epoch": 6.845742785892412, "percentage": 68.47, "elapsed_time": "1 day, 23:23:51", "remaining_time": "21:49:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12020, "total_steps": 17540, "loss": 0.6825, "learning_rate": 5.451054003040541e-06, "epoch": 6.851442821517635, "percentage": 68.53, "elapsed_time": "1 day, 23:26:10", "remaining_time": "21:47:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12030, "total_steps": 17540, "loss": 0.6817, "learning_rate": 5.4333401638967794e-06, "epoch": 6.857142857142857, "percentage": 68.59, "elapsed_time": "1 day, 23:28:31", "remaining_time": "21:44:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12040, "total_steps": 17540, "loss": 0.6756, "learning_rate": 5.415644411233667e-06, "epoch": 6.86284289276808, "percentage": 68.64, "elapsed_time": "1 day, 23:30:45", "remaining_time": "21:42:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12050, "total_steps": 17540, "loss": 0.6769, "learning_rate": 5.3979668151360905e-06, "epoch": 6.868542928393302, "percentage": 68.7, "elapsed_time": "1 day, 23:33:09", "remaining_time": "21:39:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12060, "total_steps": 17540, "loss": 0.6759, "learning_rate": 5.380307445617048e-06, "epoch": 6.874242964018525, "percentage": 68.76, "elapsed_time": "1 day, 23:35:29", "remaining_time": "21:37:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12070, "total_steps": 17540, "loss": 0.6758, "learning_rate": 5.362666372617331e-06, "epoch": 6.879942999643748, "percentage": 68.81, "elapsed_time": "1 day, 23:37:50", "remaining_time": "21:35:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12080, "total_steps": 17540, "loss": 0.6658, "learning_rate": 5.345043666005287e-06, "epoch": 6.885643035268971, "percentage": 68.87, "elapsed_time": "1 day, 23:40:12", "remaining_time": "21:32:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12090, "total_steps": 17540, "loss": 0.6705, "learning_rate": 5.327439395576503e-06, "epoch": 6.891343070894193, "percentage": 68.93, "elapsed_time": "1 day, 23:42:35", "remaining_time": "21:30:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12100, "total_steps": 17540, "loss": 0.6748, "learning_rate": 5.309853631053563e-06, "epoch": 6.8970431065194155, "percentage": 68.99, "elapsed_time": "1 day, 23:44:51", "remaining_time": "21:28:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12110, "total_steps": 17540, "loss": 0.6728, "learning_rate": 5.2922864420857425e-06, "epoch": 6.902743142144638, "percentage": 69.04, "elapsed_time": "1 day, 23:47:14", "remaining_time": "21:25:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12120, "total_steps": 17540, "loss": 0.6847, "learning_rate": 5.274737898248767e-06, "epoch": 6.908443177769861, "percentage": 69.1, "elapsed_time": "1 day, 23:49:37", "remaining_time": "21:23:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12130, "total_steps": 17540, "loss": 0.6755, "learning_rate": 5.257208069044501e-06, "epoch": 6.914143213395084, "percentage": 69.16, "elapsed_time": "1 day, 23:52:00", "remaining_time": "21:20:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12140, "total_steps": 17540, "loss": 0.6694, "learning_rate": 5.239697023900696e-06, "epoch": 6.919843249020307, "percentage": 69.21, "elapsed_time": "1 day, 23:54:20", "remaining_time": "21:18:32", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12150, "total_steps": 17540, "loss": 0.6787, "learning_rate": 5.222204832170705e-06, "epoch": 6.925543284645529, "percentage": 69.27, "elapsed_time": "1 day, 23:56:41", "remaining_time": "21:16:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12160, "total_steps": 17540, "loss": 0.6771, "learning_rate": 5.204731563133214e-06, "epoch": 6.9312433202707515, "percentage": 69.33, "elapsed_time": "1 day, 23:59:03", "remaining_time": "21:13:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12170, "total_steps": 17540, "loss": 0.6743, "learning_rate": 5.187277285991963e-06, "epoch": 6.936943355895974, "percentage": 69.38, "elapsed_time": "2 days, 0:01:20", "remaining_time": "21:11:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12180, "total_steps": 17540, "loss": 0.6817, "learning_rate": 5.169842069875474e-06, "epoch": 6.942643391521197, "percentage": 69.44, "elapsed_time": "2 days, 0:03:41", "remaining_time": "21:09:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12190, "total_steps": 17540, "loss": 0.6808, "learning_rate": 5.152425983836777e-06, "epoch": 6.94834342714642, "percentage": 69.5, "elapsed_time": "2 days, 0:05:59", "remaining_time": "21:06:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12200, "total_steps": 17540, "loss": 0.6699, "learning_rate": 5.135029096853132e-06, "epoch": 6.954043462771642, "percentage": 69.56, "elapsed_time": "2 days, 0:08:23", "remaining_time": "21:04:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12210, "total_steps": 17540, "loss": 0.6749, "learning_rate": 5.117651477825776e-06, "epoch": 6.959743498396865, "percentage": 69.61, "elapsed_time": "2 days, 0:10:46", "remaining_time": "21:01:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12220, "total_steps": 17540, "loss": 0.6681, "learning_rate": 5.100293195579613e-06, "epoch": 6.9654435340220875, "percentage": 69.67, "elapsed_time": "2 days, 0:13:05", "remaining_time": "20:59:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12230, "total_steps": 17540, "loss": 0.6765, "learning_rate": 5.082954318862978e-06, "epoch": 6.97114356964731, "percentage": 69.73, "elapsed_time": "2 days, 0:15:22", "remaining_time": "20:57:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12240, "total_steps": 17540, "loss": 0.6758, "learning_rate": 5.0656349163473405e-06, "epoch": 6.976843605272533, "percentage": 69.78, "elapsed_time": "2 days, 0:17:44", "remaining_time": "20:54:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12250, "total_steps": 17540, "loss": 0.6793, "learning_rate": 5.048335056627043e-06, "epoch": 6.982543640897756, "percentage": 69.84, "elapsed_time": "2 days, 0:20:07", "remaining_time": "20:52:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12260, "total_steps": 17540, "loss": 0.6733, "learning_rate": 5.031054808219038e-06, "epoch": 6.988243676522979, "percentage": 69.9, "elapsed_time": "2 days, 0:22:31", "remaining_time": "20:50:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12270, "total_steps": 17540, "loss": 0.6736, "learning_rate": 5.013794239562593e-06, "epoch": 6.993943712148201, "percentage": 69.95, "elapsed_time": "2 days, 0:24:52", "remaining_time": "20:47:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12280, "total_steps": 17540, "loss": 0.6801, "learning_rate": 4.996553419019039e-06, "epoch": 6.9996437477734235, "percentage": 70.01, "elapsed_time": "2 days, 0:27:09", "remaining_time": "20:45:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12290, "total_steps": 17540, "loss": 0.66, "learning_rate": 4.9793324148714935e-06, "epoch": 7.005343783398646, "percentage": 70.07, "elapsed_time": "2 days, 0:29:33", "remaining_time": "20:42:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12300, "total_steps": 17540, "loss": 0.6675, "learning_rate": 4.962131295324588e-06, "epoch": 7.011043819023869, "percentage": 70.13, "elapsed_time": "2 days, 0:31:55", "remaining_time": "20:40:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12310, "total_steps": 17540, "loss": 0.6717, "learning_rate": 4.944950128504202e-06, "epoch": 7.016743854649092, "percentage": 70.18, "elapsed_time": "2 days, 0:34:22", "remaining_time": "20:38:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12320, "total_steps": 17540, "loss": 0.6669, "learning_rate": 4.9277889824571925e-06, "epoch": 7.022443890274314, "percentage": 70.24, "elapsed_time": "2 days, 0:36:49", "remaining_time": "20:35:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12330, "total_steps": 17540, "loss": 0.6622, "learning_rate": 4.910647925151115e-06, "epoch": 7.028143925899537, "percentage": 70.3, "elapsed_time": "2 days, 0:39:10", "remaining_time": "20:33:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12340, "total_steps": 17540, "loss": 0.6572, "learning_rate": 4.893527024473979e-06, "epoch": 7.033843961524759, "percentage": 70.35, "elapsed_time": "2 days, 0:41:30", "remaining_time": "20:31:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12350, "total_steps": 17540, "loss": 0.6626, "learning_rate": 4.876426348233948e-06, "epoch": 7.039543997149982, "percentage": 70.41, "elapsed_time": "2 days, 0:43:50", "remaining_time": "20:28:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12360, "total_steps": 17540, "loss": 0.6636, "learning_rate": 4.85934596415909e-06, "epoch": 7.045244032775205, "percentage": 70.47, "elapsed_time": "2 days, 0:46:14", "remaining_time": "20:26:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12370, "total_steps": 17540, "loss": 0.6621, "learning_rate": 4.842285939897107e-06, "epoch": 7.050944068400428, "percentage": 70.52, "elapsed_time": "2 days, 0:48:35", "remaining_time": "20:23:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12380, "total_steps": 17540, "loss": 0.657, "learning_rate": 4.825246343015056e-06, "epoch": 7.05664410402565, "percentage": 70.58, "elapsed_time": "2 days, 0:50:58", "remaining_time": "20:21:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12390, "total_steps": 17540, "loss": 0.6591, "learning_rate": 4.808227240999109e-06, "epoch": 7.062344139650873, "percentage": 70.64, "elapsed_time": "2 days, 0:53:17", "remaining_time": "20:19:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12400, "total_steps": 17540, "loss": 0.6561, "learning_rate": 4.791228701254251e-06, "epoch": 7.068044175276095, "percentage": 70.7, "elapsed_time": "2 days, 0:55:36", "remaining_time": "20:16:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12410, "total_steps": 17540, "loss": 0.6647, "learning_rate": 4.774250791104033e-06, "epoch": 7.073744210901318, "percentage": 70.75, "elapsed_time": "2 days, 0:57:57", "remaining_time": "20:14:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12420, "total_steps": 17540, "loss": 0.6634, "learning_rate": 4.757293577790302e-06, "epoch": 7.079444246526541, "percentage": 70.81, "elapsed_time": "2 days, 1:00:25", "remaining_time": "20:12:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12430, "total_steps": 17540, "loss": 0.6785, "learning_rate": 4.740357128472936e-06, "epoch": 7.085144282151764, "percentage": 70.87, "elapsed_time": "2 days, 1:02:41", "remaining_time": "20:09:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12440, "total_steps": 17540, "loss": 0.6785, "learning_rate": 4.723441510229572e-06, "epoch": 7.090844317776986, "percentage": 70.92, "elapsed_time": "2 days, 1:05:02", "remaining_time": "20:07:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12450, "total_steps": 17540, "loss": 0.6596, "learning_rate": 4.70654679005535e-06, "epoch": 7.096544353402209, "percentage": 70.98, "elapsed_time": "2 days, 1:07:25", "remaining_time": "20:05:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12460, "total_steps": 17540, "loss": 0.6594, "learning_rate": 4.689673034862637e-06, "epoch": 7.102244389027431, "percentage": 71.04, "elapsed_time": "2 days, 1:09:53", "remaining_time": "20:02:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12470, "total_steps": 17540, "loss": 0.6627, "learning_rate": 4.672820311480768e-06, "epoch": 7.107944424652654, "percentage": 71.09, "elapsed_time": "2 days, 1:12:13", "remaining_time": "20:00:18", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12480, "total_steps": 17540, "loss": 0.6667, "learning_rate": 4.655988686655787e-06, "epoch": 7.113644460277877, "percentage": 71.15, "elapsed_time": "2 days, 1:14:32", "remaining_time": "19:57:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12490, "total_steps": 17540, "loss": 0.6582, "learning_rate": 4.639178227050169e-06, "epoch": 7.1193444959031, "percentage": 71.21, "elapsed_time": "2 days, 1:16:56", "remaining_time": "19:55:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12500, "total_steps": 17540, "loss": 0.6558, "learning_rate": 4.622388999242564e-06, "epoch": 7.125044531528322, "percentage": 71.27, "elapsed_time": "2 days, 1:19:14", "remaining_time": "19:53:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12510, "total_steps": 17540, "loss": 0.666, "learning_rate": 4.6056210697275315e-06, "epoch": 7.1307445671535445, "percentage": 71.32, "elapsed_time": "2 days, 1:21:30", "remaining_time": "19:50:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12520, "total_steps": 17540, "loss": 0.6659, "learning_rate": 4.588874504915287e-06, "epoch": 7.136444602778767, "percentage": 71.38, "elapsed_time": "2 days, 1:23:56", "remaining_time": "19:48:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12530, "total_steps": 17540, "loss": 0.6569, "learning_rate": 4.572149371131419e-06, "epoch": 7.14214463840399, "percentage": 71.44, "elapsed_time": "2 days, 1:26:25", "remaining_time": "19:46:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12540, "total_steps": 17540, "loss": 0.6671, "learning_rate": 4.555445734616641e-06, "epoch": 7.147844674029213, "percentage": 71.49, "elapsed_time": "2 days, 1:28:46", "remaining_time": "19:43:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12550, "total_steps": 17540, "loss": 0.6711, "learning_rate": 4.538763661526527e-06, "epoch": 7.153544709654435, "percentage": 71.55, "elapsed_time": "2 days, 1:31:03", "remaining_time": "19:41:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12560, "total_steps": 17540, "loss": 0.6503, "learning_rate": 4.522103217931247e-06, "epoch": 7.159244745279658, "percentage": 71.61, "elapsed_time": "2 days, 1:33:26", "remaining_time": "19:38:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12570, "total_steps": 17540, "loss": 0.6661, "learning_rate": 4.505464469815307e-06, "epoch": 7.1649447809048805, "percentage": 71.66, "elapsed_time": "2 days, 1:35:51", "remaining_time": "19:36:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12580, "total_steps": 17540, "loss": 0.666, "learning_rate": 4.488847483077285e-06, "epoch": 7.170644816530103, "percentage": 71.72, "elapsed_time": "2 days, 1:38:09", "remaining_time": "19:34:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12590, "total_steps": 17540, "loss": 0.6674, "learning_rate": 4.472252323529575e-06, "epoch": 7.176344852155326, "percentage": 71.78, "elapsed_time": "2 days, 1:40:29", "remaining_time": "19:31:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12600, "total_steps": 17540, "loss": 0.6597, "learning_rate": 4.455679056898116e-06, "epoch": 7.182044887780549, "percentage": 71.84, "elapsed_time": "2 days, 1:42:51", "remaining_time": "19:29:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12610, "total_steps": 17540, "loss": 0.6648, "learning_rate": 4.439127748822153e-06, "epoch": 7.187744923405771, "percentage": 71.89, "elapsed_time": "2 days, 1:45:20", "remaining_time": "19:27:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12620, "total_steps": 17540, "loss": 0.677, "learning_rate": 4.4225984648539525e-06, "epoch": 7.193444959030994, "percentage": 71.95, "elapsed_time": "2 days, 1:47:45", "remaining_time": "19:24:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12630, "total_steps": 17540, "loss": 0.6709, "learning_rate": 4.406091270458553e-06, "epoch": 7.1991449946562165, "percentage": 72.01, "elapsed_time": "2 days, 1:50:11", "remaining_time": "19:22:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12640, "total_steps": 17540, "loss": 0.6582, "learning_rate": 4.389606231013512e-06, "epoch": 7.204845030281439, "percentage": 72.06, "elapsed_time": "2 days, 1:52:28", "remaining_time": "19:20:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12650, "total_steps": 17540, "loss": 0.6633, "learning_rate": 4.3731434118086324e-06, "epoch": 7.210545065906662, "percentage": 72.12, "elapsed_time": "2 days, 1:54:51", "remaining_time": "19:17:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12660, "total_steps": 17540, "loss": 0.6662, "learning_rate": 4.356702878045728e-06, "epoch": 7.216245101531885, "percentage": 72.18, "elapsed_time": "2 days, 1:57:11", "remaining_time": "19:15:18", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12670, "total_steps": 17540, "loss": 0.6622, "learning_rate": 4.3402846948383334e-06, "epoch": 7.221945137157107, "percentage": 72.23, "elapsed_time": "2 days, 1:59:29", "remaining_time": "19:12:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12680, "total_steps": 17540, "loss": 0.6759, "learning_rate": 4.323888927211472e-06, "epoch": 7.22764517278233, "percentage": 72.29, "elapsed_time": "2 days, 2:01:53", "remaining_time": "19:10:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12690, "total_steps": 17540, "loss": 0.6648, "learning_rate": 4.307515640101387e-06, "epoch": 7.2333452084075525, "percentage": 72.35, "elapsed_time": "2 days, 2:04:18", "remaining_time": "19:08:12", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12700, "total_steps": 17540, "loss": 0.6614, "learning_rate": 4.291164898355286e-06, "epoch": 7.239045244032775, "percentage": 72.41, "elapsed_time": "2 days, 2:06:37", "remaining_time": "19:05:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12710, "total_steps": 17540, "loss": 0.6583, "learning_rate": 4.274836766731087e-06, "epoch": 7.244745279657998, "percentage": 72.46, "elapsed_time": "2 days, 2:08:56", "remaining_time": "19:03:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12720, "total_steps": 17540, "loss": 0.6676, "learning_rate": 4.2585313098971535e-06, "epoch": 7.250445315283221, "percentage": 72.52, "elapsed_time": "2 days, 2:11:23", "remaining_time": "19:01:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12730, "total_steps": 17540, "loss": 0.6629, "learning_rate": 4.242248592432048e-06, "epoch": 7.256145350908443, "percentage": 72.58, "elapsed_time": "2 days, 2:13:43", "remaining_time": "18:58:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12740, "total_steps": 17540, "loss": 0.6704, "learning_rate": 4.225988678824279e-06, "epoch": 7.261845386533666, "percentage": 72.63, "elapsed_time": "2 days, 2:16:02", "remaining_time": "18:56:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12750, "total_steps": 17540, "loss": 0.676, "learning_rate": 4.209751633472029e-06, "epoch": 7.267545422158888, "percentage": 72.69, "elapsed_time": "2 days, 2:18:29", "remaining_time": "18:54:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12760, "total_steps": 17540, "loss": 0.6634, "learning_rate": 4.1935375206829156e-06, "epoch": 7.273245457784111, "percentage": 72.75, "elapsed_time": "2 days, 2:20:55", "remaining_time": "18:51:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12770, "total_steps": 17540, "loss": 0.6745, "learning_rate": 4.1773464046737275e-06, "epoch": 7.278945493409334, "percentage": 72.81, "elapsed_time": "2 days, 2:23:17", "remaining_time": "18:49:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12780, "total_steps": 17540, "loss": 0.6689, "learning_rate": 4.161178349570173e-06, "epoch": 7.284645529034557, "percentage": 72.86, "elapsed_time": "2 days, 2:25:41", "remaining_time": "18:46:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12790, "total_steps": 17540, "loss": 0.6625, "learning_rate": 4.145033419406635e-06, "epoch": 7.290345564659779, "percentage": 72.92, "elapsed_time": "2 days, 2:28:04", "remaining_time": "18:44:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12800, "total_steps": 17540, "loss": 0.6645, "learning_rate": 4.128911678125902e-06, "epoch": 7.296045600285002, "percentage": 72.98, "elapsed_time": "2 days, 2:30:25", "remaining_time": "18:42:12", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12810, "total_steps": 17540, "loss": 0.6658, "learning_rate": 4.112813189578917e-06, "epoch": 7.301745635910224, "percentage": 73.03, "elapsed_time": "2 days, 2:32:45", "remaining_time": "18:39:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12820, "total_steps": 17540, "loss": 0.6608, "learning_rate": 4.096738017524533e-06, "epoch": 7.307445671535447, "percentage": 73.09, "elapsed_time": "2 days, 2:35:10", "remaining_time": "18:37:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12830, "total_steps": 17540, "loss": 0.6643, "learning_rate": 4.080686225629267e-06, "epoch": 7.31314570716067, "percentage": 73.15, "elapsed_time": "2 days, 2:37:36", "remaining_time": "18:35:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12840, "total_steps": 17540, "loss": 0.6463, "learning_rate": 4.064657877467025e-06, "epoch": 7.318845742785893, "percentage": 73.2, "elapsed_time": "2 days, 2:39:54", "remaining_time": "18:32:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12850, "total_steps": 17540, "loss": 0.6593, "learning_rate": 4.048653036518869e-06, "epoch": 7.324545778411115, "percentage": 73.26, "elapsed_time": "2 days, 2:42:13", "remaining_time": "18:30:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12860, "total_steps": 17540, "loss": 0.6589, "learning_rate": 4.032671766172756e-06, "epoch": 7.330245814036338, "percentage": 73.32, "elapsed_time": "2 days, 2:44:32", "remaining_time": "18:27:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12870, "total_steps": 17540, "loss": 0.6707, "learning_rate": 4.016714129723291e-06, "epoch": 7.33594584966156, "percentage": 73.38, "elapsed_time": "2 days, 2:46:58", "remaining_time": "18:25:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12880, "total_steps": 17540, "loss": 0.6701, "learning_rate": 4.00078019037148e-06, "epoch": 7.341645885286783, "percentage": 73.43, "elapsed_time": "2 days, 2:49:22", "remaining_time": "18:23:16", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12890, "total_steps": 17540, "loss": 0.6648, "learning_rate": 3.984870011224474e-06, "epoch": 7.347345920912006, "percentage": 73.49, "elapsed_time": "2 days, 2:51:46", "remaining_time": "18:20:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12900, "total_steps": 17540, "loss": 0.6736, "learning_rate": 3.968983655295317e-06, "epoch": 7.353045956537228, "percentage": 73.55, "elapsed_time": "2 days, 2:54:12", "remaining_time": "18:18:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12910, "total_steps": 17540, "loss": 0.6745, "learning_rate": 3.953121185502699e-06, "epoch": 7.358745992162451, "percentage": 73.6, "elapsed_time": "2 days, 2:56:34", "remaining_time": "18:16:12", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12920, "total_steps": 17540, "loss": 0.6576, "learning_rate": 3.9372826646707215e-06, "epoch": 7.3644460277876735, "percentage": 73.66, "elapsed_time": "2 days, 2:58:55", "remaining_time": "18:13:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12930, "total_steps": 17540, "loss": 0.6681, "learning_rate": 3.921468155528614e-06, "epoch": 7.370146063412896, "percentage": 73.72, "elapsed_time": "2 days, 3:01:17", "remaining_time": "18:11:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12940, "total_steps": 17540, "loss": 0.658, "learning_rate": 3.90567772071052e-06, "epoch": 7.375846099038119, "percentage": 73.77, "elapsed_time": "2 days, 3:03:46", "remaining_time": "18:09:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12950, "total_steps": 17540, "loss": 0.6643, "learning_rate": 3.8899114227552315e-06, "epoch": 7.381546134663342, "percentage": 73.83, "elapsed_time": "2 days, 3:06:04", "remaining_time": "18:06:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12960, "total_steps": 17540, "loss": 0.6682, "learning_rate": 3.874169324105945e-06, "epoch": 7.387246170288564, "percentage": 73.89, "elapsed_time": "2 days, 3:08:19", "remaining_time": "18:04:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12970, "total_steps": 17540, "loss": 0.6643, "learning_rate": 3.8584514871100206e-06, "epoch": 7.392946205913787, "percentage": 73.95, "elapsed_time": "2 days, 3:10:38", "remaining_time": "18:01:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12980, "total_steps": 17540, "loss": 0.6674, "learning_rate": 3.842757974018721e-06, "epoch": 7.3986462415390095, "percentage": 74.0, "elapsed_time": "2 days, 3:13:04", "remaining_time": "17:59:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 12990, "total_steps": 17540, "loss": 0.6578, "learning_rate": 3.827088846986977e-06, "epoch": 7.404346277164232, "percentage": 74.06, "elapsed_time": "2 days, 3:15:29", "remaining_time": "17:57:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13000, "total_steps": 17540, "loss": 0.6627, "learning_rate": 3.8114441680731317e-06, "epoch": 7.410046312789455, "percentage": 74.12, "elapsed_time": "2 days, 3:17:51", "remaining_time": "17:54:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13010, "total_steps": 17540, "loss": 0.6672, "learning_rate": 3.7958239992387113e-06, "epoch": 7.415746348414678, "percentage": 74.17, "elapsed_time": "2 days, 3:20:11", "remaining_time": "17:52:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13020, "total_steps": 17540, "loss": 0.6591, "learning_rate": 3.7802284023481582e-06, "epoch": 7.4214463840399, "percentage": 74.23, "elapsed_time": "2 days, 3:22:32", "remaining_time": "17:50:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13030, "total_steps": 17540, "loss": 0.6593, "learning_rate": 3.7646574391686007e-06, "epoch": 7.427146419665123, "percentage": 74.29, "elapsed_time": "2 days, 3:24:58", "remaining_time": "17:47:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13040, "total_steps": 17540, "loss": 0.6728, "learning_rate": 3.7491111713696026e-06, "epoch": 7.4328464552903455, "percentage": 74.34, "elapsed_time": "2 days, 3:27:19", "remaining_time": "17:45:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13050, "total_steps": 17540, "loss": 0.6656, "learning_rate": 3.733589660522923e-06, "epoch": 7.438546490915568, "percentage": 74.4, "elapsed_time": "2 days, 3:29:40", "remaining_time": "17:43:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13060, "total_steps": 17540, "loss": 0.6544, "learning_rate": 3.718092968102267e-06, "epoch": 7.444246526540791, "percentage": 74.46, "elapsed_time": "2 days, 3:32:09", "remaining_time": "17:40:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13070, "total_steps": 17540, "loss": 0.6719, "learning_rate": 3.702621155483046e-06, "epoch": 7.449946562166014, "percentage": 74.52, "elapsed_time": "2 days, 3:34:39", "remaining_time": "17:38:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13080, "total_steps": 17540, "loss": 0.663, "learning_rate": 3.6871742839421344e-06, "epoch": 7.455646597791236, "percentage": 74.57, "elapsed_time": "2 days, 3:36:58", "remaining_time": "17:36:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13090, "total_steps": 17540, "loss": 0.6627, "learning_rate": 3.6717524146576234e-06, "epoch": 7.461346633416459, "percentage": 74.63, "elapsed_time": "2 days, 3:39:20", "remaining_time": "17:33:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13100, "total_steps": 17540, "loss": 0.6607, "learning_rate": 3.6563556087085894e-06, "epoch": 7.4670466690416815, "percentage": 74.69, "elapsed_time": "2 days, 3:41:47", "remaining_time": "17:31:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13110, "total_steps": 17540, "loss": 0.6718, "learning_rate": 3.640983927074836e-06, "epoch": 7.472746704666904, "percentage": 74.74, "elapsed_time": "2 days, 3:44:13", "remaining_time": "17:28:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13120, "total_steps": 17540, "loss": 0.6601, "learning_rate": 3.6256374306366635e-06, "epoch": 7.478446740292127, "percentage": 74.8, "elapsed_time": "2 days, 3:46:33", "remaining_time": "17:26:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13130, "total_steps": 17540, "loss": 0.6634, "learning_rate": 3.6103161801746224e-06, "epoch": 7.48414677591735, "percentage": 74.86, "elapsed_time": "2 days, 3:48:50", "remaining_time": "17:24:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13140, "total_steps": 17540, "loss": 0.6626, "learning_rate": 3.5950202363692822e-06, "epoch": 7.489846811542572, "percentage": 74.91, "elapsed_time": "2 days, 3:51:16", "remaining_time": "17:21:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13150, "total_steps": 17540, "loss": 0.6632, "learning_rate": 3.5797496598009794e-06, "epoch": 7.495546847167795, "percentage": 74.97, "elapsed_time": "2 days, 3:53:38", "remaining_time": "17:19:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13160, "total_steps": 17540, "loss": 0.6693, "learning_rate": 3.564504510949581e-06, "epoch": 7.501246882793017, "percentage": 75.03, "elapsed_time": "2 days, 3:55:59", "remaining_time": "17:17:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13170, "total_steps": 17540, "loss": 0.6685, "learning_rate": 3.54928485019425e-06, "epoch": 7.50694691841824, "percentage": 75.09, "elapsed_time": "2 days, 3:58:15", "remaining_time": "17:14:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13180, "total_steps": 17540, "loss": 0.669, "learning_rate": 3.534090737813198e-06, "epoch": 7.512646954043463, "percentage": 75.14, "elapsed_time": "2 days, 4:00:42", "remaining_time": "17:12:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13190, "total_steps": 17540, "loss": 0.6648, "learning_rate": 3.518922233983455e-06, "epoch": 7.518346989668686, "percentage": 75.2, "elapsed_time": "2 days, 4:03:07", "remaining_time": "17:09:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13200, "total_steps": 17540, "loss": 0.6674, "learning_rate": 3.503779398780626e-06, "epoch": 7.524047025293908, "percentage": 75.26, "elapsed_time": "2 days, 4:05:30", "remaining_time": "17:07:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13210, "total_steps": 17540, "loss": 0.6679, "learning_rate": 3.4886622921786517e-06, "epoch": 7.529747060919131, "percentage": 75.31, "elapsed_time": "2 days, 4:07:47", "remaining_time": "17:05:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13220, "total_steps": 17540, "loss": 0.6731, "learning_rate": 3.4735709740495748e-06, "epoch": 7.535447096544353, "percentage": 75.37, "elapsed_time": "2 days, 4:10:08", "remaining_time": "17:02:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13230, "total_steps": 17540, "loss": 0.6609, "learning_rate": 3.4585055041633076e-06, "epoch": 7.541147132169576, "percentage": 75.43, "elapsed_time": "2 days, 4:12:28", "remaining_time": "17:00:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13240, "total_steps": 17540, "loss": 0.6629, "learning_rate": 3.4434659421873807e-06, "epoch": 7.546847167794799, "percentage": 75.48, "elapsed_time": "2 days, 4:14:49", "remaining_time": "16:58:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13250, "total_steps": 17540, "loss": 0.6712, "learning_rate": 3.428452347686717e-06, "epoch": 7.552547203420021, "percentage": 75.54, "elapsed_time": "2 days, 4:17:09", "remaining_time": "16:55:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13260, "total_steps": 17540, "loss": 0.6684, "learning_rate": 3.4134647801233976e-06, "epoch": 7.558247239045244, "percentage": 75.6, "elapsed_time": "2 days, 4:19:30", "remaining_time": "16:53:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13270, "total_steps": 17540, "loss": 0.6651, "learning_rate": 3.3985032988564147e-06, "epoch": 7.563947274670467, "percentage": 75.66, "elapsed_time": "2 days, 4:21:53", "remaining_time": "16:50:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13280, "total_steps": 17540, "loss": 0.6653, "learning_rate": 3.3835679631414588e-06, "epoch": 7.569647310295689, "percentage": 75.71, "elapsed_time": "2 days, 4:24:14", "remaining_time": "16:48:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13290, "total_steps": 17540, "loss": 0.6603, "learning_rate": 3.3686588321306546e-06, "epoch": 7.575347345920912, "percentage": 75.77, "elapsed_time": "2 days, 4:26:35", "remaining_time": "16:46:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13300, "total_steps": 17540, "loss": 0.6591, "learning_rate": 3.35377596487235e-06, "epoch": 7.581047381546135, "percentage": 75.83, "elapsed_time": "2 days, 4:28:57", "remaining_time": "16:43:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13310, "total_steps": 17540, "loss": 0.6793, "learning_rate": 3.338919420310871e-06, "epoch": 7.586747417171358, "percentage": 75.88, "elapsed_time": "2 days, 4:31:18", "remaining_time": "16:41:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13320, "total_steps": 17540, "loss": 0.6711, "learning_rate": 3.3240892572862924e-06, "epoch": 7.59244745279658, "percentage": 75.94, "elapsed_time": "2 days, 4:33:43", "remaining_time": "16:39:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13330, "total_steps": 17540, "loss": 0.6655, "learning_rate": 3.3092855345342047e-06, "epoch": 7.5981474884218025, "percentage": 76.0, "elapsed_time": "2 days, 4:36:07", "remaining_time": "16:36:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13340, "total_steps": 17540, "loss": 0.661, "learning_rate": 3.294508310685478e-06, "epoch": 7.603847524047025, "percentage": 76.05, "elapsed_time": "2 days, 4:38:28", "remaining_time": "16:34:25", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13350, "total_steps": 17540, "loss": 0.6635, "learning_rate": 3.2797576442660293e-06, "epoch": 7.609547559672248, "percentage": 76.11, "elapsed_time": "2 days, 4:40:49", "remaining_time": "16:32:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13360, "total_steps": 17540, "loss": 0.6627, "learning_rate": 3.265033593696606e-06, "epoch": 7.615247595297471, "percentage": 76.17, "elapsed_time": "2 days, 4:43:09", "remaining_time": "16:29:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13370, "total_steps": 17540, "loss": 0.6675, "learning_rate": 3.25033621729253e-06, "epoch": 7.620947630922693, "percentage": 76.23, "elapsed_time": "2 days, 4:45:35", "remaining_time": "16:27:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13380, "total_steps": 17540, "loss": 0.667, "learning_rate": 3.2356655732634825e-06, "epoch": 7.626647666547916, "percentage": 76.28, "elapsed_time": "2 days, 4:47:56", "remaining_time": "16:24:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13390, "total_steps": 17540, "loss": 0.6647, "learning_rate": 3.2210217197132685e-06, "epoch": 7.6323477021731385, "percentage": 76.34, "elapsed_time": "2 days, 4:50:13", "remaining_time": "16:22:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13400, "total_steps": 17540, "loss": 0.6582, "learning_rate": 3.2064047146395894e-06, "epoch": 7.638047737798361, "percentage": 76.4, "elapsed_time": "2 days, 4:52:38", "remaining_time": "16:20:12", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13410, "total_steps": 17540, "loss": 0.6694, "learning_rate": 3.191814615933816e-06, "epoch": 7.643747773423584, "percentage": 76.45, "elapsed_time": "2 days, 4:55:02", "remaining_time": "16:17:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13420, "total_steps": 17540, "loss": 0.664, "learning_rate": 3.1772514813807474e-06, "epoch": 7.649447809048807, "percentage": 76.51, "elapsed_time": "2 days, 4:57:25", "remaining_time": "16:15:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13430, "total_steps": 17540, "loss": 0.6665, "learning_rate": 3.1627153686583954e-06, "epoch": 7.655147844674029, "percentage": 76.57, "elapsed_time": "2 days, 4:59:47", "remaining_time": "16:13:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13440, "total_steps": 17540, "loss": 0.6608, "learning_rate": 3.1482063353377468e-06, "epoch": 7.660847880299252, "percentage": 76.62, "elapsed_time": "2 days, 5:02:08", "remaining_time": "16:10:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13450, "total_steps": 17540, "loss": 0.6662, "learning_rate": 3.1337244388825428e-06, "epoch": 7.6665479159244745, "percentage": 76.68, "elapsed_time": "2 days, 5:04:25", "remaining_time": "16:08:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13460, "total_steps": 17540, "loss": 0.6691, "learning_rate": 3.1192697366490443e-06, "epoch": 7.672247951549697, "percentage": 76.74, "elapsed_time": "2 days, 5:06:46", "remaining_time": "16:05:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13470, "total_steps": 17540, "loss": 0.6597, "learning_rate": 3.104842285885811e-06, "epoch": 7.67794798717492, "percentage": 76.8, "elapsed_time": "2 days, 5:09:05", "remaining_time": "16:03:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13480, "total_steps": 17540, "loss": 0.647, "learning_rate": 3.0904421437334685e-06, "epoch": 7.683648022800142, "percentage": 76.85, "elapsed_time": "2 days, 5:11:28", "remaining_time": "16:01:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13490, "total_steps": 17540, "loss": 0.6608, "learning_rate": 3.0760693672244858e-06, "epoch": 7.689348058425365, "percentage": 76.91, "elapsed_time": "2 days, 5:13:48", "remaining_time": "15:58:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13500, "total_steps": 17540, "loss": 0.6575, "learning_rate": 3.061724013282956e-06, "epoch": 7.695048094050588, "percentage": 76.97, "elapsed_time": "2 days, 5:16:09", "remaining_time": "15:56:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13510, "total_steps": 17540, "loss": 0.6635, "learning_rate": 3.047406138724355e-06, "epoch": 7.7007481296758105, "percentage": 77.02, "elapsed_time": "2 days, 5:18:33", "remaining_time": "15:54:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13520, "total_steps": 17540, "loss": 0.6638, "learning_rate": 3.0331158002553296e-06, "epoch": 7.706448165301033, "percentage": 77.08, "elapsed_time": "2 days, 5:20:54", "remaining_time": "15:51:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13530, "total_steps": 17540, "loss": 0.665, "learning_rate": 3.018853054473463e-06, "epoch": 7.712148200926256, "percentage": 77.14, "elapsed_time": "2 days, 5:23:19", "remaining_time": "15:49:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13540, "total_steps": 17540, "loss": 0.6632, "learning_rate": 3.0046179578670664e-06, "epoch": 7.717848236551479, "percentage": 77.19, "elapsed_time": "2 days, 5:25:42", "remaining_time": "15:47:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13550, "total_steps": 17540, "loss": 0.668, "learning_rate": 2.9904105668149374e-06, "epoch": 7.723548272176701, "percentage": 77.25, "elapsed_time": "2 days, 5:28:08", "remaining_time": "15:44:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13560, "total_steps": 17540, "loss": 0.6633, "learning_rate": 2.9762309375861462e-06, "epoch": 7.729248307801924, "percentage": 77.31, "elapsed_time": "2 days, 5:30:26", "remaining_time": "15:42:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13570, "total_steps": 17540, "loss": 0.6619, "learning_rate": 2.9620791263398142e-06, "epoch": 7.734948343427146, "percentage": 77.37, "elapsed_time": "2 days, 5:32:45", "remaining_time": "15:39:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13580, "total_steps": 17540, "loss": 0.6591, "learning_rate": 2.9479551891248746e-06, "epoch": 7.740648379052369, "percentage": 77.42, "elapsed_time": "2 days, 5:35:10", "remaining_time": "15:37:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13590, "total_steps": 17540, "loss": 0.6642, "learning_rate": 2.9338591818798856e-06, "epoch": 7.746348414677592, "percentage": 77.48, "elapsed_time": "2 days, 5:37:36", "remaining_time": "15:35:12", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13600, "total_steps": 17540, "loss": 0.6644, "learning_rate": 2.919791160432772e-06, "epoch": 7.752048450302814, "percentage": 77.54, "elapsed_time": "2 days, 5:40:03", "remaining_time": "15:32:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13610, "total_steps": 17540, "loss": 0.6637, "learning_rate": 2.9057511805006246e-06, "epoch": 7.757748485928037, "percentage": 77.59, "elapsed_time": "2 days, 5:42:27", "remaining_time": "15:30:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13620, "total_steps": 17540, "loss": 0.6672, "learning_rate": 2.89173929768947e-06, "epoch": 7.76344852155326, "percentage": 77.65, "elapsed_time": "2 days, 5:44:45", "remaining_time": "15:28:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13630, "total_steps": 17540, "loss": 0.6566, "learning_rate": 2.877755567494066e-06, "epoch": 7.769148557178482, "percentage": 77.71, "elapsed_time": "2 days, 5:47:05", "remaining_time": "15:25:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13640, "total_steps": 17540, "loss": 0.6713, "learning_rate": 2.863800045297659e-06, "epoch": 7.774848592803705, "percentage": 77.77, "elapsed_time": "2 days, 5:49:22", "remaining_time": "15:23:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13650, "total_steps": 17540, "loss": 0.6689, "learning_rate": 2.8498727863717803e-06, "epoch": 7.780548628428928, "percentage": 77.82, "elapsed_time": "2 days, 5:51:48", "remaining_time": "15:21:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13660, "total_steps": 17540, "loss": 0.6716, "learning_rate": 2.835973845876022e-06, "epoch": 7.786248664054151, "percentage": 77.88, "elapsed_time": "2 days, 5:54:10", "remaining_time": "15:18:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13670, "total_steps": 17540, "loss": 0.6732, "learning_rate": 2.8221032788578206e-06, "epoch": 7.791948699679373, "percentage": 77.94, "elapsed_time": "2 days, 5:56:30", "remaining_time": "15:16:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13680, "total_steps": 17540, "loss": 0.6718, "learning_rate": 2.808261140252242e-06, "epoch": 7.797648735304596, "percentage": 77.99, "elapsed_time": "2 days, 5:58:55", "remaining_time": "15:13:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13690, "total_steps": 17540, "loss": 0.6619, "learning_rate": 2.7944474848817572e-06, "epoch": 7.803348770929818, "percentage": 78.05, "elapsed_time": "2 days, 6:01:20", "remaining_time": "15:11:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13700, "total_steps": 17540, "loss": 0.6655, "learning_rate": 2.780662367456021e-06, "epoch": 7.809048806555041, "percentage": 78.11, "elapsed_time": "2 days, 6:03:44", "remaining_time": "15:09:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13710, "total_steps": 17540, "loss": 0.6602, "learning_rate": 2.7669058425716676e-06, "epoch": 7.814748842180264, "percentage": 78.16, "elapsed_time": "2 days, 6:06:07", "remaining_time": "15:06:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13720, "total_steps": 17540, "loss": 0.6596, "learning_rate": 2.753177964712096e-06, "epoch": 7.820448877805486, "percentage": 78.22, "elapsed_time": "2 days, 6:08:28", "remaining_time": "15:04:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13730, "total_steps": 17540, "loss": 0.6644, "learning_rate": 2.7394787882472374e-06, "epoch": 7.826148913430709, "percentage": 78.28, "elapsed_time": "2 days, 6:10:47", "remaining_time": "15:02:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13740, "total_steps": 17540, "loss": 0.6616, "learning_rate": 2.7258083674333545e-06, "epoch": 7.8318489490559315, "percentage": 78.34, "elapsed_time": "2 days, 6:13:06", "remaining_time": "14:59:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13750, "total_steps": 17540, "loss": 0.6535, "learning_rate": 2.7121667564128173e-06, "epoch": 7.837548984681154, "percentage": 78.39, "elapsed_time": "2 days, 6:15:28", "remaining_time": "14:57:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13760, "total_steps": 17540, "loss": 0.6774, "learning_rate": 2.698554009213902e-06, "epoch": 7.843249020306377, "percentage": 78.45, "elapsed_time": "2 days, 6:17:54", "remaining_time": "14:54:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13770, "total_steps": 17540, "loss": 0.6659, "learning_rate": 2.684970179750559e-06, "epoch": 7.8489490559316, "percentage": 78.51, "elapsed_time": "2 days, 6:20:24", "remaining_time": "14:52:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13780, "total_steps": 17540, "loss": 0.6699, "learning_rate": 2.6714153218222127e-06, "epoch": 7.854649091556822, "percentage": 78.56, "elapsed_time": "2 days, 6:22:43", "remaining_time": "14:50:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13790, "total_steps": 17540, "loss": 0.6633, "learning_rate": 2.6578894891135455e-06, "epoch": 7.860349127182045, "percentage": 78.62, "elapsed_time": "2 days, 6:25:06", "remaining_time": "14:47:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13800, "total_steps": 17540, "loss": 0.6624, "learning_rate": 2.6443927351942798e-06, "epoch": 7.8660491628072675, "percentage": 78.68, "elapsed_time": "2 days, 6:27:25", "remaining_time": "14:45:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13810, "total_steps": 17540, "loss": 0.6643, "learning_rate": 2.630925113518974e-06, "epoch": 7.87174919843249, "percentage": 78.73, "elapsed_time": "2 days, 6:29:46", "remaining_time": "14:43:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13820, "total_steps": 17540, "loss": 0.6627, "learning_rate": 2.617486677426806e-06, "epoch": 7.877449234057713, "percentage": 78.79, "elapsed_time": "2 days, 6:32:03", "remaining_time": "14:40:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13830, "total_steps": 17540, "loss": 0.6582, "learning_rate": 2.6040774801413616e-06, "epoch": 7.883149269682935, "percentage": 78.85, "elapsed_time": "2 days, 6:34:23", "remaining_time": "14:38:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13840, "total_steps": 17540, "loss": 0.6633, "learning_rate": 2.590697574770421e-06, "epoch": 7.888849305308158, "percentage": 78.91, "elapsed_time": "2 days, 6:36:50", "remaining_time": "14:36:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13850, "total_steps": 17540, "loss": 0.6605, "learning_rate": 2.5773470143057657e-06, "epoch": 7.894549340933381, "percentage": 78.96, "elapsed_time": "2 days, 6:39:11", "remaining_time": "14:33:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13860, "total_steps": 17540, "loss": 0.6654, "learning_rate": 2.564025851622941e-06, "epoch": 7.9002493765586035, "percentage": 79.02, "elapsed_time": "2 days, 6:41:30", "remaining_time": "14:31:16", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13870, "total_steps": 17540, "loss": 0.6674, "learning_rate": 2.550734139481067e-06, "epoch": 7.905949412183826, "percentage": 79.08, "elapsed_time": "2 days, 6:43:54", "remaining_time": "14:28:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13880, "total_steps": 17540, "loss": 0.6709, "learning_rate": 2.5374719305226226e-06, "epoch": 7.911649447809049, "percentage": 79.13, "elapsed_time": "2 days, 6:46:13", "remaining_time": "14:26:32", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13890, "total_steps": 17540, "loss": 0.671, "learning_rate": 2.524239277273235e-06, "epoch": 7.917349483434272, "percentage": 79.19, "elapsed_time": "2 days, 6:48:35", "remaining_time": "14:24:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13900, "total_steps": 17540, "loss": 0.6658, "learning_rate": 2.511036232141484e-06, "epoch": 7.923049519059494, "percentage": 79.25, "elapsed_time": "2 days, 6:50:59", "remaining_time": "14:21:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13910, "total_steps": 17540, "loss": 0.6588, "learning_rate": 2.497862847418674e-06, "epoch": 7.928749554684717, "percentage": 79.3, "elapsed_time": "2 days, 6:53:22", "remaining_time": "14:19:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13920, "total_steps": 17540, "loss": 0.6611, "learning_rate": 2.4847191752786437e-06, "epoch": 7.9344495903099395, "percentage": 79.36, "elapsed_time": "2 days, 6:55:44", "remaining_time": "14:17:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13930, "total_steps": 17540, "loss": 0.6594, "learning_rate": 2.4716052677775524e-06, "epoch": 7.940149625935162, "percentage": 79.42, "elapsed_time": "2 days, 6:58:08", "remaining_time": "14:14:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13940, "total_steps": 17540, "loss": 0.6682, "learning_rate": 2.4585211768536754e-06, "epoch": 7.945849661560385, "percentage": 79.48, "elapsed_time": "2 days, 7:00:29", "remaining_time": "14:12:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13950, "total_steps": 17540, "loss": 0.6636, "learning_rate": 2.445466954327196e-06, "epoch": 7.951549697185607, "percentage": 79.53, "elapsed_time": "2 days, 7:02:53", "remaining_time": "14:09:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13960, "total_steps": 17540, "loss": 0.6693, "learning_rate": 2.4324426519000056e-06, "epoch": 7.95724973281083, "percentage": 79.59, "elapsed_time": "2 days, 7:05:14", "remaining_time": "14:07:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13970, "total_steps": 17540, "loss": 0.6661, "learning_rate": 2.419448321155493e-06, "epoch": 7.962949768436053, "percentage": 79.65, "elapsed_time": "2 days, 7:07:36", "remaining_time": "14:05:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13980, "total_steps": 17540, "loss": 0.6511, "learning_rate": 2.4064840135583413e-06, "epoch": 7.968649804061275, "percentage": 79.7, "elapsed_time": "2 days, 7:09:55", "remaining_time": "14:02:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 13990, "total_steps": 17540, "loss": 0.66, "learning_rate": 2.3935497804543317e-06, "epoch": 7.974349839686498, "percentage": 79.76, "elapsed_time": "2 days, 7:12:14", "remaining_time": "14:00:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14000, "total_steps": 17540, "loss": 0.6638, "learning_rate": 2.380645673070129e-06, "epoch": 7.980049875311721, "percentage": 79.82, "elapsed_time": "2 days, 7:14:43", "remaining_time": "13:58:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14010, "total_steps": 17540, "loss": 0.6664, "learning_rate": 2.3677717425130832e-06, "epoch": 7.985749910936943, "percentage": 79.87, "elapsed_time": "2 days, 7:17:01", "remaining_time": "13:55:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14020, "total_steps": 17540, "loss": 0.6536, "learning_rate": 2.3549280397710273e-06, "epoch": 7.991449946562166, "percentage": 79.93, "elapsed_time": "2 days, 7:19:23", "remaining_time": "13:53:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14030, "total_steps": 17540, "loss": 0.674, "learning_rate": 2.3421146157120813e-06, "epoch": 7.997149982187389, "percentage": 79.99, "elapsed_time": "2 days, 7:21:43", "remaining_time": "13:51:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14040, "total_steps": 17540, "loss": 0.663, "learning_rate": 2.329331521084439e-06, "epoch": 8.00285001781261, "percentage": 80.05, "elapsed_time": "2 days, 7:24:04", "remaining_time": "13:48:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14050, "total_steps": 17540, "loss": 0.6537, "learning_rate": 2.3165788065161742e-06, "epoch": 8.008550053437833, "percentage": 80.1, "elapsed_time": "2 days, 7:26:22", "remaining_time": "13:46:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14060, "total_steps": 17540, "loss": 0.6553, "learning_rate": 2.303856522515039e-06, "epoch": 8.014250089063056, "percentage": 80.16, "elapsed_time": "2 days, 7:28:42", "remaining_time": "13:43:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14070, "total_steps": 17540, "loss": 0.646, "learning_rate": 2.291164719468265e-06, "epoch": 8.019950124688279, "percentage": 80.22, "elapsed_time": "2 days, 7:31:05", "remaining_time": "13:41:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14080, "total_steps": 17540, "loss": 0.6645, "learning_rate": 2.2785034476423608e-06, "epoch": 8.025650160313502, "percentage": 80.27, "elapsed_time": "2 days, 7:33:30", "remaining_time": "13:39:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14090, "total_steps": 17540, "loss": 0.6647, "learning_rate": 2.2658727571829176e-06, "epoch": 8.031350195938725, "percentage": 80.33, "elapsed_time": "2 days, 7:35:51", "remaining_time": "13:36:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14100, "total_steps": 17540, "loss": 0.6608, "learning_rate": 2.2532726981144028e-06, "epoch": 8.037050231563947, "percentage": 80.39, "elapsed_time": "2 days, 7:38:16", "remaining_time": "13:34:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14110, "total_steps": 17540, "loss": 0.6525, "learning_rate": 2.2407033203399687e-06, "epoch": 8.04275026718917, "percentage": 80.44, "elapsed_time": "2 days, 7:40:37", "remaining_time": "13:32:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14120, "total_steps": 17540, "loss": 0.6555, "learning_rate": 2.2281646736412575e-06, "epoch": 8.048450302814393, "percentage": 80.5, "elapsed_time": "2 days, 7:42:53", "remaining_time": "13:29:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14130, "total_steps": 17540, "loss": 0.6531, "learning_rate": 2.215656807678194e-06, "epoch": 8.054150338439616, "percentage": 80.56, "elapsed_time": "2 days, 7:45:11", "remaining_time": "13:27:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14140, "total_steps": 17540, "loss": 0.652, "learning_rate": 2.203179771988796e-06, "epoch": 8.059850374064839, "percentage": 80.62, "elapsed_time": "2 days, 7:47:33", "remaining_time": "13:24:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14150, "total_steps": 17540, "loss": 0.6641, "learning_rate": 2.1907336159889712e-06, "epoch": 8.065550409690061, "percentage": 80.67, "elapsed_time": "2 days, 7:49:51", "remaining_time": "13:22:32", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14160, "total_steps": 17540, "loss": 0.6556, "learning_rate": 2.1783183889723415e-06, "epoch": 8.071250445315282, "percentage": 80.73, "elapsed_time": "2 days, 7:52:18", "remaining_time": "13:20:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14170, "total_steps": 17540, "loss": 0.6625, "learning_rate": 2.1659341401100165e-06, "epoch": 8.076950480940505, "percentage": 80.79, "elapsed_time": "2 days, 7:54:40", "remaining_time": "13:17:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14180, "total_steps": 17540, "loss": 0.6495, "learning_rate": 2.1535809184504255e-06, "epoch": 8.082650516565728, "percentage": 80.84, "elapsed_time": "2 days, 7:57:04", "remaining_time": "13:15:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14190, "total_steps": 17540, "loss": 0.6603, "learning_rate": 2.141258772919108e-06, "epoch": 8.088350552190951, "percentage": 80.9, "elapsed_time": "2 days, 7:59:24", "remaining_time": "13:13:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14200, "total_steps": 17540, "loss": 0.6551, "learning_rate": 2.128967752318527e-06, "epoch": 8.094050587816174, "percentage": 80.96, "elapsed_time": "2 days, 8:01:47", "remaining_time": "13:10:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14210, "total_steps": 17540, "loss": 0.6511, "learning_rate": 2.116707905327874e-06, "epoch": 8.099750623441397, "percentage": 81.01, "elapsed_time": "2 days, 8:04:05", "remaining_time": "13:08:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14220, "total_steps": 17540, "loss": 0.6607, "learning_rate": 2.1044792805028756e-06, "epoch": 8.10545065906662, "percentage": 81.07, "elapsed_time": "2 days, 8:06:27", "remaining_time": "13:05:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14230, "total_steps": 17540, "loss": 0.6453, "learning_rate": 2.0922819262756e-06, "epoch": 8.111150694691842, "percentage": 81.13, "elapsed_time": "2 days, 8:08:43", "remaining_time": "13:03:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14240, "total_steps": 17540, "loss": 0.6517, "learning_rate": 2.080115890954266e-06, "epoch": 8.116850730317065, "percentage": 81.19, "elapsed_time": "2 days, 8:11:05", "remaining_time": "13:01:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14250, "total_steps": 17540, "loss": 0.6485, "learning_rate": 2.06798122272306e-06, "epoch": 8.122550765942288, "percentage": 81.24, "elapsed_time": "2 days, 8:13:25", "remaining_time": "12:58:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14260, "total_steps": 17540, "loss": 0.6633, "learning_rate": 2.0558779696419274e-06, "epoch": 8.12825080156751, "percentage": 81.3, "elapsed_time": "2 days, 8:15:42", "remaining_time": "12:56:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14270, "total_steps": 17540, "loss": 0.665, "learning_rate": 2.043806179646399e-06, "epoch": 8.133950837192732, "percentage": 81.36, "elapsed_time": "2 days, 8:18:04", "remaining_time": "12:54:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14280, "total_steps": 17540, "loss": 0.6639, "learning_rate": 2.03176590054739e-06, "epoch": 8.139650872817954, "percentage": 81.41, "elapsed_time": "2 days, 8:20:24", "remaining_time": "12:51:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14290, "total_steps": 17540, "loss": 0.6618, "learning_rate": 2.019757180031017e-06, "epoch": 8.145350908443177, "percentage": 81.47, "elapsed_time": "2 days, 8:22:45", "remaining_time": "12:49:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14300, "total_steps": 17540, "loss": 0.6589, "learning_rate": 2.0077800656584102e-06, "epoch": 8.1510509440684, "percentage": 81.53, "elapsed_time": "2 days, 8:25:09", "remaining_time": "12:46:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14310, "total_steps": 17540, "loss": 0.6497, "learning_rate": 1.9958346048655188e-06, "epoch": 8.156750979693623, "percentage": 81.58, "elapsed_time": "2 days, 8:27:25", "remaining_time": "12:44:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14320, "total_steps": 17540, "loss": 0.6612, "learning_rate": 1.9839208449629265e-06, "epoch": 8.162451015318846, "percentage": 81.64, "elapsed_time": "2 days, 8:29:45", "remaining_time": "12:42:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14330, "total_steps": 17540, "loss": 0.6544, "learning_rate": 1.9720388331356643e-06, "epoch": 8.168151050944068, "percentage": 81.7, "elapsed_time": "2 days, 8:32:07", "remaining_time": "12:39:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14340, "total_steps": 17540, "loss": 0.6577, "learning_rate": 1.960188616443025e-06, "epoch": 8.173851086569291, "percentage": 81.76, "elapsed_time": "2 days, 8:34:28", "remaining_time": "12:37:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14350, "total_steps": 17540, "loss": 0.64, "learning_rate": 1.9483702418183725e-06, "epoch": 8.179551122194514, "percentage": 81.81, "elapsed_time": "2 days, 8:36:47", "remaining_time": "12:35:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14360, "total_steps": 17540, "loss": 0.6573, "learning_rate": 1.9365837560689626e-06, "epoch": 8.185251157819737, "percentage": 81.87, "elapsed_time": "2 days, 8:39:13", "remaining_time": "12:32:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14370, "total_steps": 17540, "loss": 0.6627, "learning_rate": 1.924829205875746e-06, "epoch": 8.19095119344496, "percentage": 81.93, "elapsed_time": "2 days, 8:41:35", "remaining_time": "12:30:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14380, "total_steps": 17540, "loss": 0.661, "learning_rate": 1.9131066377932017e-06, "epoch": 8.196651229070183, "percentage": 81.98, "elapsed_time": "2 days, 8:43:52", "remaining_time": "12:27:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14390, "total_steps": 17540, "loss": 0.6467, "learning_rate": 1.901416098249136e-06, "epoch": 8.202351264695404, "percentage": 82.04, "elapsed_time": "2 days, 8:46:12", "remaining_time": "12:25:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14400, "total_steps": 17540, "loss": 0.6597, "learning_rate": 1.8897576335445023e-06, "epoch": 8.208051300320626, "percentage": 82.1, "elapsed_time": "2 days, 8:48:30", "remaining_time": "12:23:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14410, "total_steps": 17540, "loss": 0.6534, "learning_rate": 1.8781312898532256e-06, "epoch": 8.21375133594585, "percentage": 82.16, "elapsed_time": "2 days, 8:50:55", "remaining_time": "12:20:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14420, "total_steps": 17540, "loss": 0.6431, "learning_rate": 1.8665371132220068e-06, "epoch": 8.219451371571072, "percentage": 82.21, "elapsed_time": "2 days, 8:53:19", "remaining_time": "12:18:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14430, "total_steps": 17540, "loss": 0.6552, "learning_rate": 1.8549751495701584e-06, "epoch": 8.225151407196295, "percentage": 82.27, "elapsed_time": "2 days, 8:55:44", "remaining_time": "12:16:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14440, "total_steps": 17540, "loss": 0.6562, "learning_rate": 1.8434454446894023e-06, "epoch": 8.230851442821518, "percentage": 82.33, "elapsed_time": "2 days, 8:58:05", "remaining_time": "12:13:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14450, "total_steps": 17540, "loss": 0.6656, "learning_rate": 1.8319480442437043e-06, "epoch": 8.23655147844674, "percentage": 82.38, "elapsed_time": "2 days, 9:00:29", "remaining_time": "12:11:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14460, "total_steps": 17540, "loss": 0.647, "learning_rate": 1.8204829937690748e-06, "epoch": 8.242251514071963, "percentage": 82.44, "elapsed_time": "2 days, 9:02:53", "remaining_time": "12:09:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14470, "total_steps": 17540, "loss": 0.6562, "learning_rate": 1.8090503386734181e-06, "epoch": 8.247951549697186, "percentage": 82.5, "elapsed_time": "2 days, 9:05:16", "remaining_time": "12:06:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14480, "total_steps": 17540, "loss": 0.6632, "learning_rate": 1.7976501242363242e-06, "epoch": 8.253651585322409, "percentage": 82.55, "elapsed_time": "2 days, 9:07:43", "remaining_time": "12:04:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14490, "total_steps": 17540, "loss": 0.6603, "learning_rate": 1.7862823956089014e-06, "epoch": 8.259351620947632, "percentage": 82.61, "elapsed_time": "2 days, 9:09:59", "remaining_time": "12:01:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14500, "total_steps": 17540, "loss": 0.653, "learning_rate": 1.774947197813598e-06, "epoch": 8.265051656572854, "percentage": 82.67, "elapsed_time": "2 days, 9:12:28", "remaining_time": "11:59:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14510, "total_steps": 17540, "loss": 0.6568, "learning_rate": 1.763644575744019e-06, "epoch": 8.270751692198075, "percentage": 82.73, "elapsed_time": "2 days, 9:14:54", "remaining_time": "11:57:16", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14520, "total_steps": 17540, "loss": 0.6526, "learning_rate": 1.7523745741647602e-06, "epoch": 8.276451727823298, "percentage": 82.78, "elapsed_time": "2 days, 9:17:14", "remaining_time": "11:54:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14530, "total_steps": 17540, "loss": 0.6552, "learning_rate": 1.7411372377112146e-06, "epoch": 8.282151763448521, "percentage": 82.84, "elapsed_time": "2 days, 9:19:32", "remaining_time": "11:52:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14540, "total_steps": 17540, "loss": 0.6571, "learning_rate": 1.7299326108894033e-06, "epoch": 8.287851799073744, "percentage": 82.9, "elapsed_time": "2 days, 9:21:54", "remaining_time": "11:50:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14550, "total_steps": 17540, "loss": 0.6634, "learning_rate": 1.7187607380757998e-06, "epoch": 8.293551834698967, "percentage": 82.95, "elapsed_time": "2 days, 9:24:13", "remaining_time": "11:47:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14560, "total_steps": 17540, "loss": 0.6518, "learning_rate": 1.7076216635171594e-06, "epoch": 8.29925187032419, "percentage": 83.01, "elapsed_time": "2 days, 9:26:37", "remaining_time": "11:45:25", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14570, "total_steps": 17540, "loss": 0.6652, "learning_rate": 1.6965154313303367e-06, "epoch": 8.304951905949412, "percentage": 83.07, "elapsed_time": "2 days, 9:29:01", "remaining_time": "11:43:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14580, "total_steps": 17540, "loss": 0.6661, "learning_rate": 1.6854420855021026e-06, "epoch": 8.310651941574635, "percentage": 83.12, "elapsed_time": "2 days, 9:31:27", "remaining_time": "11:40:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14590, "total_steps": 17540, "loss": 0.6517, "learning_rate": 1.6744016698889897e-06, "epoch": 8.316351977199858, "percentage": 83.18, "elapsed_time": "2 days, 9:33:50", "remaining_time": "11:38:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14600, "total_steps": 17540, "loss": 0.6551, "learning_rate": 1.6633942282171056e-06, "epoch": 8.32205201282508, "percentage": 83.24, "elapsed_time": "2 days, 9:36:13", "remaining_time": "11:35:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14610, "total_steps": 17540, "loss": 0.6543, "learning_rate": 1.6524198040819683e-06, "epoch": 8.327752048450304, "percentage": 83.3, "elapsed_time": "2 days, 9:38:38", "remaining_time": "11:33:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14620, "total_steps": 17540, "loss": 0.6569, "learning_rate": 1.6414784409483197e-06, "epoch": 8.333452084075525, "percentage": 83.35, "elapsed_time": "2 days, 9:40:57", "remaining_time": "11:31:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14630, "total_steps": 17540, "loss": 0.6535, "learning_rate": 1.6305701821499686e-06, "epoch": 8.339152119700747, "percentage": 83.41, "elapsed_time": "2 days, 9:43:17", "remaining_time": "11:28:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14640, "total_steps": 17540, "loss": 0.6643, "learning_rate": 1.6196950708896053e-06, "epoch": 8.34485215532597, "percentage": 83.47, "elapsed_time": "2 days, 9:45:40", "remaining_time": "11:26:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14650, "total_steps": 17540, "loss": 0.6509, "learning_rate": 1.6088531502386484e-06, "epoch": 8.350552190951193, "percentage": 83.52, "elapsed_time": "2 days, 9:47:58", "remaining_time": "11:24:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14660, "total_steps": 17540, "loss": 0.6601, "learning_rate": 1.598044463137054e-06, "epoch": 8.356252226576416, "percentage": 83.58, "elapsed_time": "2 days, 9:50:15", "remaining_time": "11:21:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14670, "total_steps": 17540, "loss": 0.657, "learning_rate": 1.58726905239316e-06, "epoch": 8.361952262201639, "percentage": 83.64, "elapsed_time": "2 days, 9:52:40", "remaining_time": "11:19:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14680, "total_steps": 17540, "loss": 0.6679, "learning_rate": 1.5765269606835054e-06, "epoch": 8.367652297826861, "percentage": 83.69, "elapsed_time": "2 days, 9:55:05", "remaining_time": "11:17:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14690, "total_steps": 17540, "loss": 0.6565, "learning_rate": 1.5658182305526815e-06, "epoch": 8.373352333452084, "percentage": 83.75, "elapsed_time": "2 days, 9:57:24", "remaining_time": "11:14:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14700, "total_steps": 17540, "loss": 0.6595, "learning_rate": 1.5551429044131305e-06, "epoch": 8.379052369077307, "percentage": 83.81, "elapsed_time": "2 days, 9:59:44", "remaining_time": "11:12:16", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14710, "total_steps": 17540, "loss": 0.6591, "learning_rate": 1.544501024545011e-06, "epoch": 8.38475240470253, "percentage": 83.87, "elapsed_time": "2 days, 10:02:05", "remaining_time": "11:09:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14720, "total_steps": 17540, "loss": 0.6619, "learning_rate": 1.5338926330960102e-06, "epoch": 8.390452440327753, "percentage": 83.92, "elapsed_time": "2 days, 10:04:34", "remaining_time": "11:07:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14730, "total_steps": 17540, "loss": 0.6543, "learning_rate": 1.5233177720811798e-06, "epoch": 8.396152475952976, "percentage": 83.98, "elapsed_time": "2 days, 10:06:56", "remaining_time": "11:05:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14740, "total_steps": 17540, "loss": 0.6609, "learning_rate": 1.512776483382783e-06, "epoch": 8.401852511578197, "percentage": 84.04, "elapsed_time": "2 days, 10:09:13", "remaining_time": "11:02:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14750, "total_steps": 17540, "loss": 0.6643, "learning_rate": 1.5022688087501092e-06, "epoch": 8.40755254720342, "percentage": 84.09, "elapsed_time": "2 days, 10:11:32", "remaining_time": "11:00:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14760, "total_steps": 17540, "loss": 0.6641, "learning_rate": 1.491794789799319e-06, "epoch": 8.413252582828642, "percentage": 84.15, "elapsed_time": "2 days, 10:13:58", "remaining_time": "10:58:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14770, "total_steps": 17540, "loss": 0.6536, "learning_rate": 1.4813544680132763e-06, "epoch": 8.418952618453865, "percentage": 84.21, "elapsed_time": "2 days, 10:16:22", "remaining_time": "10:55:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14780, "total_steps": 17540, "loss": 0.6467, "learning_rate": 1.4709478847413948e-06, "epoch": 8.424652654079088, "percentage": 84.26, "elapsed_time": "2 days, 10:18:49", "remaining_time": "10:53:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14790, "total_steps": 17540, "loss": 0.662, "learning_rate": 1.4605750811994557e-06, "epoch": 8.43035268970431, "percentage": 84.32, "elapsed_time": "2 days, 10:21:09", "remaining_time": "10:50:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14800, "total_steps": 17540, "loss": 0.6532, "learning_rate": 1.4502360984694563e-06, "epoch": 8.436052725329533, "percentage": 84.38, "elapsed_time": "2 days, 10:23:31", "remaining_time": "10:48:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14810, "total_steps": 17540, "loss": 0.6584, "learning_rate": 1.4399309774994475e-06, "epoch": 8.441752760954756, "percentage": 84.44, "elapsed_time": "2 days, 10:25:52", "remaining_time": "10:46:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14820, "total_steps": 17540, "loss": 0.6614, "learning_rate": 1.4296597591033656e-06, "epoch": 8.447452796579979, "percentage": 84.49, "elapsed_time": "2 days, 10:28:18", "remaining_time": "10:43:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14830, "total_steps": 17540, "loss": 0.6451, "learning_rate": 1.4194224839608761e-06, "epoch": 8.453152832205202, "percentage": 84.55, "elapsed_time": "2 days, 10:30:43", "remaining_time": "10:41:32", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14840, "total_steps": 17540, "loss": 0.6543, "learning_rate": 1.4092191926172106e-06, "epoch": 8.458852867830425, "percentage": 84.61, "elapsed_time": "2 days, 10:33:09", "remaining_time": "10:39:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14850, "total_steps": 17540, "loss": 0.6595, "learning_rate": 1.3990499254830047e-06, "epoch": 8.464552903455647, "percentage": 84.66, "elapsed_time": "2 days, 10:35:32", "remaining_time": "10:36:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14860, "total_steps": 17540, "loss": 0.664, "learning_rate": 1.3889147228341394e-06, "epoch": 8.470252939080869, "percentage": 84.72, "elapsed_time": "2 days, 10:37:53", "remaining_time": "10:34:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14870, "total_steps": 17540, "loss": 0.6629, "learning_rate": 1.3788136248115869e-06, "epoch": 8.475952974706091, "percentage": 84.78, "elapsed_time": "2 days, 10:40:11", "remaining_time": "10:32:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14880, "total_steps": 17540, "loss": 0.6577, "learning_rate": 1.3687466714212393e-06, "epoch": 8.481653010331314, "percentage": 84.83, "elapsed_time": "2 days, 10:42:38", "remaining_time": "10:29:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14890, "total_steps": 17540, "loss": 0.658, "learning_rate": 1.3587139025337615e-06, "epoch": 8.487353045956537, "percentage": 84.89, "elapsed_time": "2 days, 10:45:04", "remaining_time": "10:27:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14900, "total_steps": 17540, "loss": 0.6579, "learning_rate": 1.348715357884427e-06, "epoch": 8.49305308158176, "percentage": 84.95, "elapsed_time": "2 days, 10:47:23", "remaining_time": "10:24:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14910, "total_steps": 17540, "loss": 0.665, "learning_rate": 1.3387510770729595e-06, "epoch": 8.498753117206983, "percentage": 85.01, "elapsed_time": "2 days, 10:49:44", "remaining_time": "10:22:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14920, "total_steps": 17540, "loss": 0.6547, "learning_rate": 1.3288210995633888e-06, "epoch": 8.504453152832205, "percentage": 85.06, "elapsed_time": "2 days, 10:52:08", "remaining_time": "10:20:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14930, "total_steps": 17540, "loss": 0.6652, "learning_rate": 1.3189254646838766e-06, "epoch": 8.510153188457428, "percentage": 85.12, "elapsed_time": "2 days, 10:54:30", "remaining_time": "10:17:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14940, "total_steps": 17540, "loss": 0.6568, "learning_rate": 1.3090642116265695e-06, "epoch": 8.515853224082651, "percentage": 85.18, "elapsed_time": "2 days, 10:56:56", "remaining_time": "10:15:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14950, "total_steps": 17540, "loss": 0.6551, "learning_rate": 1.2992373794474466e-06, "epoch": 8.521553259707874, "percentage": 85.23, "elapsed_time": "2 days, 10:59:19", "remaining_time": "10:13:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14960, "total_steps": 17540, "loss": 0.6494, "learning_rate": 1.289445007066158e-06, "epoch": 8.527253295333097, "percentage": 85.29, "elapsed_time": "2 days, 11:01:42", "remaining_time": "10:10:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14970, "total_steps": 17540, "loss": 0.6558, "learning_rate": 1.2796871332658756e-06, "epoch": 8.532953330958318, "percentage": 85.35, "elapsed_time": "2 days, 11:04:01", "remaining_time": "10:08:25", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14980, "total_steps": 17540, "loss": 0.6602, "learning_rate": 1.26996379669314e-06, "epoch": 8.53865336658354, "percentage": 85.4, "elapsed_time": "2 days, 11:06:23", "remaining_time": "10:06:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 14990, "total_steps": 17540, "loss": 0.6609, "learning_rate": 1.260275035857701e-06, "epoch": 8.544353402208763, "percentage": 85.46, "elapsed_time": "2 days, 11:08:49", "remaining_time": "10:03:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15000, "total_steps": 17540, "loss": 0.6567, "learning_rate": 1.2506208891323711e-06, "epoch": 8.550053437833986, "percentage": 85.52, "elapsed_time": "2 days, 11:11:11", "remaining_time": "10:01:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15010, "total_steps": 17540, "loss": 0.6589, "learning_rate": 1.2410013947528766e-06, "epoch": 8.555753473459209, "percentage": 85.58, "elapsed_time": "2 days, 11:13:43", "remaining_time": "9:58:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15020, "total_steps": 17540, "loss": 0.6559, "learning_rate": 1.2314165908176956e-06, "epoch": 8.561453509084432, "percentage": 85.63, "elapsed_time": "2 days, 11:16:09", "remaining_time": "9:56:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15030, "total_steps": 17540, "loss": 0.6575, "learning_rate": 1.221866515287915e-06, "epoch": 8.567153544709655, "percentage": 85.69, "elapsed_time": "2 days, 11:18:35", "remaining_time": "9:54:16", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15040, "total_steps": 17540, "loss": 0.6535, "learning_rate": 1.2123512059870756e-06, "epoch": 8.572853580334877, "percentage": 85.75, "elapsed_time": "2 days, 11:21:01", "remaining_time": "9:51:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15050, "total_steps": 17540, "loss": 0.6605, "learning_rate": 1.202870700601032e-06, "epoch": 8.5785536159601, "percentage": 85.8, "elapsed_time": "2 days, 11:23:25", "remaining_time": "9:49:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15060, "total_steps": 17540, "loss": 0.6649, "learning_rate": 1.1934250366777899e-06, "epoch": 8.584253651585323, "percentage": 85.86, "elapsed_time": "2 days, 11:25:44", "remaining_time": "9:47:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15070, "total_steps": 17540, "loss": 0.6587, "learning_rate": 1.1840142516273644e-06, "epoch": 8.589953687210546, "percentage": 85.92, "elapsed_time": "2 days, 11:28:06", "remaining_time": "9:44:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15080, "total_steps": 17540, "loss": 0.6598, "learning_rate": 1.1746383827216334e-06, "epoch": 8.595653722835767, "percentage": 85.97, "elapsed_time": "2 days, 11:30:27", "remaining_time": "9:42:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15090, "total_steps": 17540, "loss": 0.6604, "learning_rate": 1.165297467094184e-06, "epoch": 8.60135375846099, "percentage": 86.03, "elapsed_time": "2 days, 11:32:48", "remaining_time": "9:40:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15100, "total_steps": 17540, "loss": 0.6616, "learning_rate": 1.1559915417401746e-06, "epoch": 8.607053794086212, "percentage": 86.09, "elapsed_time": "2 days, 11:35:07", "remaining_time": "9:37:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15110, "total_steps": 17540, "loss": 0.6556, "learning_rate": 1.146720643516177e-06, "epoch": 8.612753829711435, "percentage": 86.15, "elapsed_time": "2 days, 11:37:29", "remaining_time": "9:35:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15120, "total_steps": 17540, "loss": 0.656, "learning_rate": 1.1374848091400403e-06, "epoch": 8.618453865336658, "percentage": 86.2, "elapsed_time": "2 days, 11:39:52", "remaining_time": "9:32:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15130, "total_steps": 17540, "loss": 0.6586, "learning_rate": 1.1282840751907387e-06, "epoch": 8.62415390096188, "percentage": 86.26, "elapsed_time": "2 days, 11:42:21", "remaining_time": "9:30:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15140, "total_steps": 17540, "loss": 0.6555, "learning_rate": 1.1191184781082342e-06, "epoch": 8.629853936587104, "percentage": 86.32, "elapsed_time": "2 days, 11:44:47", "remaining_time": "9:28:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15150, "total_steps": 17540, "loss": 0.6593, "learning_rate": 1.1099880541933228e-06, "epoch": 8.635553972212326, "percentage": 86.37, "elapsed_time": "2 days, 11:47:11", "remaining_time": "9:25:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15160, "total_steps": 17540, "loss": 0.6502, "learning_rate": 1.100892839607497e-06, "epoch": 8.64125400783755, "percentage": 86.43, "elapsed_time": "2 days, 11:49:33", "remaining_time": "9:23:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15170, "total_steps": 17540, "loss": 0.6616, "learning_rate": 1.0918328703727998e-06, "epoch": 8.646954043462772, "percentage": 86.49, "elapsed_time": "2 days, 11:51:57", "remaining_time": "9:21:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15180, "total_steps": 17540, "loss": 0.6489, "learning_rate": 1.0828081823716862e-06, "epoch": 8.652654079087995, "percentage": 86.55, "elapsed_time": "2 days, 11:54:17", "remaining_time": "9:18:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15190, "total_steps": 17540, "loss": 0.6563, "learning_rate": 1.0738188113468762e-06, "epoch": 8.658354114713218, "percentage": 86.6, "elapsed_time": "2 days, 11:56:47", "remaining_time": "9:16:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15200, "total_steps": 17540, "loss": 0.6626, "learning_rate": 1.0648647929012157e-06, "epoch": 8.66405415033844, "percentage": 86.66, "elapsed_time": "2 days, 11:59:03", "remaining_time": "9:14:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15210, "total_steps": 17540, "loss": 0.6599, "learning_rate": 1.0559461624975343e-06, "epoch": 8.669754185963662, "percentage": 86.72, "elapsed_time": "2 days, 12:01:26", "remaining_time": "9:11:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15220, "total_steps": 17540, "loss": 0.656, "learning_rate": 1.0470629554585043e-06, "epoch": 8.675454221588884, "percentage": 86.77, "elapsed_time": "2 days, 12:03:48", "remaining_time": "9:09:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15230, "total_steps": 17540, "loss": 0.6534, "learning_rate": 1.0382152069665063e-06, "epoch": 8.681154257214107, "percentage": 86.83, "elapsed_time": "2 days, 12:06:07", "remaining_time": "9:06:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15240, "total_steps": 17540, "loss": 0.6569, "learning_rate": 1.0294029520634806e-06, "epoch": 8.68685429283933, "percentage": 86.89, "elapsed_time": "2 days, 12:08:30", "remaining_time": "9:04:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15250, "total_steps": 17540, "loss": 0.6516, "learning_rate": 1.020626225650797e-06, "epoch": 8.692554328464553, "percentage": 86.94, "elapsed_time": "2 days, 12:10:54", "remaining_time": "9:02:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15260, "total_steps": 17540, "loss": 0.6611, "learning_rate": 1.0118850624891097e-06, "epoch": 8.698254364089776, "percentage": 87.0, "elapsed_time": "2 days, 12:13:15", "remaining_time": "8:59:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15270, "total_steps": 17540, "loss": 0.657, "learning_rate": 1.0031794971982278e-06, "epoch": 8.703954399714998, "percentage": 87.06, "elapsed_time": "2 days, 12:15:32", "remaining_time": "8:57:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15280, "total_steps": 17540, "loss": 0.6549, "learning_rate": 9.945095642569692e-07, "epoch": 8.709654435340221, "percentage": 87.12, "elapsed_time": "2 days, 12:17:48", "remaining_time": "8:55:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15290, "total_steps": 17540, "loss": 0.658, "learning_rate": 9.858752980030295e-07, "epoch": 8.715354470965444, "percentage": 87.17, "elapsed_time": "2 days, 12:20:07", "remaining_time": "8:52:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15300, "total_steps": 17540, "loss": 0.6627, "learning_rate": 9.772767326328435e-07, "epoch": 8.721054506590667, "percentage": 87.23, "elapsed_time": "2 days, 12:22:30", "remaining_time": "8:50:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15310, "total_steps": 17540, "loss": 0.6614, "learning_rate": 9.687139022014502e-07, "epoch": 8.72675454221589, "percentage": 87.29, "elapsed_time": "2 days, 12:24:55", "remaining_time": "8:47:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15320, "total_steps": 17540, "loss": 0.6589, "learning_rate": 9.601868406223647e-07, "epoch": 8.73245457784111, "percentage": 87.34, "elapsed_time": "2 days, 12:27:13", "remaining_time": "8:45:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15330, "total_steps": 17540, "loss": 0.6512, "learning_rate": 9.516955816674311e-07, "epoch": 8.738154613466333, "percentage": 87.4, "elapsed_time": "2 days, 12:29:38", "remaining_time": "8:43:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15340, "total_steps": 17540, "loss": 0.6547, "learning_rate": 9.432401589666984e-07, "epoch": 8.743854649091556, "percentage": 87.46, "elapsed_time": "2 days, 12:32:03", "remaining_time": "8:40:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15350, "total_steps": 17540, "loss": 0.6517, "learning_rate": 9.348206060082799e-07, "epoch": 8.749554684716779, "percentage": 87.51, "elapsed_time": "2 days, 12:34:24", "remaining_time": "8:38:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15360, "total_steps": 17540, "loss": 0.6548, "learning_rate": 9.264369561382336e-07, "epoch": 8.755254720342002, "percentage": 87.57, "elapsed_time": "2 days, 12:36:49", "remaining_time": "8:36:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15370, "total_steps": 17540, "loss": 0.6598, "learning_rate": 9.180892425604149e-07, "epoch": 8.760954755967225, "percentage": 87.63, "elapsed_time": "2 days, 12:39:14", "remaining_time": "8:33:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15380, "total_steps": 17540, "loss": 0.6623, "learning_rate": 9.097774983363527e-07, "epoch": 8.766654791592448, "percentage": 87.69, "elapsed_time": "2 days, 12:41:35", "remaining_time": "8:31:25", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15390, "total_steps": 17540, "loss": 0.6563, "learning_rate": 9.01501756385117e-07, "epoch": 8.77235482721767, "percentage": 87.74, "elapsed_time": "2 days, 12:44:01", "remaining_time": "8:29:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15400, "total_steps": 17540, "loss": 0.6652, "learning_rate": 8.932620494831945e-07, "epoch": 8.778054862842893, "percentage": 87.8, "elapsed_time": "2 days, 12:46:24", "remaining_time": "8:26:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15410, "total_steps": 17540, "loss": 0.6536, "learning_rate": 8.850584102643478e-07, "epoch": 8.783754898468116, "percentage": 87.86, "elapsed_time": "2 days, 12:48:46", "remaining_time": "8:24:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15420, "total_steps": 17540, "loss": 0.6548, "learning_rate": 8.768908712194913e-07, "epoch": 8.789454934093339, "percentage": 87.91, "elapsed_time": "2 days, 12:51:11", "remaining_time": "8:21:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15430, "total_steps": 17540, "loss": 0.6535, "learning_rate": 8.687594646965669e-07, "epoch": 8.79515496971856, "percentage": 87.97, "elapsed_time": "2 days, 12:53:27", "remaining_time": "8:19:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15440, "total_steps": 17540, "loss": 0.6576, "learning_rate": 8.606642229004059e-07, "epoch": 8.800855005343783, "percentage": 88.03, "elapsed_time": "2 days, 12:55:51", "remaining_time": "8:17:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15450, "total_steps": 17540, "loss": 0.6542, "learning_rate": 8.526051778926181e-07, "epoch": 8.806555040969005, "percentage": 88.08, "elapsed_time": "2 days, 12:58:14", "remaining_time": "8:14:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15460, "total_steps": 17540, "loss": 0.6521, "learning_rate": 8.445823615914405e-07, "epoch": 8.812255076594228, "percentage": 88.14, "elapsed_time": "2 days, 13:00:40", "remaining_time": "8:12:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15470, "total_steps": 17540, "loss": 0.6491, "learning_rate": 8.365958057716339e-07, "epoch": 8.817955112219451, "percentage": 88.2, "elapsed_time": "2 days, 13:03:04", "remaining_time": "8:10:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15480, "total_steps": 17540, "loss": 0.6709, "learning_rate": 8.286455420643424e-07, "epoch": 8.823655147844674, "percentage": 88.26, "elapsed_time": "2 days, 13:05:28", "remaining_time": "8:07:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15490, "total_steps": 17540, "loss": 0.6671, "learning_rate": 8.207316019569811e-07, "epoch": 8.829355183469897, "percentage": 88.31, "elapsed_time": "2 days, 13:07:50", "remaining_time": "8:05:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15500, "total_steps": 17540, "loss": 0.6555, "learning_rate": 8.128540167930942e-07, "epoch": 8.83505521909512, "percentage": 88.37, "elapsed_time": "2 days, 13:10:13", "remaining_time": "8:03:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15510, "total_steps": 17540, "loss": 0.6479, "learning_rate": 8.050128177722482e-07, "epoch": 8.840755254720342, "percentage": 88.43, "elapsed_time": "2 days, 13:12:36", "remaining_time": "8:00:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15520, "total_steps": 17540, "loss": 0.6602, "learning_rate": 7.972080359498946e-07, "epoch": 8.846455290345565, "percentage": 88.48, "elapsed_time": "2 days, 13:15:00", "remaining_time": "7:58:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15530, "total_steps": 17540, "loss": 0.6522, "learning_rate": 7.894397022372535e-07, "epoch": 8.852155325970788, "percentage": 88.54, "elapsed_time": "2 days, 13:17:19", "remaining_time": "7:55:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15540, "total_steps": 17540, "loss": 0.6524, "learning_rate": 7.817078474011974e-07, "epoch": 8.85785536159601, "percentage": 88.6, "elapsed_time": "2 days, 13:19:43", "remaining_time": "7:53:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15550, "total_steps": 17540, "loss": 0.6525, "learning_rate": 7.740125020641143e-07, "epoch": 8.863555397221234, "percentage": 88.65, "elapsed_time": "2 days, 13:22:07", "remaining_time": "7:51:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15560, "total_steps": 17540, "loss": 0.6563, "learning_rate": 7.663536967037977e-07, "epoch": 8.869255432846455, "percentage": 88.71, "elapsed_time": "2 days, 13:24:26", "remaining_time": "7:48:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15570, "total_steps": 17540, "loss": 0.6604, "learning_rate": 7.587314616533226e-07, "epoch": 8.874955468471677, "percentage": 88.77, "elapsed_time": "2 days, 13:26:50", "remaining_time": "7:46:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15580, "total_steps": 17540, "loss": 0.6509, "learning_rate": 7.511458271009254e-07, "epoch": 8.8806555040969, "percentage": 88.83, "elapsed_time": "2 days, 13:29:05", "remaining_time": "7:44:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15590, "total_steps": 17540, "loss": 0.65, "learning_rate": 7.435968230898838e-07, "epoch": 8.886355539722123, "percentage": 88.88, "elapsed_time": "2 days, 13:31:35", "remaining_time": "7:41:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15600, "total_steps": 17540, "loss": 0.6594, "learning_rate": 7.360844795184007e-07, "epoch": 8.892055575347346, "percentage": 88.94, "elapsed_time": "2 days, 13:33:59", "remaining_time": "7:39:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15610, "total_steps": 17540, "loss": 0.6592, "learning_rate": 7.286088261394797e-07, "epoch": 8.897755610972569, "percentage": 89.0, "elapsed_time": "2 days, 13:36:22", "remaining_time": "7:37:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15620, "total_steps": 17540, "loss": 0.6699, "learning_rate": 7.211698925608134e-07, "epoch": 8.903455646597791, "percentage": 89.05, "elapsed_time": "2 days, 13:38:51", "remaining_time": "7:34:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15630, "total_steps": 17540, "loss": 0.6596, "learning_rate": 7.137677082446659e-07, "epoch": 8.909155682223014, "percentage": 89.11, "elapsed_time": "2 days, 13:41:16", "remaining_time": "7:32:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15640, "total_steps": 17540, "loss": 0.6435, "learning_rate": 7.064023025077516e-07, "epoch": 8.914855717848237, "percentage": 89.17, "elapsed_time": "2 days, 13:43:36", "remaining_time": "7:29:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15650, "total_steps": 17540, "loss": 0.6607, "learning_rate": 6.990737045211204e-07, "epoch": 8.92055575347346, "percentage": 89.22, "elapsed_time": "2 days, 13:45:55", "remaining_time": "7:27:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15660, "total_steps": 17540, "loss": 0.6544, "learning_rate": 6.917819433100436e-07, "epoch": 8.926255789098683, "percentage": 89.28, "elapsed_time": "2 days, 13:48:18", "remaining_time": "7:25:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15670, "total_steps": 17540, "loss": 0.6585, "learning_rate": 6.845270477539034e-07, "epoch": 8.931955824723904, "percentage": 89.34, "elapsed_time": "2 days, 13:50:44", "remaining_time": "7:22:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15680, "total_steps": 17540, "loss": 0.654, "learning_rate": 6.773090465860677e-07, "epoch": 8.937655860349127, "percentage": 89.4, "elapsed_time": "2 days, 13:53:10", "remaining_time": "7:20:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15690, "total_steps": 17540, "loss": 0.6533, "learning_rate": 6.701279683937844e-07, "epoch": 8.94335589597435, "percentage": 89.45, "elapsed_time": "2 days, 13:55:25", "remaining_time": "7:18:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15700, "total_steps": 17540, "loss": 0.6567, "learning_rate": 6.629838416180679e-07, "epoch": 8.949055931599572, "percentage": 89.51, "elapsed_time": "2 days, 13:57:46", "remaining_time": "7:15:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15710, "total_steps": 17540, "loss": 0.6597, "learning_rate": 6.558766945535822e-07, "epoch": 8.954755967224795, "percentage": 89.57, "elapsed_time": "2 days, 14:00:06", "remaining_time": "7:13:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15720, "total_steps": 17540, "loss": 0.6563, "learning_rate": 6.488065553485334e-07, "epoch": 8.960456002850018, "percentage": 89.62, "elapsed_time": "2 days, 14:02:28", "remaining_time": "7:10:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15730, "total_steps": 17540, "loss": 0.6586, "learning_rate": 6.417734520045537e-07, "epoch": 8.96615603847524, "percentage": 89.68, "elapsed_time": "2 days, 14:04:48", "remaining_time": "7:08:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15740, "total_steps": 17540, "loss": 0.6543, "learning_rate": 6.34777412376596e-07, "epoch": 8.971856074100463, "percentage": 89.74, "elapsed_time": "2 days, 14:07:10", "remaining_time": "7:06:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15750, "total_steps": 17540, "loss": 0.6444, "learning_rate": 6.278184641728169e-07, "epoch": 8.977556109725686, "percentage": 89.79, "elapsed_time": "2 days, 14:09:37", "remaining_time": "7:03:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15760, "total_steps": 17540, "loss": 0.6622, "learning_rate": 6.208966349544754e-07, "epoch": 8.983256145350909, "percentage": 89.85, "elapsed_time": "2 days, 14:12:02", "remaining_time": "7:01:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15770, "total_steps": 17540, "loss": 0.646, "learning_rate": 6.140119521358146e-07, "epoch": 8.988956180976132, "percentage": 89.91, "elapsed_time": "2 days, 14:14:23", "remaining_time": "6:59:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15780, "total_steps": 17540, "loss": 0.6581, "learning_rate": 6.071644429839585e-07, "epoch": 8.994656216601353, "percentage": 89.97, "elapsed_time": "2 days, 14:16:45", "remaining_time": "6:56:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15790, "total_steps": 17540, "loss": 0.6535, "learning_rate": 6.003541346188036e-07, "epoch": 9.000356252226576, "percentage": 90.02, "elapsed_time": "2 days, 14:19:10", "remaining_time": "6:54:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15800, "total_steps": 17540, "loss": 0.6461, "learning_rate": 5.935810540129128e-07, "epoch": 9.006056287851798, "percentage": 90.08, "elapsed_time": "2 days, 14:21:29", "remaining_time": "6:52:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15810, "total_steps": 17540, "loss": 0.6532, "learning_rate": 5.868452279914039e-07, "epoch": 9.011756323477021, "percentage": 90.14, "elapsed_time": "2 days, 14:23:53", "remaining_time": "6:49:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15820, "total_steps": 17540, "loss": 0.6554, "learning_rate": 5.801466832318458e-07, "epoch": 9.017456359102244, "percentage": 90.19, "elapsed_time": "2 days, 14:26:17", "remaining_time": "6:47:18", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15830, "total_steps": 17540, "loss": 0.649, "learning_rate": 5.734854462641548e-07, "epoch": 9.023156394727467, "percentage": 90.25, "elapsed_time": "2 days, 14:28:37", "remaining_time": "6:44:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15840, "total_steps": 17540, "loss": 0.652, "learning_rate": 5.66861543470486e-07, "epoch": 9.02885643035269, "percentage": 90.31, "elapsed_time": "2 days, 14:30:59", "remaining_time": "6:42:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15850, "total_steps": 17540, "loss": 0.6498, "learning_rate": 5.602750010851332e-07, "epoch": 9.034556465977913, "percentage": 90.36, "elapsed_time": "2 days, 14:33:16", "remaining_time": "6:40:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15860, "total_steps": 17540, "loss": 0.6462, "learning_rate": 5.537258451944206e-07, "epoch": 9.040256501603135, "percentage": 90.42, "elapsed_time": "2 days, 14:35:41", "remaining_time": "6:37:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15870, "total_steps": 17540, "loss": 0.6529, "learning_rate": 5.472141017366029e-07, "epoch": 9.045956537228358, "percentage": 90.48, "elapsed_time": "2 days, 14:38:04", "remaining_time": "6:35:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15880, "total_steps": 17540, "loss": 0.6579, "learning_rate": 5.407397965017569e-07, "epoch": 9.051656572853581, "percentage": 90.54, "elapsed_time": "2 days, 14:40:25", "remaining_time": "6:33:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15890, "total_steps": 17540, "loss": 0.6475, "learning_rate": 5.343029551316892e-07, "epoch": 9.057356608478804, "percentage": 90.59, "elapsed_time": "2 days, 14:42:50", "remaining_time": "6:30:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15900, "total_steps": 17540, "loss": 0.6593, "learning_rate": 5.27903603119827e-07, "epoch": 9.063056644104025, "percentage": 90.65, "elapsed_time": "2 days, 14:45:16", "remaining_time": "6:28:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15910, "total_steps": 17540, "loss": 0.6513, "learning_rate": 5.215417658111166e-07, "epoch": 9.068756679729248, "percentage": 90.71, "elapsed_time": "2 days, 14:47:37", "remaining_time": "6:25:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15920, "total_steps": 17540, "loss": 0.6504, "learning_rate": 5.152174684019285e-07, "epoch": 9.07445671535447, "percentage": 90.76, "elapsed_time": "2 days, 14:49:59", "remaining_time": "6:23:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15930, "total_steps": 17540, "loss": 0.6496, "learning_rate": 5.089307359399498e-07, "epoch": 9.080156750979693, "percentage": 90.82, "elapsed_time": "2 days, 14:52:17", "remaining_time": "6:21:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15940, "total_steps": 17540, "loss": 0.6581, "learning_rate": 5.02681593324098e-07, "epoch": 9.085856786604916, "percentage": 90.88, "elapsed_time": "2 days, 14:54:36", "remaining_time": "6:18:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15950, "total_steps": 17540, "loss": 0.65, "learning_rate": 4.964700653044086e-07, "epoch": 9.091556822230139, "percentage": 90.94, "elapsed_time": "2 days, 14:56:59", "remaining_time": "6:16:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15960, "total_steps": 17540, "loss": 0.651, "learning_rate": 4.902961764819414e-07, "epoch": 9.097256857855362, "percentage": 90.99, "elapsed_time": "2 days, 14:59:23", "remaining_time": "6:14:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15970, "total_steps": 17540, "loss": 0.6549, "learning_rate": 4.84159951308687e-07, "epoch": 9.102956893480584, "percentage": 91.05, "elapsed_time": "2 days, 15:01:45", "remaining_time": "6:11:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15980, "total_steps": 17540, "loss": 0.6602, "learning_rate": 4.780614140874685e-07, "epoch": 9.108656929105807, "percentage": 91.11, "elapsed_time": "2 days, 15:04:06", "remaining_time": "6:09:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 15990, "total_steps": 17540, "loss": 0.654, "learning_rate": 4.720005889718393e-07, "epoch": 9.11435696473103, "percentage": 91.16, "elapsed_time": "2 days, 15:06:25", "remaining_time": "6:07:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16000, "total_steps": 17540, "loss": 0.6563, "learning_rate": 4.6597749996599716e-07, "epoch": 9.120057000356253, "percentage": 91.22, "elapsed_time": "2 days, 15:08:44", "remaining_time": "6:04:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16010, "total_steps": 17540, "loss": 0.6552, "learning_rate": 4.5999217092468127e-07, "epoch": 9.125757035981476, "percentage": 91.28, "elapsed_time": "2 days, 15:11:04", "remaining_time": "6:02:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16020, "total_steps": 17540, "loss": 0.6536, "learning_rate": 4.540446255530806e-07, "epoch": 9.131457071606697, "percentage": 91.33, "elapsed_time": "2 days, 15:13:29", "remaining_time": "5:59:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16030, "total_steps": 17540, "loss": 0.6496, "learning_rate": 4.481348874067426e-07, "epoch": 9.13715710723192, "percentage": 91.39, "elapsed_time": "2 days, 15:15:51", "remaining_time": "5:57:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16040, "total_steps": 17540, "loss": 0.6557, "learning_rate": 4.422629798914757e-07, "epoch": 9.142857142857142, "percentage": 91.45, "elapsed_time": "2 days, 15:18:09", "remaining_time": "5:55:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16050, "total_steps": 17540, "loss": 0.6613, "learning_rate": 4.3642892626325595e-07, "epoch": 9.148557178482365, "percentage": 91.51, "elapsed_time": "2 days, 15:20:28", "remaining_time": "5:52:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16060, "total_steps": 17540, "loss": 0.6552, "learning_rate": 4.3063274962813926e-07, "epoch": 9.154257214107588, "percentage": 91.56, "elapsed_time": "2 days, 15:22:51", "remaining_time": "5:50:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16070, "total_steps": 17540, "loss": 0.6644, "learning_rate": 4.2487447294217056e-07, "epoch": 9.15995724973281, "percentage": 91.62, "elapsed_time": "2 days, 15:25:13", "remaining_time": "5:48:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16080, "total_steps": 17540, "loss": 0.6597, "learning_rate": 4.1915411901128577e-07, "epoch": 9.165657285358034, "percentage": 91.68, "elapsed_time": "2 days, 15:27:40", "remaining_time": "5:45:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16090, "total_steps": 17540, "loss": 0.6537, "learning_rate": 4.1347171049122894e-07, "epoch": 9.171357320983256, "percentage": 91.73, "elapsed_time": "2 days, 15:29:59", "remaining_time": "5:43:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16100, "total_steps": 17540, "loss": 0.6544, "learning_rate": 4.0782726988745634e-07, "epoch": 9.17705735660848, "percentage": 91.79, "elapsed_time": "2 days, 15:32:18", "remaining_time": "5:40:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16110, "total_steps": 17540, "loss": 0.6612, "learning_rate": 4.0222081955505367e-07, "epoch": 9.182757392233702, "percentage": 91.85, "elapsed_time": "2 days, 15:34:41", "remaining_time": "5:38:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16120, "total_steps": 17540, "loss": 0.6628, "learning_rate": 3.966523816986434e-07, "epoch": 9.188457427858925, "percentage": 91.9, "elapsed_time": "2 days, 15:37:07", "remaining_time": "5:36:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16130, "total_steps": 17540, "loss": 0.6578, "learning_rate": 3.911219783722953e-07, "epoch": 9.194157463484148, "percentage": 91.96, "elapsed_time": "2 days, 15:39:26", "remaining_time": "5:33:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16140, "total_steps": 17540, "loss": 0.6494, "learning_rate": 3.85629631479445e-07, "epoch": 9.199857499109369, "percentage": 92.02, "elapsed_time": "2 days, 15:41:51", "remaining_time": "5:31:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16150, "total_steps": 17540, "loss": 0.6538, "learning_rate": 3.801753627728011e-07, "epoch": 9.205557534734591, "percentage": 92.08, "elapsed_time": "2 days, 15:44:06", "remaining_time": "5:29:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16160, "total_steps": 17540, "loss": 0.6484, "learning_rate": 3.7475919385426384e-07, "epoch": 9.211257570359814, "percentage": 92.13, "elapsed_time": "2 days, 15:46:26", "remaining_time": "5:26:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16170, "total_steps": 17540, "loss": 0.655, "learning_rate": 3.6938114617483646e-07, "epoch": 9.216957605985037, "percentage": 92.19, "elapsed_time": "2 days, 15:48:43", "remaining_time": "5:24:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16180, "total_steps": 17540, "loss": 0.6551, "learning_rate": 3.6404124103453954e-07, "epoch": 9.22265764161026, "percentage": 92.25, "elapsed_time": "2 days, 15:51:09", "remaining_time": "5:22:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16190, "total_steps": 17540, "loss": 0.6588, "learning_rate": 3.587394995823301e-07, "epoch": 9.228357677235483, "percentage": 92.3, "elapsed_time": "2 days, 15:53:27", "remaining_time": "5:19:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16200, "total_steps": 17540, "loss": 0.6569, "learning_rate": 3.5347594281601837e-07, "epoch": 9.234057712860706, "percentage": 92.36, "elapsed_time": "2 days, 15:55:46", "remaining_time": "5:17:16", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16210, "total_steps": 17540, "loss": 0.6579, "learning_rate": 3.482505915821766e-07, "epoch": 9.239757748485928, "percentage": 92.42, "elapsed_time": "2 days, 15:58:10", "remaining_time": "5:14:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16220, "total_steps": 17540, "loss": 0.65, "learning_rate": 3.430634665760668e-07, "epoch": 9.245457784111151, "percentage": 92.47, "elapsed_time": "2 days, 16:00:30", "remaining_time": "5:12:32", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16230, "total_steps": 17540, "loss": 0.6534, "learning_rate": 3.379145883415502e-07, "epoch": 9.251157819736374, "percentage": 92.53, "elapsed_time": "2 days, 16:02:48", "remaining_time": "5:10:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16240, "total_steps": 17540, "loss": 0.6572, "learning_rate": 3.328039772710123e-07, "epoch": 9.256857855361597, "percentage": 92.59, "elapsed_time": "2 days, 16:05:08", "remaining_time": "5:07:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16250, "total_steps": 17540, "loss": 0.6572, "learning_rate": 3.277316536052821e-07, "epoch": 9.262557890986818, "percentage": 92.65, "elapsed_time": "2 days, 16:07:27", "remaining_time": "5:05:25", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16260, "total_steps": 17540, "loss": 0.6466, "learning_rate": 3.2269763743354445e-07, "epoch": 9.26825792661204, "percentage": 92.7, "elapsed_time": "2 days, 16:09:51", "remaining_time": "5:03:03", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16270, "total_steps": 17540, "loss": 0.6632, "learning_rate": 3.1770194869326864e-07, "epoch": 9.273957962237263, "percentage": 92.76, "elapsed_time": "2 days, 16:12:10", "remaining_time": "5:00:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16280, "total_steps": 17540, "loss": 0.6521, "learning_rate": 3.1274460717012346e-07, "epoch": 9.279657997862486, "percentage": 92.82, "elapsed_time": "2 days, 16:14:36", "remaining_time": "4:58:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16290, "total_steps": 17540, "loss": 0.6517, "learning_rate": 3.0782563249790567e-07, "epoch": 9.285358033487709, "percentage": 92.87, "elapsed_time": "2 days, 16:16:49", "remaining_time": "4:55:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16300, "total_steps": 17540, "loss": 0.6584, "learning_rate": 3.0294504415845585e-07, "epoch": 9.291058069112932, "percentage": 92.93, "elapsed_time": "2 days, 16:19:07", "remaining_time": "4:53:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16310, "total_steps": 17540, "loss": 0.6456, "learning_rate": 2.98102861481584e-07, "epoch": 9.296758104738155, "percentage": 92.99, "elapsed_time": "2 days, 16:21:30", "remaining_time": "4:51:12", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16320, "total_steps": 17540, "loss": 0.6613, "learning_rate": 2.932991036449917e-07, "epoch": 9.302458140363377, "percentage": 93.04, "elapsed_time": "2 days, 16:23:50", "remaining_time": "4:48:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16330, "total_steps": 17540, "loss": 0.655, "learning_rate": 2.8853378967419686e-07, "epoch": 9.3081581759886, "percentage": 93.1, "elapsed_time": "2 days, 16:26:12", "remaining_time": "4:46:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16340, "total_steps": 17540, "loss": 0.6502, "learning_rate": 2.8380693844246355e-07, "epoch": 9.313858211613823, "percentage": 93.16, "elapsed_time": "2 days, 16:28:35", "remaining_time": "4:44:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16350, "total_steps": 17540, "loss": 0.6409, "learning_rate": 2.7911856867071427e-07, "epoch": 9.319558247239046, "percentage": 93.22, "elapsed_time": "2 days, 16:30:59", "remaining_time": "4:41:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16360, "total_steps": 17540, "loss": 0.6592, "learning_rate": 2.744686989274692e-07, "epoch": 9.325258282864269, "percentage": 93.27, "elapsed_time": "2 days, 16:33:20", "remaining_time": "4:39:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16370, "total_steps": 17540, "loss": 0.6581, "learning_rate": 2.698573476287658e-07, "epoch": 9.33095831848949, "percentage": 93.33, "elapsed_time": "2 days, 16:35:38", "remaining_time": "4:37:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16380, "total_steps": 17540, "loss": 0.6515, "learning_rate": 2.652845330380882e-07, "epoch": 9.336658354114713, "percentage": 93.39, "elapsed_time": "2 days, 16:37:59", "remaining_time": "4:34:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16390, "total_steps": 17540, "loss": 0.639, "learning_rate": 2.6075027326629253e-07, "epoch": 9.342358389739935, "percentage": 93.44, "elapsed_time": "2 days, 16:40:17", "remaining_time": "4:32:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16400, "total_steps": 17540, "loss": 0.6417, "learning_rate": 2.562545862715382e-07, "epoch": 9.348058425365158, "percentage": 93.5, "elapsed_time": "2 days, 16:42:37", "remaining_time": "4:29:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16410, "total_steps": 17540, "loss": 0.6574, "learning_rate": 2.517974898592124e-07, "epoch": 9.353758460990381, "percentage": 93.56, "elapsed_time": "2 days, 16:45:05", "remaining_time": "4:27:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16420, "total_steps": 17540, "loss": 0.6549, "learning_rate": 2.4737900168186667e-07, "epoch": 9.359458496615604, "percentage": 93.61, "elapsed_time": "2 days, 16:47:31", "remaining_time": "4:25:09", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16430, "total_steps": 17540, "loss": 0.6415, "learning_rate": 2.429991392391395e-07, "epoch": 9.365158532240827, "percentage": 93.67, "elapsed_time": "2 days, 16:49:54", "remaining_time": "4:22:47", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16440, "total_steps": 17540, "loss": 0.652, "learning_rate": 2.386579198776917e-07, "epoch": 9.37085856786605, "percentage": 93.73, "elapsed_time": "2 days, 16:52:14", "remaining_time": "4:20:25", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16450, "total_steps": 17540, "loss": 0.6512, "learning_rate": 2.343553607911353e-07, "epoch": 9.376558603491272, "percentage": 93.79, "elapsed_time": "2 days, 16:54:41", "remaining_time": "4:18:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16460, "total_steps": 17540, "loss": 0.6601, "learning_rate": 2.300914790199682e-07, "epoch": 9.382258639116495, "percentage": 93.84, "elapsed_time": "2 days, 16:57:00", "remaining_time": "4:15:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16470, "total_steps": 17540, "loss": 0.6557, "learning_rate": 2.2586629145150195e-07, "epoch": 9.387958674741718, "percentage": 93.9, "elapsed_time": "2 days, 16:59:19", "remaining_time": "4:13:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16480, "total_steps": 17540, "loss": 0.6476, "learning_rate": 2.2167981481980073e-07, "epoch": 9.393658710366939, "percentage": 93.96, "elapsed_time": "2 days, 17:01:45", "remaining_time": "4:10:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16490, "total_steps": 17540, "loss": 0.6503, "learning_rate": 2.1753206570561015e-07, "epoch": 9.399358745992162, "percentage": 94.01, "elapsed_time": "2 days, 17:04:05", "remaining_time": "4:08:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16500, "total_steps": 17540, "loss": 0.6379, "learning_rate": 2.1342306053629414e-07, "epoch": 9.405058781617385, "percentage": 94.07, "elapsed_time": "2 days, 17:06:27", "remaining_time": "4:06:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16510, "total_steps": 17540, "loss": 0.659, "learning_rate": 2.0935281558577048e-07, "epoch": 9.410758817242607, "percentage": 94.13, "elapsed_time": "2 days, 17:08:51", "remaining_time": "4:03:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16520, "total_steps": 17540, "loss": 0.6543, "learning_rate": 2.0532134697444417e-07, "epoch": 9.41645885286783, "percentage": 94.18, "elapsed_time": "2 days, 17:11:10", "remaining_time": "4:01:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16530, "total_steps": 17540, "loss": 0.6632, "learning_rate": 2.0132867066914418e-07, "epoch": 9.422158888493053, "percentage": 94.24, "elapsed_time": "2 days, 17:13:33", "remaining_time": "3:59:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16540, "total_steps": 17540, "loss": 0.657, "learning_rate": 1.9737480248306128e-07, "epoch": 9.427858924118276, "percentage": 94.3, "elapsed_time": "2 days, 17:15:55", "remaining_time": "3:56:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16550, "total_steps": 17540, "loss": 0.6472, "learning_rate": 1.9345975807568473e-07, "epoch": 9.433558959743499, "percentage": 94.36, "elapsed_time": "2 days, 17:18:15", "remaining_time": "3:54:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16560, "total_steps": 17540, "loss": 0.6545, "learning_rate": 1.8958355295274012e-07, "epoch": 9.439258995368721, "percentage": 94.41, "elapsed_time": "2 days, 17:20:33", "remaining_time": "3:52:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16570, "total_steps": 17540, "loss": 0.6336, "learning_rate": 1.857462024661294e-07, "epoch": 9.444959030993944, "percentage": 94.47, "elapsed_time": "2 days, 17:22:56", "remaining_time": "3:49:38", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16580, "total_steps": 17540, "loss": 0.6443, "learning_rate": 1.8194772181386655e-07, "epoch": 9.450659066619167, "percentage": 94.53, "elapsed_time": "2 days, 17:25:16", "remaining_time": "3:47:16", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16590, "total_steps": 17540, "loss": 0.6504, "learning_rate": 1.781881260400209e-07, "epoch": 9.45635910224439, "percentage": 94.58, "elapsed_time": "2 days, 17:27:39", "remaining_time": "3:44:54", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16600, "total_steps": 17540, "loss": 0.6561, "learning_rate": 1.7446743003465606e-07, "epoch": 9.46205913786961, "percentage": 94.64, "elapsed_time": "2 days, 17:30:02", "remaining_time": "3:42:32", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16610, "total_steps": 17540, "loss": 0.6542, "learning_rate": 1.707856485337722e-07, "epoch": 9.467759173494834, "percentage": 94.7, "elapsed_time": "2 days, 17:32:27", "remaining_time": "3:40:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16620, "total_steps": 17540, "loss": 0.6548, "learning_rate": 1.6714279611924512e-07, "epoch": 9.473459209120056, "percentage": 94.75, "elapsed_time": "2 days, 17:34:49", "remaining_time": "3:37:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16630, "total_steps": 17540, "loss": 0.6549, "learning_rate": 1.6353888721877154e-07, "epoch": 9.47915924474528, "percentage": 94.81, "elapsed_time": "2 days, 17:37:12", "remaining_time": "3:35:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16640, "total_steps": 17540, "loss": 0.6508, "learning_rate": 1.5997393610580837e-07, "epoch": 9.484859280370502, "percentage": 94.87, "elapsed_time": "2 days, 17:39:36", "remaining_time": "3:33:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16650, "total_steps": 17540, "loss": 0.6548, "learning_rate": 1.564479568995203e-07, "epoch": 9.490559315995725, "percentage": 94.93, "elapsed_time": "2 days, 17:42:01", "remaining_time": "3:30:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16660, "total_steps": 17540, "loss": 0.6529, "learning_rate": 1.5296096356472223e-07, "epoch": 9.496259351620948, "percentage": 94.98, "elapsed_time": "2 days, 17:44:23", "remaining_time": "3:28:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16670, "total_steps": 17540, "loss": 0.6486, "learning_rate": 1.495129699118214e-07, "epoch": 9.50195938724617, "percentage": 95.04, "elapsed_time": "2 days, 17:46:43", "remaining_time": "3:25:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16680, "total_steps": 17540, "loss": 0.6591, "learning_rate": 1.461039895967653e-07, "epoch": 9.507659422871393, "percentage": 95.1, "elapsed_time": "2 days, 17:49:09", "remaining_time": "3:23:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16690, "total_steps": 17540, "loss": 0.6589, "learning_rate": 1.4273403612099057e-07, "epoch": 9.513359458496616, "percentage": 95.15, "elapsed_time": "2 days, 17:51:31", "remaining_time": "3:21:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16700, "total_steps": 17540, "loss": 0.6573, "learning_rate": 1.3940312283136192e-07, "epoch": 9.519059494121839, "percentage": 95.21, "elapsed_time": "2 days, 17:53:55", "remaining_time": "3:18:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16710, "total_steps": 17540, "loss": 0.6528, "learning_rate": 1.3611126292012444e-07, "epoch": 9.524759529747062, "percentage": 95.27, "elapsed_time": "2 days, 17:56:18", "remaining_time": "3:16:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16720, "total_steps": 17540, "loss": 0.642, "learning_rate": 1.3285846942485247e-07, "epoch": 9.530459565372283, "percentage": 95.32, "elapsed_time": "2 days, 17:58:39", "remaining_time": "3:14:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16730, "total_steps": 17540, "loss": 0.6513, "learning_rate": 1.2964475522839304e-07, "epoch": 9.536159600997506, "percentage": 95.38, "elapsed_time": "2 days, 18:00:58", "remaining_time": "3:11:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16740, "total_steps": 17540, "loss": 0.6521, "learning_rate": 1.2647013305882138e-07, "epoch": 9.541859636622728, "percentage": 95.44, "elapsed_time": "2 days, 18:03:20", "remaining_time": "3:09:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16750, "total_steps": 17540, "loss": 0.6556, "learning_rate": 1.2333461548938109e-07, "epoch": 9.547559672247951, "percentage": 95.5, "elapsed_time": "2 days, 18:05:41", "remaining_time": "3:07:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16760, "total_steps": 17540, "loss": 0.6442, "learning_rate": 1.2023821493844623e-07, "epoch": 9.553259707873174, "percentage": 95.55, "elapsed_time": "2 days, 18:08:03", "remaining_time": "3:04:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16770, "total_steps": 17540, "loss": 0.6393, "learning_rate": 1.1718094366946264e-07, "epoch": 9.558959743498397, "percentage": 95.61, "elapsed_time": "2 days, 18:10:25", "remaining_time": "3:02:18", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16780, "total_steps": 17540, "loss": 0.65, "learning_rate": 1.1416281379090343e-07, "epoch": 9.56465977912362, "percentage": 95.67, "elapsed_time": "2 days, 18:12:52", "remaining_time": "2:59:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16790, "total_steps": 17540, "loss": 0.6435, "learning_rate": 1.1118383725622018e-07, "epoch": 9.570359814748842, "percentage": 95.72, "elapsed_time": "2 days, 18:15:14", "remaining_time": "2:57:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16800, "total_steps": 17540, "loss": 0.6551, "learning_rate": 1.0824402586379512e-07, "epoch": 9.576059850374065, "percentage": 95.78, "elapsed_time": "2 days, 18:17:35", "remaining_time": "2:55:12", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16810, "total_steps": 17540, "loss": 0.6567, "learning_rate": 1.0534339125689686e-07, "epoch": 9.581759885999288, "percentage": 95.84, "elapsed_time": "2 days, 18:20:01", "remaining_time": "2:52:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16820, "total_steps": 17540, "loss": 0.6511, "learning_rate": 1.0248194492363028e-07, "epoch": 9.58745992162451, "percentage": 95.9, "elapsed_time": "2 days, 18:22:22", "remaining_time": "2:50:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16830, "total_steps": 17540, "loss": 0.656, "learning_rate": 9.965969819689558e-08, "epoch": 9.593159957249732, "percentage": 95.95, "elapsed_time": "2 days, 18:24:43", "remaining_time": "2:48:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16840, "total_steps": 17540, "loss": 0.6529, "learning_rate": 9.687666225433823e-08, "epoch": 9.598859992874955, "percentage": 96.01, "elapsed_time": "2 days, 18:27:09", "remaining_time": "2:45:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16850, "total_steps": 17540, "loss": 0.652, "learning_rate": 9.413284811830903e-08, "epoch": 9.604560028500178, "percentage": 96.07, "elapsed_time": "2 days, 18:29:30", "remaining_time": "2:43:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16860, "total_steps": 17540, "loss": 0.6439, "learning_rate": 9.142826665581972e-08, "epoch": 9.6102600641254, "percentage": 96.12, "elapsed_time": "2 days, 18:31:49", "remaining_time": "2:40:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16870, "total_steps": 17540, "loss": 0.6484, "learning_rate": 8.876292857849633e-08, "epoch": 9.615960099750623, "percentage": 96.18, "elapsed_time": "2 days, 18:34:08", "remaining_time": "2:38:37", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16880, "total_steps": 17540, "loss": 0.6562, "learning_rate": 8.613684444254256e-08, "epoch": 9.621660135375846, "percentage": 96.24, "elapsed_time": "2 days, 18:36:29", "remaining_time": "2:36:15", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16890, "total_steps": 17540, "loss": 0.6523, "learning_rate": 8.35500246486931e-08, "epoch": 9.627360171001069, "percentage": 96.29, "elapsed_time": "2 days, 18:38:55", "remaining_time": "2:33:53", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16900, "total_steps": 17540, "loss": 0.6578, "learning_rate": 8.100247944217488e-08, "epoch": 9.633060206626292, "percentage": 96.35, "elapsed_time": "2 days, 18:41:20", "remaining_time": "2:31:31", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16910, "total_steps": 17540, "loss": 0.6588, "learning_rate": 7.849421891266585e-08, "epoch": 9.638760242251514, "percentage": 96.41, "elapsed_time": "2 days, 18:43:49", "remaining_time": "2:29:10", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16920, "total_steps": 17540, "loss": 0.6483, "learning_rate": 7.602525299425623e-08, "epoch": 9.644460277876737, "percentage": 96.47, "elapsed_time": "2 days, 18:46:14", "remaining_time": "2:26:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16930, "total_steps": 17540, "loss": 0.6587, "learning_rate": 7.359559146540518e-08, "epoch": 9.65016031350196, "percentage": 96.52, "elapsed_time": "2 days, 18:48:39", "remaining_time": "2:24:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16940, "total_steps": 17540, "loss": 0.6544, "learning_rate": 7.120524394890748e-08, "epoch": 9.655860349127183, "percentage": 96.58, "elapsed_time": "2 days, 18:51:03", "remaining_time": "2:22:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16950, "total_steps": 17540, "loss": 0.6523, "learning_rate": 6.885421991185027e-08, "epoch": 9.661560384752406, "percentage": 96.64, "elapsed_time": "2 days, 18:53:21", "remaining_time": "2:19:41", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16960, "total_steps": 17540, "loss": 0.6407, "learning_rate": 6.654252866558186e-08, "epoch": 9.667260420377627, "percentage": 96.69, "elapsed_time": "2 days, 18:55:42", "remaining_time": "2:17:19", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16970, "total_steps": 17540, "loss": 0.6548, "learning_rate": 6.427017936566859e-08, "epoch": 9.67296045600285, "percentage": 96.75, "elapsed_time": "2 days, 18:58:09", "remaining_time": "2:14:57", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16980, "total_steps": 17540, "loss": 0.6543, "learning_rate": 6.203718101186141e-08, "epoch": 9.678660491628072, "percentage": 96.81, "elapsed_time": "2 days, 19:00:32", "remaining_time": "2:12:35", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 16990, "total_steps": 17540, "loss": 0.658, "learning_rate": 5.984354244805924e-08, "epoch": 9.684360527253295, "percentage": 96.86, "elapsed_time": "2 days, 19:02:54", "remaining_time": "2:10:13", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17000, "total_steps": 17540, "loss": 0.6614, "learning_rate": 5.768927236227684e-08, "epoch": 9.690060562878518, "percentage": 96.92, "elapsed_time": "2 days, 19:05:17", "remaining_time": "2:07:51", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17010, "total_steps": 17540, "loss": 0.6502, "learning_rate": 5.5574379286604805e-08, "epoch": 9.69576059850374, "percentage": 96.98, "elapsed_time": "2 days, 19:07:37", "remaining_time": "2:05:29", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17020, "total_steps": 17540, "loss": 0.6548, "learning_rate": 5.349887159718181e-08, "epoch": 9.701460634128964, "percentage": 97.04, "elapsed_time": "2 days, 19:10:04", "remaining_time": "2:03:07", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17030, "total_steps": 17540, "loss": 0.6551, "learning_rate": 5.146275751415908e-08, "epoch": 9.707160669754186, "percentage": 97.09, "elapsed_time": "2 days, 19:12:22", "remaining_time": "2:00:45", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17040, "total_steps": 17540, "loss": 0.6532, "learning_rate": 4.9466045101664864e-08, "epoch": 9.71286070537941, "percentage": 97.15, "elapsed_time": "2 days, 19:14:48", "remaining_time": "1:58:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17050, "total_steps": 17540, "loss": 0.6569, "learning_rate": 4.750874226777891e-08, "epoch": 9.718560741004632, "percentage": 97.21, "elapsed_time": "2 days, 19:17:06", "remaining_time": "1:56:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17060, "total_steps": 17540, "loss": 0.6481, "learning_rate": 4.5590856764492486e-08, "epoch": 9.724260776629855, "percentage": 97.26, "elapsed_time": "2 days, 19:19:26", "remaining_time": "1:53:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17070, "total_steps": 17540, "loss": 0.6484, "learning_rate": 4.37123961876873e-08, "epoch": 9.729960812255076, "percentage": 97.32, "elapsed_time": "2 days, 19:21:51", "remaining_time": "1:51:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17080, "total_steps": 17540, "loss": 0.6547, "learning_rate": 4.187336797709884e-08, "epoch": 9.735660847880299, "percentage": 97.38, "elapsed_time": "2 days, 19:24:12", "remaining_time": "1:48:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17090, "total_steps": 17540, "loss": 0.6528, "learning_rate": 4.007377941628754e-08, "epoch": 9.741360883505521, "percentage": 97.43, "elapsed_time": "2 days, 19:26:37", "remaining_time": "1:46:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17100, "total_steps": 17540, "loss": 0.6545, "learning_rate": 3.8313637632613196e-08, "epoch": 9.747060919130744, "percentage": 97.49, "elapsed_time": "2 days, 19:29:00", "remaining_time": "1:44:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17110, "total_steps": 17540, "loss": 0.6599, "learning_rate": 3.659294959720283e-08, "epoch": 9.752760954755967, "percentage": 97.55, "elapsed_time": "2 days, 19:31:17", "remaining_time": "1:41:48", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17120, "total_steps": 17540, "loss": 0.6463, "learning_rate": 3.491172212492733e-08, "epoch": 9.75846099038119, "percentage": 97.61, "elapsed_time": "2 days, 19:33:44", "remaining_time": "1:39:26", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17130, "total_steps": 17540, "loss": 0.6538, "learning_rate": 3.326996187436926e-08, "epoch": 9.764161026006413, "percentage": 97.66, "elapsed_time": "2 days, 19:36:05", "remaining_time": "1:37:04", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17140, "total_steps": 17540, "loss": 0.6571, "learning_rate": 3.1667675347801795e-08, "epoch": 9.769861061631635, "percentage": 97.72, "elapsed_time": "2 days, 19:38:25", "remaining_time": "1:34:42", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17150, "total_steps": 17540, "loss": 0.6555, "learning_rate": 3.0104868891159825e-08, "epoch": 9.775561097256858, "percentage": 97.78, "elapsed_time": "2 days, 19:40:47", "remaining_time": "1:32:20", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17160, "total_steps": 17540, "loss": 0.6623, "learning_rate": 2.8581548694013304e-08, "epoch": 9.781261132882081, "percentage": 97.83, "elapsed_time": "2 days, 19:43:08", "remaining_time": "1:29:58", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17170, "total_steps": 17540, "loss": 0.6466, "learning_rate": 2.709772078954842e-08, "epoch": 9.786961168507304, "percentage": 97.89, "elapsed_time": "2 days, 19:45:33", "remaining_time": "1:27:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17180, "total_steps": 17540, "loss": 0.653, "learning_rate": 2.565339105453757e-08, "epoch": 9.792661204132525, "percentage": 97.95, "elapsed_time": "2 days, 19:47:53", "remaining_time": "1:25:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17190, "total_steps": 17540, "loss": 0.651, "learning_rate": 2.4248565209320507e-08, "epoch": 9.798361239757748, "percentage": 98.0, "elapsed_time": "2 days, 19:50:14", "remaining_time": "1:22:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17200, "total_steps": 17540, "loss": 0.6567, "learning_rate": 2.2883248817777703e-08, "epoch": 9.80406127538297, "percentage": 98.06, "elapsed_time": "2 days, 19:52:34", "remaining_time": "1:20:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17210, "total_steps": 17540, "loss": 0.6516, "learning_rate": 2.1557447287312572e-08, "epoch": 9.809761311008193, "percentage": 98.12, "elapsed_time": "2 days, 19:54:52", "remaining_time": "1:18:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17220, "total_steps": 17540, "loss": 0.6609, "learning_rate": 2.0271165868828157e-08, "epoch": 9.815461346633416, "percentage": 98.18, "elapsed_time": "2 days, 19:57:13", "remaining_time": "1:15:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17230, "total_steps": 17540, "loss": 0.6652, "learning_rate": 1.9024409656703824e-08, "epoch": 9.821161382258639, "percentage": 98.23, "elapsed_time": "2 days, 19:59:30", "remaining_time": "1:13:23", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17240, "total_steps": 17540, "loss": 0.6531, "learning_rate": 1.7817183588778596e-08, "epoch": 9.826861417883862, "percentage": 98.29, "elapsed_time": "2 days, 20:01:55", "remaining_time": "1:11:01", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17250, "total_steps": 17540, "loss": 0.6479, "learning_rate": 1.6649492446332292e-08, "epoch": 9.832561453509085, "percentage": 98.35, "elapsed_time": "2 days, 20:04:16", "remaining_time": "1:08:39", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17260, "total_steps": 17540, "loss": 0.654, "learning_rate": 1.5521340854061097e-08, "epoch": 9.838261489134307, "percentage": 98.4, "elapsed_time": "2 days, 20:06:38", "remaining_time": "1:06:17", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17270, "total_steps": 17540, "loss": 0.6469, "learning_rate": 1.4432733280065336e-08, "epoch": 9.84396152475953, "percentage": 98.46, "elapsed_time": "2 days, 20:08:59", "remaining_time": "1:03:55", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17280, "total_steps": 17540, "loss": 0.6663, "learning_rate": 1.338367403583063e-08, "epoch": 9.849661560384753, "percentage": 98.52, "elapsed_time": "2 days, 20:11:26", "remaining_time": "1:01:33", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17290, "total_steps": 17540, "loss": 0.6425, "learning_rate": 1.2374167276205663e-08, "epoch": 9.855361596009976, "percentage": 98.57, "elapsed_time": "2 days, 20:13:49", "remaining_time": "0:59:11", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17300, "total_steps": 17540, "loss": 0.6497, "learning_rate": 1.1404216999391093e-08, "epoch": 9.861061631635197, "percentage": 98.63, "elapsed_time": "2 days, 20:16:06", "remaining_time": "0:56:49", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17310, "total_steps": 17540, "loss": 0.6605, "learning_rate": 1.0473827046925122e-08, "epoch": 9.86676166726042, "percentage": 98.69, "elapsed_time": "2 days, 20:18:23", "remaining_time": "0:54:27", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17320, "total_steps": 17540, "loss": 0.6522, "learning_rate": 9.583001103661283e-09, "epoch": 9.872461702885643, "percentage": 98.75, "elapsed_time": "2 days, 20:20:42", "remaining_time": "0:52:05", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17330, "total_steps": 17540, "loss": 0.6512, "learning_rate": 8.731742697758449e-09, "epoch": 9.878161738510865, "percentage": 98.8, "elapsed_time": "2 days, 20:23:01", "remaining_time": "0:49:43", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17340, "total_steps": 17540, "loss": 0.6636, "learning_rate": 7.92005520066974e-09, "epoch": 9.883861774136088, "percentage": 98.86, "elapsed_time": "2 days, 20:25:22", "remaining_time": "0:47:21", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17350, "total_steps": 17540, "loss": 0.6404, "learning_rate": 7.147941827121419e-09, "epoch": 9.889561809761311, "percentage": 98.92, "elapsed_time": "2 days, 20:27:45", "remaining_time": "0:44:59", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17360, "total_steps": 17540, "loss": 0.6488, "learning_rate": 6.415405635107341e-09, "epoch": 9.895261845386534, "percentage": 98.97, "elapsed_time": "2 days, 20:30:08", "remaining_time": "0:42:36", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17370, "total_steps": 17540, "loss": 0.6595, "learning_rate": 5.722449525873419e-09, "epoch": 9.900961881011757, "percentage": 99.03, "elapsed_time": "2 days, 20:32:31", "remaining_time": "0:40:14", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17380, "total_steps": 17540, "loss": 0.6578, "learning_rate": 5.069076243905402e-09, "epoch": 9.90666191663698, "percentage": 99.09, "elapsed_time": "2 days, 20:34:54", "remaining_time": "0:37:52", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17390, "total_steps": 17540, "loss": 0.6498, "learning_rate": 4.455288376921108e-09, "epoch": 9.912361952262202, "percentage": 99.14, "elapsed_time": "2 days, 20:37:17", "remaining_time": "0:35:30", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17400, "total_steps": 17540, "loss": 0.6547, "learning_rate": 3.881088355855989e-09, "epoch": 9.918061987887425, "percentage": 99.2, "elapsed_time": "2 days, 20:39:44", "remaining_time": "0:33:08", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17410, "total_steps": 17540, "loss": 0.651, "learning_rate": 3.346478454859803e-09, "epoch": 9.923762023512648, "percentage": 99.26, "elapsed_time": "2 days, 20:42:05", "remaining_time": "0:30:46", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17420, "total_steps": 17540, "loss": 0.6503, "learning_rate": 2.8514607912799586e-09, "epoch": 9.929462059137869, "percentage": 99.32, "elapsed_time": "2 days, 20:44:28", "remaining_time": "0:28:24", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17430, "total_steps": 17540, "loss": 0.6525, "learning_rate": 2.3960373256581846e-09, "epoch": 9.935162094763092, "percentage": 99.37, "elapsed_time": "2 days, 20:46:51", "remaining_time": "0:26:02", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17440, "total_steps": 17540, "loss": 0.6562, "learning_rate": 1.9802098617216494e-09, "epoch": 9.940862130388314, "percentage": 99.43, "elapsed_time": "2 days, 20:49:09", "remaining_time": "0:23:40", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17450, "total_steps": 17540, "loss": 0.6554, "learning_rate": 1.6039800463762966e-09, "epoch": 9.946562166013537, "percentage": 99.49, "elapsed_time": "2 days, 20:51:32", "remaining_time": "0:21:18", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17460, "total_steps": 17540, "loss": 0.6471, "learning_rate": 1.2673493696979677e-09, "epoch": 9.95226220163876, "percentage": 99.54, "elapsed_time": "2 days, 20:53:57", "remaining_time": "0:18:56", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17470, "total_steps": 17540, "loss": 0.6512, "learning_rate": 9.703191649279574e-10, "epoch": 9.957962237263983, "percentage": 99.6, "elapsed_time": "2 days, 20:56:17", "remaining_time": "0:16:34", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17480, "total_steps": 17540, "loss": 0.6526, "learning_rate": 7.128906084707954e-10, "epoch": 9.963662272889206, "percentage": 99.66, "elapsed_time": "2 days, 20:58:38", "remaining_time": "0:14:12", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17490, "total_steps": 17540, "loss": 0.6455, "learning_rate": 4.950647198842529e-10, "epoch": 9.969362308514429, "percentage": 99.71, "elapsed_time": "2 days, 21:01:00", "remaining_time": "0:11:50", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17500, "total_steps": 17540, "loss": 0.645, "learning_rate": 3.1684236187823345e-10, "epoch": 9.975062344139651, "percentage": 99.77, "elapsed_time": "2 days, 21:03:22", "remaining_time": "0:09:28", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17510, "total_steps": 17540, "loss": 0.6454, "learning_rate": 1.7822424031144203e-10, "epoch": 9.980762379764874, "percentage": 99.83, "elapsed_time": "2 days, 21:05:47", "remaining_time": "0:07:06", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17520, "total_steps": 17540, "loss": 0.6525, "learning_rate": 7.921090418805399e-11, "epoch": 9.986462415390097, "percentage": 99.89, "elapsed_time": "2 days, 21:08:09", "remaining_time": "0:04:44", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17530, "total_steps": 17540, "loss": 0.6616, "learning_rate": 1.980274565438478e-11, "epoch": 9.992162451015318, "percentage": 99.94, "elapsed_time": "2 days, 21:10:31", "remaining_time": "0:02:22", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17540, "total_steps": 17540, "loss": 0.6481, "learning_rate": 0.0, "epoch": 9.99786248664054, "percentage": 100.0, "elapsed_time": "2 days, 21:12:51", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} +{"current_steps": 17540, "total_steps": 17540, "epoch": 9.99786248664054, "percentage": 100.0, "elapsed_time": "2 days, 21:13:00", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}