{"current_steps": 1, "total_steps": 150, "loss": 4.0982, "learning_rate": 6.000000000000001e-08, "epoch": 0.06349206349206349, "percentage": 0.67, "elapsed_time": "0:00:32", "remaining_time": "1:21:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2, "total_steps": 150, "loss": 3.8959, "learning_rate": 1.2000000000000002e-07, "epoch": 0.12698412698412698, "percentage": 1.33, "elapsed_time": "0:00:49", "remaining_time": "1:01:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3, "total_steps": 150, "loss": 4.0292, "learning_rate": 1.8e-07, "epoch": 0.19047619047619047, "percentage": 2.0, "elapsed_time": "0:00:57", "remaining_time": "0:47:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4, "total_steps": 150, "loss": 4.1284, "learning_rate": 2.4000000000000003e-07, "epoch": 0.25396825396825395, "percentage": 2.67, "elapsed_time": "0:01:08", "remaining_time": "0:41:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5, "total_steps": 150, "loss": 4.188, "learning_rate": 3.0000000000000004e-07, "epoch": 0.31746031746031744, "percentage": 3.33, "elapsed_time": "0:01:17", "remaining_time": "0:37:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6, "total_steps": 150, "loss": 3.9705, "learning_rate": 3.6e-07, "epoch": 0.38095238095238093, "percentage": 4.0, "elapsed_time": "0:01:26", "remaining_time": "0:34:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7, "total_steps": 150, "loss": 3.8838, "learning_rate": 4.2000000000000006e-07, "epoch": 0.4444444444444444, "percentage": 4.67, "elapsed_time": "0:01:31", "remaining_time": "0:31:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8, "total_steps": 150, "loss": 4.1963, "learning_rate": 4.800000000000001e-07, "epoch": 0.5079365079365079, "percentage": 5.33, "elapsed_time": "0:01:37", "remaining_time": "0:28:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9, "total_steps": 150, "loss": 3.9283, "learning_rate": 5.4e-07, "epoch": 0.5714285714285714, "percentage": 6.0, "elapsed_time": "0:01:43", "remaining_time": "0:27:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10, "total_steps": 150, "loss": 3.8356, "learning_rate": 6.000000000000001e-07, "epoch": 0.6349206349206349, "percentage": 6.67, "elapsed_time": "0:01:49", "remaining_time": "0:25:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11, "total_steps": 150, "loss": 3.7757, "learning_rate": 6.6e-07, "epoch": 0.6984126984126984, "percentage": 7.33, "elapsed_time": "0:01:55", "remaining_time": "0:24:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12, "total_steps": 150, "loss": 3.9636, "learning_rate": 7.2e-07, "epoch": 0.7619047619047619, "percentage": 8.0, "elapsed_time": "0:02:01", "remaining_time": "0:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13, "total_steps": 150, "loss": 3.6742, "learning_rate": 7.8e-07, "epoch": 0.8253968253968254, "percentage": 8.67, "elapsed_time": "0:02:10", "remaining_time": "0:22:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14, "total_steps": 150, "loss": 3.768, "learning_rate": 8.400000000000001e-07, "epoch": 0.8888888888888888, "percentage": 9.33, "elapsed_time": "0:05:39", "remaining_time": "0:54:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15, "total_steps": 150, "loss": 3.8381, "learning_rate": 9e-07, "epoch": 0.9523809523809523, "percentage": 10.0, "elapsed_time": "0:05:53", "remaining_time": "0:53:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16, "total_steps": 150, "loss": 3.7314, "learning_rate": 9.600000000000001e-07, "epoch": 1.0158730158730158, "percentage": 10.67, "elapsed_time": "0:06:06", "remaining_time": "0:51:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17, "total_steps": 150, "loss": 3.8718, "learning_rate": 1.0200000000000002e-06, "epoch": 1.0793650793650793, "percentage": 11.33, "elapsed_time": "0:06:13", "remaining_time": "0:48:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18, "total_steps": 150, "loss": 3.3766, "learning_rate": 1.08e-06, "epoch": 1.1428571428571428, "percentage": 12.0, "elapsed_time": "0:06:23", "remaining_time": "0:46:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19, "total_steps": 150, "loss": 3.3699, "learning_rate": 1.14e-06, "epoch": 1.2063492063492063, "percentage": 12.67, "elapsed_time": "0:06:28", "remaining_time": "0:44:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 150, "loss": 3.4645, "learning_rate": 1.2000000000000002e-06, "epoch": 1.2698412698412698, "percentage": 13.33, "elapsed_time": "0:07:25", "remaining_time": "0:48:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21, "total_steps": 150, "loss": 3.2721, "learning_rate": 1.26e-06, "epoch": 1.3333333333333333, "percentage": 14.0, "elapsed_time": "0:08:34", "remaining_time": "0:52:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22, "total_steps": 150, "loss": 3.1558, "learning_rate": 1.32e-06, "epoch": 1.3968253968253967, "percentage": 14.67, "elapsed_time": "0:08:40", "remaining_time": "0:50:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23, "total_steps": 150, "loss": 3.2164, "learning_rate": 1.3800000000000001e-06, "epoch": 1.4603174603174602, "percentage": 15.33, "elapsed_time": "0:08:48", "remaining_time": "0:48:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24, "total_steps": 150, "loss": 3.0664, "learning_rate": 1.44e-06, "epoch": 1.5238095238095237, "percentage": 16.0, "elapsed_time": "0:08:58", "remaining_time": "0:47:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25, "total_steps": 150, "loss": 2.7536, "learning_rate": 1.5e-06, "epoch": 1.5873015873015874, "percentage": 16.67, "elapsed_time": "0:09:04", "remaining_time": "0:45:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26, "total_steps": 150, "loss": 2.4849, "learning_rate": 1.56e-06, "epoch": 1.6507936507936507, "percentage": 17.33, "elapsed_time": "0:09:12", "remaining_time": "0:43:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27, "total_steps": 150, "loss": 2.6918, "learning_rate": 1.6200000000000002e-06, "epoch": 1.7142857142857144, "percentage": 18.0, "elapsed_time": "0:09:21", "remaining_time": "0:42:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28, "total_steps": 150, "loss": 2.6273, "learning_rate": 1.6800000000000002e-06, "epoch": 1.7777777777777777, "percentage": 18.67, "elapsed_time": "0:09:27", "remaining_time": "0:41:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29, "total_steps": 150, "loss": 2.5829, "learning_rate": 1.7399999999999999e-06, "epoch": 1.8412698412698414, "percentage": 19.33, "elapsed_time": "0:09:33", "remaining_time": "0:39:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 150, "loss": 2.6698, "learning_rate": 1.8e-06, "epoch": 1.9047619047619047, "percentage": 20.0, "elapsed_time": "0:09:43", "remaining_time": "0:38:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 31, "total_steps": 150, "loss": 2.7849, "learning_rate": 1.86e-06, "epoch": 1.9682539682539684, "percentage": 20.67, "elapsed_time": "0:10:00", "remaining_time": "0:38:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 32, "total_steps": 150, "loss": 2.6262, "learning_rate": 1.9200000000000003e-06, "epoch": 2.0317460317460316, "percentage": 21.33, "elapsed_time": "0:10:15", "remaining_time": "0:37:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 33, "total_steps": 150, "loss": 2.405, "learning_rate": 1.98e-06, "epoch": 2.0952380952380953, "percentage": 22.0, "elapsed_time": "0:10:25", "remaining_time": "0:36:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 34, "total_steps": 150, "loss": 2.3917, "learning_rate": 2.0400000000000004e-06, "epoch": 2.1587301587301586, "percentage": 22.67, "elapsed_time": "0:10:30", "remaining_time": "0:35:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 35, "total_steps": 150, "loss": 2.2996, "learning_rate": 2.1e-06, "epoch": 2.2222222222222223, "percentage": 23.33, "elapsed_time": "0:10:36", "remaining_time": "0:34:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 36, "total_steps": 150, "loss": 2.4617, "learning_rate": 2.16e-06, "epoch": 2.2857142857142856, "percentage": 24.0, "elapsed_time": "0:10:48", "remaining_time": "0:34:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 37, "total_steps": 150, "loss": 2.4845, "learning_rate": 2.22e-06, "epoch": 2.3492063492063493, "percentage": 24.67, "elapsed_time": "0:10:54", "remaining_time": "0:33:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 38, "total_steps": 150, "loss": 2.2293, "learning_rate": 2.28e-06, "epoch": 2.4126984126984126, "percentage": 25.33, "elapsed_time": "0:10:59", "remaining_time": "0:32:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 39, "total_steps": 150, "loss": 2.2445, "learning_rate": 2.34e-06, "epoch": 2.4761904761904763, "percentage": 26.0, "elapsed_time": "0:11:08", "remaining_time": "0:31:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 150, "loss": 2.5632, "learning_rate": 2.4000000000000003e-06, "epoch": 2.5396825396825395, "percentage": 26.67, "elapsed_time": "0:11:15", "remaining_time": "0:30:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 41, "total_steps": 150, "loss": 1.9954, "learning_rate": 2.4599999999999997e-06, "epoch": 2.6031746031746033, "percentage": 27.33, "elapsed_time": "0:11:20", "remaining_time": "0:30:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 42, "total_steps": 150, "loss": 1.8782, "learning_rate": 2.52e-06, "epoch": 2.6666666666666665, "percentage": 28.0, "elapsed_time": "0:11:26", "remaining_time": "0:29:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 43, "total_steps": 150, "loss": 1.9382, "learning_rate": 2.58e-06, "epoch": 2.7301587301587302, "percentage": 28.67, "elapsed_time": "0:11:31", "remaining_time": "0:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 44, "total_steps": 150, "loss": 1.752, "learning_rate": 2.64e-06, "epoch": 2.7936507936507935, "percentage": 29.33, "elapsed_time": "0:11:37", "remaining_time": "0:27:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 45, "total_steps": 150, "loss": 1.9237, "learning_rate": 2.7e-06, "epoch": 2.857142857142857, "percentage": 30.0, "elapsed_time": "0:11:43", "remaining_time": "0:27:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 46, "total_steps": 150, "loss": 1.5944, "learning_rate": 2.7600000000000003e-06, "epoch": 2.9206349206349205, "percentage": 30.67, "elapsed_time": "0:12:40", "remaining_time": "0:28:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 47, "total_steps": 150, "loss": 1.6411, "learning_rate": 2.82e-06, "epoch": 2.984126984126984, "percentage": 31.33, "elapsed_time": "0:12:46", "remaining_time": "0:27:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 48, "total_steps": 150, "loss": 1.4512, "learning_rate": 2.88e-06, "epoch": 3.0476190476190474, "percentage": 32.0, "elapsed_time": "0:12:51", "remaining_time": "0:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 49, "total_steps": 150, "loss": 1.6913, "learning_rate": 2.9400000000000002e-06, "epoch": 3.111111111111111, "percentage": 32.67, "elapsed_time": "0:12:57", "remaining_time": "0:26:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 150, "loss": 1.6158, "learning_rate": 3e-06, "epoch": 3.1746031746031744, "percentage": 33.33, "elapsed_time": "0:13:03", "remaining_time": "0:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 51, "total_steps": 150, "loss": 1.6304, "learning_rate": 2.9992598405485977e-06, "epoch": 3.238095238095238, "percentage": 34.0, "elapsed_time": "0:13:32", "remaining_time": "0:26:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 52, "total_steps": 150, "loss": 1.3412, "learning_rate": 2.9970400926424076e-06, "epoch": 3.3015873015873014, "percentage": 34.67, "elapsed_time": "0:13:37", "remaining_time": "0:25:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 53, "total_steps": 150, "loss": 1.308, "learning_rate": 2.99334294690462e-06, "epoch": 3.365079365079365, "percentage": 35.33, "elapsed_time": "0:13:43", "remaining_time": "0:25:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 54, "total_steps": 150, "loss": 1.2513, "learning_rate": 2.988172051971717e-06, "epoch": 3.4285714285714284, "percentage": 36.0, "elapsed_time": "0:13:49", "remaining_time": "0:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 55, "total_steps": 150, "loss": 1.3811, "learning_rate": 2.981532510892707e-06, "epoch": 3.492063492063492, "percentage": 36.67, "elapsed_time": "0:13:54", "remaining_time": "0:24:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 56, "total_steps": 150, "loss": 1.2914, "learning_rate": 2.9734308760930334e-06, "epoch": 3.5555555555555554, "percentage": 37.33, "elapsed_time": "0:14:00", "remaining_time": "0:23:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 57, "total_steps": 150, "loss": 1.2351, "learning_rate": 2.9638751429081213e-06, "epoch": 3.619047619047619, "percentage": 38.0, "elapsed_time": "0:14:05", "remaining_time": "0:22:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 58, "total_steps": 150, "loss": 1.2103, "learning_rate": 2.9528747416929465e-06, "epoch": 3.682539682539683, "percentage": 38.67, "elapsed_time": "0:14:26", "remaining_time": "0:22:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 59, "total_steps": 150, "loss": 1.235, "learning_rate": 2.9404405285154148e-06, "epoch": 3.746031746031746, "percentage": 39.33, "elapsed_time": "0:16:22", "remaining_time": "0:25:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 150, "loss": 1.1033, "learning_rate": 2.9265847744427307e-06, "epoch": 3.8095238095238093, "percentage": 40.0, "elapsed_time": "0:16:28", "remaining_time": "0:24:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 61, "total_steps": 150, "loss": 1.2773, "learning_rate": 2.9113211534313383e-06, "epoch": 3.873015873015873, "percentage": 40.67, "elapsed_time": "0:16:35", "remaining_time": "0:24:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 62, "total_steps": 150, "loss": 1.1921, "learning_rate": 2.894664728832377e-06, "epoch": 3.9365079365079367, "percentage": 41.33, "elapsed_time": "0:17:37", "remaining_time": "0:25:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 63, "total_steps": 150, "loss": 1.0918, "learning_rate": 2.8766319385259716e-06, "epoch": 4.0, "percentage": 42.0, "elapsed_time": "0:18:05", "remaining_time": "0:24:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 64, "total_steps": 150, "loss": 0.9075, "learning_rate": 2.8572405786990296e-06, "epoch": 4.063492063492063, "percentage": 42.67, "elapsed_time": "0:18:22", "remaining_time": "0:24:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 65, "total_steps": 150, "loss": 1.0097, "learning_rate": 2.8365097862825516e-06, "epoch": 4.1269841269841265, "percentage": 43.33, "elapsed_time": "0:18:28", "remaining_time": "0:24:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 66, "total_steps": 150, "loss": 0.9625, "learning_rate": 2.814460020065795e-06, "epoch": 4.190476190476191, "percentage": 44.0, "elapsed_time": "0:18:46", "remaining_time": "0:23:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 67, "total_steps": 150, "loss": 0.9898, "learning_rate": 2.7911130405059155e-06, "epoch": 4.253968253968254, "percentage": 44.67, "elapsed_time": "0:18:56", "remaining_time": "0:23:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 68, "total_steps": 150, "loss": 0.978, "learning_rate": 2.7664918882530226e-06, "epoch": 4.317460317460317, "percentage": 45.33, "elapsed_time": "0:19:15", "remaining_time": "0:23:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 69, "total_steps": 150, "loss": 0.988, "learning_rate": 2.7406208614118425e-06, "epoch": 4.380952380952381, "percentage": 46.0, "elapsed_time": "0:19:26", "remaining_time": "0:22:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 150, "loss": 0.8734, "learning_rate": 2.713525491562421e-06, "epoch": 4.444444444444445, "percentage": 46.67, "elapsed_time": "0:19:34", "remaining_time": "0:22:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 71, "total_steps": 150, "loss": 0.7357, "learning_rate": 2.685232518563536e-06, "epoch": 4.507936507936508, "percentage": 47.33, "elapsed_time": "0:19:40", "remaining_time": "0:21:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 72, "total_steps": 150, "loss": 0.8909, "learning_rate": 2.655769864163684e-06, "epoch": 4.571428571428571, "percentage": 48.0, "elapsed_time": "0:19:45", "remaining_time": "0:21:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 73, "total_steps": 150, "loss": 0.78, "learning_rate": 2.6251666044456895e-06, "epoch": 4.634920634920634, "percentage": 48.67, "elapsed_time": "0:19:51", "remaining_time": "0:20:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 74, "total_steps": 150, "loss": 0.6989, "learning_rate": 2.5934529411321173e-06, "epoch": 4.698412698412699, "percentage": 49.33, "elapsed_time": "0:19:56", "remaining_time": "0:20:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 75, "total_steps": 150, "loss": 0.9173, "learning_rate": 2.5606601717798212e-06, "epoch": 4.761904761904762, "percentage": 50.0, "elapsed_time": "0:20:02", "remaining_time": "0:20:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 76, "total_steps": 150, "loss": 0.8555, "learning_rate": 2.526820658893033e-06, "epoch": 4.825396825396825, "percentage": 50.67, "elapsed_time": "0:20:07", "remaining_time": "0:19:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 77, "total_steps": 150, "loss": 0.768, "learning_rate": 2.491967797985478e-06, "epoch": 4.888888888888889, "percentage": 51.33, "elapsed_time": "0:20:45", "remaining_time": "0:19:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 78, "total_steps": 150, "loss": 0.6937, "learning_rate": 2.456135984623035e-06, "epoch": 4.9523809523809526, "percentage": 52.0, "elapsed_time": "0:20:51", "remaining_time": "0:19:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 79, "total_steps": 150, "loss": 0.8355, "learning_rate": 2.419360580479465e-06, "epoch": 5.015873015873016, "percentage": 52.67, "elapsed_time": "0:20:57", "remaining_time": "0:18:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 150, "loss": 0.6985, "learning_rate": 2.3816778784387097e-06, "epoch": 5.079365079365079, "percentage": 53.33, "elapsed_time": "0:21:11", "remaining_time": "0:18:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 81, "total_steps": 150, "loss": 0.6097, "learning_rate": 2.343125066778196e-06, "epoch": 5.142857142857143, "percentage": 54.0, "elapsed_time": "0:21:21", "remaining_time": "0:18:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 82, "total_steps": 150, "loss": 0.8029, "learning_rate": 2.303740192468495e-06, "epoch": 5.2063492063492065, "percentage": 54.67, "elapsed_time": "0:21:38", "remaining_time": "0:17:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 83, "total_steps": 150, "loss": 0.5835, "learning_rate": 2.263562123625557e-06, "epoch": 5.26984126984127, "percentage": 55.33, "elapsed_time": "0:22:35", "remaining_time": "0:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 84, "total_steps": 150, "loss": 0.628, "learning_rate": 2.222630511152573e-06, "epoch": 5.333333333333333, "percentage": 56.0, "elapsed_time": "0:22:55", "remaining_time": "0:18:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 85, "total_steps": 150, "loss": 0.7011, "learning_rate": 2.18098574960932e-06, "epoch": 5.396825396825397, "percentage": 56.67, "elapsed_time": "0:23:26", "remaining_time": "0:17:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 86, "total_steps": 150, "loss": 0.5918, "learning_rate": 2.138668937347609e-06, "epoch": 5.4603174603174605, "percentage": 57.33, "elapsed_time": "0:23:32", "remaining_time": "0:17:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 87, "total_steps": 150, "loss": 0.4842, "learning_rate": 2.0957218359521707e-06, "epoch": 5.523809523809524, "percentage": 58.0, "elapsed_time": "0:23:37", "remaining_time": "0:17:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 88, "total_steps": 150, "loss": 0.7194, "learning_rate": 2.0521868290270174e-06, "epoch": 5.587301587301587, "percentage": 58.67, "elapsed_time": "0:23:43", "remaining_time": "0:16:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 89, "total_steps": 150, "loss": 0.5915, "learning_rate": 2.0081068803679374e-06, "epoch": 5.650793650793651, "percentage": 59.33, "elapsed_time": "0:23:48", "remaining_time": "0:16:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 150, "loss": 0.6159, "learning_rate": 1.963525491562421e-06, "epoch": 5.714285714285714, "percentage": 60.0, "elapsed_time": "0:23:54", "remaining_time": "0:15:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 91, "total_steps": 150, "loss": 0.6515, "learning_rate": 1.918486659058844e-06, "epoch": 5.777777777777778, "percentage": 60.67, "elapsed_time": "0:24:00", "remaining_time": "0:15:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 92, "total_steps": 150, "loss": 0.4101, "learning_rate": 1.8730348307472826e-06, "epoch": 5.841269841269841, "percentage": 61.33, "elapsed_time": "0:24:05", "remaining_time": "0:15:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 93, "total_steps": 150, "loss": 0.5937, "learning_rate": 1.827214862094814e-06, "epoch": 5.904761904761905, "percentage": 62.0, "elapsed_time": "0:24:11", "remaining_time": "0:14:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 94, "total_steps": 150, "loss": 0.5382, "learning_rate": 1.7810719718785873e-06, "epoch": 5.968253968253968, "percentage": 62.67, "elapsed_time": "0:24:16", "remaining_time": "0:14:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 95, "total_steps": 150, "loss": 0.4762, "learning_rate": 1.7346516975603465e-06, "epoch": 6.031746031746032, "percentage": 63.33, "elapsed_time": "0:24:22", "remaining_time": "0:14:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 96, "total_steps": 150, "loss": 0.5713, "learning_rate": 1.6879998503464564e-06, "epoch": 6.095238095238095, "percentage": 64.0, "elapsed_time": "0:24:32", "remaining_time": "0:13:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 97, "total_steps": 150, "loss": 0.5565, "learning_rate": 1.6411624699777718e-06, "epoch": 6.158730158730159, "percentage": 64.67, "elapsed_time": "0:26:16", "remaining_time": "0:14:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 98, "total_steps": 150, "loss": 0.5058, "learning_rate": 1.5941857792939703e-06, "epoch": 6.222222222222222, "percentage": 65.33, "elapsed_time": "0:27:33", "remaining_time": "0:14:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 99, "total_steps": 150, "loss": 0.4028, "learning_rate": 1.5471161386171925e-06, "epoch": 6.285714285714286, "percentage": 66.0, "elapsed_time": "0:28:05", "remaining_time": "0:14:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 150, "loss": 0.4107, "learning_rate": 1.5e-06, "epoch": 6.349206349206349, "percentage": 66.67, "elapsed_time": "0:28:27", "remaining_time": "0:14:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 101, "total_steps": 150, "loss": 0.4851, "learning_rate": 1.4528838613828075e-06, "epoch": 6.412698412698413, "percentage": 67.33, "elapsed_time": "0:28:57", "remaining_time": "0:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 102, "total_steps": 150, "loss": 0.4957, "learning_rate": 1.40581422070603e-06, "epoch": 6.476190476190476, "percentage": 68.0, "elapsed_time": "0:29:03", "remaining_time": "0:13:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 103, "total_steps": 150, "loss": 0.4534, "learning_rate": 1.3588375300222285e-06, "epoch": 6.5396825396825395, "percentage": 68.67, "elapsed_time": "0:29:24", "remaining_time": "0:13:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 104, "total_steps": 150, "loss": 0.4615, "learning_rate": 1.3120001496535434e-06, "epoch": 6.603174603174603, "percentage": 69.33, "elapsed_time": "0:29:39", "remaining_time": "0:13:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 105, "total_steps": 150, "loss": 0.3708, "learning_rate": 1.2653483024396534e-06, "epoch": 6.666666666666667, "percentage": 70.0, "elapsed_time": "0:31:18", "remaining_time": "0:13:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 106, "total_steps": 150, "loss": 0.3618, "learning_rate": 1.2189280281214128e-06, "epoch": 6.73015873015873, "percentage": 70.67, "elapsed_time": "0:31:43", "remaining_time": "0:13:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 107, "total_steps": 150, "loss": 0.5127, "learning_rate": 1.1727851379051866e-06, "epoch": 6.7936507936507935, "percentage": 71.33, "elapsed_time": "0:31:58", "remaining_time": "0:12:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 108, "total_steps": 150, "loss": 0.3902, "learning_rate": 1.1269651692527181e-06, "epoch": 6.857142857142857, "percentage": 72.0, "elapsed_time": "0:32:19", "remaining_time": "0:12:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 109, "total_steps": 150, "loss": 0.4069, "learning_rate": 1.0815133409411564e-06, "epoch": 6.920634920634921, "percentage": 72.67, "elapsed_time": "0:32:30", "remaining_time": "0:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 150, "loss": 0.3469, "learning_rate": 1.036474508437579e-06, "epoch": 6.984126984126984, "percentage": 73.33, "elapsed_time": "0:32:42", "remaining_time": "0:11:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 111, "total_steps": 150, "loss": 0.3247, "learning_rate": 9.918931196320629e-07, "epoch": 7.0476190476190474, "percentage": 74.0, "elapsed_time": "0:32:56", "remaining_time": "0:11:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 112, "total_steps": 150, "loss": 0.3509, "learning_rate": 9.478131709729831e-07, "epoch": 7.111111111111111, "percentage": 74.67, "elapsed_time": "0:33:04", "remaining_time": "0:11:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 113, "total_steps": 150, "loss": 0.3648, "learning_rate": 9.042781640478293e-07, "epoch": 7.174603174603175, "percentage": 75.33, "elapsed_time": "0:33:13", "remaining_time": "0:10:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 114, "total_steps": 150, "loss": 0.2861, "learning_rate": 8.613310626523911e-07, "epoch": 7.238095238095238, "percentage": 76.0, "elapsed_time": "0:33:22", "remaining_time": "0:10:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 115, "total_steps": 150, "loss": 0.4778, "learning_rate": 8.190142503906799e-07, "epoch": 7.301587301587301, "percentage": 76.67, "elapsed_time": "0:35:21", "remaining_time": "0:10:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 116, "total_steps": 150, "loss": 0.3658, "learning_rate": 7.773694888474268e-07, "epoch": 7.365079365079365, "percentage": 77.33, "elapsed_time": "0:36:02", "remaining_time": "0:10:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 117, "total_steps": 150, "loss": 0.3291, "learning_rate": 7.36437876374443e-07, "epoch": 7.428571428571429, "percentage": 78.0, "elapsed_time": "0:36:09", "remaining_time": "0:10:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 118, "total_steps": 150, "loss": 0.2889, "learning_rate": 6.962598075315047e-07, "epoch": 7.492063492063492, "percentage": 78.67, "elapsed_time": "0:36:22", "remaining_time": "0:09:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 119, "total_steps": 150, "loss": 0.4034, "learning_rate": 6.568749332218045e-07, "epoch": 7.555555555555555, "percentage": 79.33, "elapsed_time": "0:36:33", "remaining_time": "0:09:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 150, "loss": 0.3604, "learning_rate": 6.183221215612905e-07, "epoch": 7.619047619047619, "percentage": 80.0, "elapsed_time": "0:36:43", "remaining_time": "0:09:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 121, "total_steps": 150, "loss": 0.3938, "learning_rate": 5.806394195205356e-07, "epoch": 7.682539682539683, "percentage": 80.67, "elapsed_time": "0:37:41", "remaining_time": "0:09:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 122, "total_steps": 150, "loss": 0.3031, "learning_rate": 5.438640153769653e-07, "epoch": 7.746031746031746, "percentage": 81.33, "elapsed_time": "0:37:59", "remaining_time": "0:08:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 123, "total_steps": 150, "loss": 0.3826, "learning_rate": 5.080322020145225e-07, "epoch": 7.809523809523809, "percentage": 82.0, "elapsed_time": "0:38:29", "remaining_time": "0:08:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 124, "total_steps": 150, "loss": 0.292, "learning_rate": 4.731793411069669e-07, "epoch": 7.8730158730158735, "percentage": 82.67, "elapsed_time": "0:39:05", "remaining_time": "0:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 125, "total_steps": 150, "loss": 0.4526, "learning_rate": 4.3933982822017883e-07, "epoch": 7.936507936507937, "percentage": 83.33, "elapsed_time": "0:39:41", "remaining_time": "0:07:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 126, "total_steps": 150, "loss": 0.3632, "learning_rate": 4.06547058867883e-07, "epoch": 8.0, "percentage": 84.0, "elapsed_time": "0:40:02", "remaining_time": "0:07:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 127, "total_steps": 150, "loss": 0.2562, "learning_rate": 3.748333955543106e-07, "epoch": 8.063492063492063, "percentage": 84.67, "elapsed_time": "0:40:57", "remaining_time": "0:07:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 128, "total_steps": 150, "loss": 0.237, "learning_rate": 3.442301358363163e-07, "epoch": 8.126984126984127, "percentage": 85.33, "elapsed_time": "0:41:41", "remaining_time": "0:07:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 129, "total_steps": 150, "loss": 0.2607, "learning_rate": 3.147674814364644e-07, "epoch": 8.19047619047619, "percentage": 86.0, "elapsed_time": "0:42:33", "remaining_time": "0:06:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 150, "loss": 0.2384, "learning_rate": 2.86474508437579e-07, "epoch": 8.253968253968253, "percentage": 86.67, "elapsed_time": "0:42:44", "remaining_time": "0:06:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 131, "total_steps": 150, "loss": 0.3726, "learning_rate": 2.593791385881571e-07, "epoch": 8.317460317460318, "percentage": 87.33, "elapsed_time": "0:42:51", "remaining_time": "0:06:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 132, "total_steps": 150, "loss": 0.3818, "learning_rate": 2.3350811174697772e-07, "epoch": 8.380952380952381, "percentage": 88.0, "elapsed_time": "0:43:12", "remaining_time": "0:05:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 133, "total_steps": 150, "loss": 0.4703, "learning_rate": 2.0888695949408471e-07, "epoch": 8.444444444444445, "percentage": 88.67, "elapsed_time": "0:43:20", "remaining_time": "0:05:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 134, "total_steps": 150, "loss": 0.357, "learning_rate": 1.8553997993420495e-07, "epoch": 8.507936507936508, "percentage": 89.33, "elapsed_time": "0:43:27", "remaining_time": "0:05:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 135, "total_steps": 150, "loss": 0.3128, "learning_rate": 1.634902137174483e-07, "epoch": 8.571428571428571, "percentage": 90.0, "elapsed_time": "0:43:45", "remaining_time": "0:04:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 136, "total_steps": 150, "loss": 0.3583, "learning_rate": 1.4275942130097098e-07, "epoch": 8.634920634920634, "percentage": 90.67, "elapsed_time": "0:43:50", "remaining_time": "0:04:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 137, "total_steps": 150, "loss": 0.3273, "learning_rate": 1.2336806147402828e-07, "epoch": 8.698412698412698, "percentage": 91.33, "elapsed_time": "0:43:58", "remaining_time": "0:04:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 138, "total_steps": 150, "loss": 0.298, "learning_rate": 1.0533527116762298e-07, "epoch": 8.761904761904763, "percentage": 92.0, "elapsed_time": "0:44:09", "remaining_time": "0:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 139, "total_steps": 150, "loss": 0.4737, "learning_rate": 8.867884656866182e-08, "epoch": 8.825396825396826, "percentage": 92.67, "elapsed_time": "0:44:14", "remaining_time": "0:03:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 150, "loss": 0.2492, "learning_rate": 7.341522555726971e-08, "epoch": 8.88888888888889, "percentage": 93.33, "elapsed_time": "0:44:27", "remaining_time": "0:03:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 141, "total_steps": 150, "loss": 0.2531, "learning_rate": 5.9559471484585404e-08, "epoch": 8.952380952380953, "percentage": 94.0, "elapsed_time": "0:44:46", "remaining_time": "0:02:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 142, "total_steps": 150, "loss": 0.2074, "learning_rate": 4.712525830705339e-08, "epoch": 9.015873015873016, "percentage": 94.67, "elapsed_time": "0:45:09", "remaining_time": "0:02:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 143, "total_steps": 150, "loss": 0.1696, "learning_rate": 3.6124857091878847e-08, "epoch": 9.079365079365079, "percentage": 95.33, "elapsed_time": "0:46:02", "remaining_time": "0:02:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 144, "total_steps": 150, "loss": 0.3333, "learning_rate": 2.6569123906967087e-08, "epoch": 9.142857142857142, "percentage": 96.0, "elapsed_time": "0:46:42", "remaining_time": "0:01:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 145, "total_steps": 150, "loss": 0.4033, "learning_rate": 1.846748910729351e-08, "epoch": 9.206349206349206, "percentage": 96.67, "elapsed_time": "0:47:19", "remaining_time": "0:01:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 146, "total_steps": 150, "loss": 0.3716, "learning_rate": 1.1827948028283353e-08, "epoch": 9.26984126984127, "percentage": 97.33, "elapsed_time": "0:47:43", "remaining_time": "0:01:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 147, "total_steps": 150, "loss": 0.3588, "learning_rate": 6.657053095380006e-09, "epoch": 9.333333333333334, "percentage": 98.0, "elapsed_time": "0:48:04", "remaining_time": "0:00:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 148, "total_steps": 150, "loss": 0.2379, "learning_rate": 2.9599073575926614e-09, "epoch": 9.396825396825397, "percentage": 98.67, "elapsed_time": "0:48:21", "remaining_time": "0:00:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 149, "total_steps": 150, "loss": 0.2427, "learning_rate": 7.401594514026e-10, "epoch": 9.46031746031746, "percentage": 99.33, "elapsed_time": "0:48:39", "remaining_time": "0:00:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 150, "loss": 0.2553, "learning_rate": 0.0, "epoch": 9.523809523809524, "percentage": 100.0, "elapsed_time": "0:48:56", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 150, "epoch": 9.523809523809524, "percentage": 100.0, "elapsed_time": "0:49:15", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}