{"current_steps": 10, "total_steps": 1850, "loss": 0.8622, "learning_rate": 5e-06, "epoch": 0.02702702702702703, "percentage": 0.54, "elapsed_time": "0:02:28", "remaining_time": "7:34:18"} {"current_steps": 20, "total_steps": 1850, "loss": 0.6871, "learning_rate": 5e-06, "epoch": 0.05405405405405406, "percentage": 1.08, "elapsed_time": "0:04:52", "remaining_time": "7:25:40"} {"current_steps": 30, "total_steps": 1850, "loss": 0.6496, "learning_rate": 5e-06, "epoch": 0.08108108108108109, "percentage": 1.62, "elapsed_time": "0:07:16", "remaining_time": "7:21:07"} {"current_steps": 40, "total_steps": 1850, "loss": 0.6379, "learning_rate": 5e-06, "epoch": 0.10810810810810811, "percentage": 2.16, "elapsed_time": "0:09:40", "remaining_time": "7:17:31"} {"current_steps": 50, "total_steps": 1850, "loss": 0.6224, "learning_rate": 5e-06, "epoch": 0.13513513513513514, "percentage": 2.7, "elapsed_time": "0:12:03", "remaining_time": "7:14:18"} {"current_steps": 60, "total_steps": 1850, "loss": 0.6158, "learning_rate": 5e-06, "epoch": 0.16216216216216217, "percentage": 3.24, "elapsed_time": "0:14:27", "remaining_time": "7:11:26"} {"current_steps": 70, "total_steps": 1850, "loss": 0.6121, "learning_rate": 5e-06, "epoch": 0.1891891891891892, "percentage": 3.78, "elapsed_time": "0:16:51", "remaining_time": "7:08:45"} {"current_steps": 80, "total_steps": 1850, "loss": 0.6048, "learning_rate": 5e-06, "epoch": 0.21621621621621623, "percentage": 4.32, "elapsed_time": "0:19:15", "remaining_time": "7:06:08"} {"current_steps": 90, "total_steps": 1850, "loss": 0.6027, "learning_rate": 5e-06, "epoch": 0.24324324324324326, "percentage": 4.86, "elapsed_time": "0:21:39", "remaining_time": "7:03:32"} {"current_steps": 100, "total_steps": 1850, "loss": 0.6057, "learning_rate": 5e-06, "epoch": 0.2702702702702703, "percentage": 5.41, "elapsed_time": "0:24:03", "remaining_time": "7:00:59"} {"current_steps": 110, "total_steps": 1850, "loss": 0.603, "learning_rate": 5e-06, "epoch": 0.2972972972972973, "percentage": 5.95, "elapsed_time": "0:26:27", "remaining_time": "6:58:30"} {"current_steps": 120, "total_steps": 1850, "loss": 0.5968, "learning_rate": 5e-06, "epoch": 0.32432432432432434, "percentage": 6.49, "elapsed_time": "0:28:50", "remaining_time": "6:55:53"} {"current_steps": 130, "total_steps": 1850, "loss": 0.5971, "learning_rate": 5e-06, "epoch": 0.35135135135135137, "percentage": 7.03, "elapsed_time": "0:31:14", "remaining_time": "6:53:18"} {"current_steps": 140, "total_steps": 1850, "loss": 0.5967, "learning_rate": 5e-06, "epoch": 0.3783783783783784, "percentage": 7.57, "elapsed_time": "0:33:37", "remaining_time": "6:50:47"} {"current_steps": 150, "total_steps": 1850, "loss": 0.588, "learning_rate": 5e-06, "epoch": 0.40540540540540543, "percentage": 8.11, "elapsed_time": "0:36:01", "remaining_time": "6:48:21"} {"current_steps": 160, "total_steps": 1850, "loss": 0.5911, "learning_rate": 5e-06, "epoch": 0.43243243243243246, "percentage": 8.65, "elapsed_time": "0:38:25", "remaining_time": "6:45:55"} {"current_steps": 170, "total_steps": 1850, "loss": 0.5929, "learning_rate": 5e-06, "epoch": 0.4594594594594595, "percentage": 9.19, "elapsed_time": "0:40:49", "remaining_time": "6:43:26"} {"current_steps": 180, "total_steps": 1850, "loss": 0.592, "learning_rate": 5e-06, "epoch": 0.4864864864864865, "percentage": 9.73, "elapsed_time": "0:43:13", "remaining_time": "6:40:58"} {"current_steps": 190, "total_steps": 1850, "loss": 0.5881, "learning_rate": 5e-06, "epoch": 0.5135135135135135, "percentage": 10.27, "elapsed_time": "0:45:37", "remaining_time": "6:38:33"} {"current_steps": 200, "total_steps": 1850, "loss": 0.5863, "learning_rate": 5e-06, "epoch": 0.5405405405405406, "percentage": 10.81, "elapsed_time": "0:48:00", "remaining_time": "6:36:08"} {"current_steps": 210, "total_steps": 1850, "loss": 0.5888, "learning_rate": 5e-06, "epoch": 0.5675675675675675, "percentage": 11.35, "elapsed_time": "0:50:24", "remaining_time": "6:33:42"} {"current_steps": 220, "total_steps": 1850, "loss": 0.5846, "learning_rate": 5e-06, "epoch": 0.5945945945945946, "percentage": 11.89, "elapsed_time": "0:52:48", "remaining_time": "6:31:14"} {"current_steps": 230, "total_steps": 1850, "loss": 0.5858, "learning_rate": 5e-06, "epoch": 0.6216216216216216, "percentage": 12.43, "elapsed_time": "0:55:12", "remaining_time": "6:28:49"} {"current_steps": 240, "total_steps": 1850, "loss": 0.5823, "learning_rate": 5e-06, "epoch": 0.6486486486486487, "percentage": 12.97, "elapsed_time": "0:57:36", "remaining_time": "6:26:25"} {"current_steps": 250, "total_steps": 1850, "loss": 0.5759, "learning_rate": 5e-06, "epoch": 0.6756756756756757, "percentage": 13.51, "elapsed_time": "1:00:00", "remaining_time": "6:24:00"} {"current_steps": 260, "total_steps": 1850, "loss": 0.5788, "learning_rate": 5e-06, "epoch": 0.7027027027027027, "percentage": 14.05, "elapsed_time": "1:02:24", "remaining_time": "6:21:36"} {"current_steps": 270, "total_steps": 1850, "loss": 0.5807, "learning_rate": 5e-06, "epoch": 0.7297297297297297, "percentage": 14.59, "elapsed_time": "1:04:48", "remaining_time": "6:19:12"} {"current_steps": 280, "total_steps": 1850, "loss": 0.5753, "learning_rate": 5e-06, "epoch": 0.7567567567567568, "percentage": 15.14, "elapsed_time": "1:07:12", "remaining_time": "6:16:48"} {"current_steps": 290, "total_steps": 1850, "loss": 0.5751, "learning_rate": 5e-06, "epoch": 0.7837837837837838, "percentage": 15.68, "elapsed_time": "1:09:36", "remaining_time": "6:14:24"} {"current_steps": 300, "total_steps": 1850, "loss": 0.5752, "learning_rate": 5e-06, "epoch": 0.8108108108108109, "percentage": 16.22, "elapsed_time": "1:12:00", "remaining_time": "6:12:00"} {"current_steps": 310, "total_steps": 1850, "loss": 0.5731, "learning_rate": 5e-06, "epoch": 0.8378378378378378, "percentage": 16.76, "elapsed_time": "1:14:24", "remaining_time": "6:09:36"} {"current_steps": 320, "total_steps": 1850, "loss": 0.5719, "learning_rate": 5e-06, "epoch": 0.8648648648648649, "percentage": 17.3, "elapsed_time": "1:16:48", "remaining_time": "6:07:12"} {"current_steps": 330, "total_steps": 1850, "loss": 0.5736, "learning_rate": 5e-06, "epoch": 0.8918918918918919, "percentage": 17.84, "elapsed_time": "1:19:12", "remaining_time": "6:04:48"} {"current_steps": 340, "total_steps": 1850, "loss": 0.581, "learning_rate": 5e-06, "epoch": 0.918918918918919, "percentage": 18.38, "elapsed_time": "1:21:36", "remaining_time": "6:02:24"} {"current_steps": 350, "total_steps": 1850, "loss": 0.5726, "learning_rate": 5e-06, "epoch": 0.9459459459459459, "percentage": 18.92, "elapsed_time": "1:24:00", "remaining_time": "6:00:00"} {"current_steps": 360, "total_steps": 1850, "loss": 0.5717, "learning_rate": 5e-06, "epoch": 0.972972972972973, "percentage": 19.46, "elapsed_time": "1:26:24", "remaining_time": "5:57:36"} {"current_steps": 370, "total_steps": 1850, "loss": 0.5735, "learning_rate": 5e-06, "epoch": 1.0, "percentage": 20.0, "elapsed_time": "1:28:47", "remaining_time": "5:55:08"} {"current_steps": 370, "total_steps": 1850, "eval_loss": 0.28570452332496643, "epoch": 1.0, "percentage": 20.0, "elapsed_time": "1:30:23", "remaining_time": "6:01:34"} {"current_steps": 380, "total_steps": 1850, "loss": 0.4828, "learning_rate": 5e-06, "epoch": 1.027027027027027, "percentage": 20.54, "elapsed_time": "1:33:31", "remaining_time": "6:01:47"} {"current_steps": 390, "total_steps": 1850, "loss": 0.4753, "learning_rate": 5e-06, "epoch": 1.054054054054054, "percentage": 21.08, "elapsed_time": "1:35:55", "remaining_time": "5:59:05"} {"current_steps": 400, "total_steps": 1850, "loss": 0.4799, "learning_rate": 5e-06, "epoch": 1.0810810810810811, "percentage": 21.62, "elapsed_time": "1:38:19", "remaining_time": "5:56:25"} {"current_steps": 410, "total_steps": 1850, "loss": 0.4728, "learning_rate": 5e-06, "epoch": 1.1081081081081081, "percentage": 22.16, "elapsed_time": "1:40:43", "remaining_time": "5:53:45"} {"current_steps": 420, "total_steps": 1850, "loss": 0.4775, "learning_rate": 5e-06, "epoch": 1.135135135135135, "percentage": 22.7, "elapsed_time": "1:43:07", "remaining_time": "5:51:06"} {"current_steps": 430, "total_steps": 1850, "loss": 0.484, "learning_rate": 5e-06, "epoch": 1.1621621621621623, "percentage": 23.24, "elapsed_time": "1:45:31", "remaining_time": "5:48:29"} {"current_steps": 440, "total_steps": 1850, "loss": 0.4749, "learning_rate": 5e-06, "epoch": 1.1891891891891893, "percentage": 23.78, "elapsed_time": "1:47:55", "remaining_time": "5:45:51"} {"current_steps": 450, "total_steps": 1850, "loss": 0.48, "learning_rate": 5e-06, "epoch": 1.2162162162162162, "percentage": 24.32, "elapsed_time": "1:50:19", "remaining_time": "5:43:14"} {"current_steps": 460, "total_steps": 1850, "loss": 0.4809, "learning_rate": 5e-06, "epoch": 1.2432432432432432, "percentage": 24.86, "elapsed_time": "1:52:43", "remaining_time": "5:40:37"} {"current_steps": 470, "total_steps": 1850, "loss": 0.481, "learning_rate": 5e-06, "epoch": 1.2702702702702702, "percentage": 25.41, "elapsed_time": "1:55:07", "remaining_time": "5:38:02"} {"current_steps": 480, "total_steps": 1850, "loss": 0.4764, "learning_rate": 5e-06, "epoch": 1.2972972972972974, "percentage": 25.95, "elapsed_time": "1:57:31", "remaining_time": "5:35:26"} {"current_steps": 490, "total_steps": 1850, "loss": 0.4761, "learning_rate": 5e-06, "epoch": 1.3243243243243243, "percentage": 26.49, "elapsed_time": "1:59:55", "remaining_time": "5:32:50"} {"current_steps": 500, "total_steps": 1850, "loss": 0.482, "learning_rate": 5e-06, "epoch": 1.3513513513513513, "percentage": 27.03, "elapsed_time": "2:02:19", "remaining_time": "5:30:15"} {"current_steps": 510, "total_steps": 1850, "loss": 0.4817, "learning_rate": 5e-06, "epoch": 1.3783783783783785, "percentage": 27.57, "elapsed_time": "2:04:43", "remaining_time": "5:27:41"} {"current_steps": 520, "total_steps": 1850, "loss": 0.4861, "learning_rate": 5e-06, "epoch": 1.4054054054054055, "percentage": 28.11, "elapsed_time": "2:07:07", "remaining_time": "5:25:07"} {"current_steps": 530, "total_steps": 1850, "loss": 0.4801, "learning_rate": 5e-06, "epoch": 1.4324324324324325, "percentage": 28.65, "elapsed_time": "2:09:30", "remaining_time": "5:22:33"} {"current_steps": 540, "total_steps": 1850, "loss": 0.4834, "learning_rate": 5e-06, "epoch": 1.4594594594594594, "percentage": 29.19, "elapsed_time": "2:11:54", "remaining_time": "5:19:59"} {"current_steps": 550, "total_steps": 1850, "loss": 0.4815, "learning_rate": 5e-06, "epoch": 1.4864864864864864, "percentage": 29.73, "elapsed_time": "2:14:18", "remaining_time": "5:17:26"} {"current_steps": 560, "total_steps": 1850, "loss": 0.4853, "learning_rate": 5e-06, "epoch": 1.5135135135135136, "percentage": 30.27, "elapsed_time": "2:16:42", "remaining_time": "5:14:53"} {"current_steps": 570, "total_steps": 1850, "loss": 0.4775, "learning_rate": 5e-06, "epoch": 1.5405405405405406, "percentage": 30.81, "elapsed_time": "2:19:05", "remaining_time": "5:12:21"} {"current_steps": 580, "total_steps": 1850, "loss": 0.484, "learning_rate": 5e-06, "epoch": 1.5675675675675675, "percentage": 31.35, "elapsed_time": "2:21:29", "remaining_time": "5:09:49"} {"current_steps": 590, "total_steps": 1850, "loss": 0.4842, "learning_rate": 5e-06, "epoch": 1.5945945945945947, "percentage": 31.89, "elapsed_time": "2:23:53", "remaining_time": "5:07:18"} {"current_steps": 600, "total_steps": 1850, "loss": 0.4815, "learning_rate": 5e-06, "epoch": 1.6216216216216215, "percentage": 32.43, "elapsed_time": "2:26:17", "remaining_time": "5:04:46"} {"current_steps": 610, "total_steps": 1850, "loss": 0.4803, "learning_rate": 5e-06, "epoch": 1.6486486486486487, "percentage": 32.97, "elapsed_time": "2:28:41", "remaining_time": "5:02:14"} {"current_steps": 620, "total_steps": 1850, "loss": 0.4867, "learning_rate": 5e-06, "epoch": 1.6756756756756757, "percentage": 33.51, "elapsed_time": "2:31:05", "remaining_time": "4:59:43"} {"current_steps": 630, "total_steps": 1850, "loss": 0.4898, "learning_rate": 5e-06, "epoch": 1.7027027027027026, "percentage": 34.05, "elapsed_time": "2:33:28", "remaining_time": "4:57:12"} {"current_steps": 640, "total_steps": 1850, "loss": 0.4903, "learning_rate": 5e-06, "epoch": 1.7297297297297298, "percentage": 34.59, "elapsed_time": "2:35:51", "remaining_time": "4:54:41"} {"current_steps": 650, "total_steps": 1850, "loss": 0.4832, "learning_rate": 5e-06, "epoch": 1.7567567567567568, "percentage": 35.14, "elapsed_time": "2:38:15", "remaining_time": "4:52:10"} {"current_steps": 660, "total_steps": 1850, "loss": 0.4825, "learning_rate": 5e-06, "epoch": 1.7837837837837838, "percentage": 35.68, "elapsed_time": "2:40:39", "remaining_time": "4:49:40"} {"current_steps": 670, "total_steps": 1850, "loss": 0.4826, "learning_rate": 5e-06, "epoch": 1.810810810810811, "percentage": 36.22, "elapsed_time": "2:43:03", "remaining_time": "4:47:11"} {"current_steps": 680, "total_steps": 1850, "loss": 0.4864, "learning_rate": 5e-06, "epoch": 1.8378378378378377, "percentage": 36.76, "elapsed_time": "2:45:27", "remaining_time": "4:44:41"} {"current_steps": 690, "total_steps": 1850, "loss": 0.485, "learning_rate": 5e-06, "epoch": 1.864864864864865, "percentage": 37.3, "elapsed_time": "2:47:51", "remaining_time": "4:42:11"} {"current_steps": 700, "total_steps": 1850, "loss": 0.4884, "learning_rate": 5e-06, "epoch": 1.8918918918918919, "percentage": 37.84, "elapsed_time": "2:50:15", "remaining_time": "4:39:41"} {"current_steps": 710, "total_steps": 1850, "loss": 0.4926, "learning_rate": 5e-06, "epoch": 1.9189189189189189, "percentage": 38.38, "elapsed_time": "2:52:39", "remaining_time": "4:37:12"} {"current_steps": 720, "total_steps": 1850, "loss": 0.4855, "learning_rate": 5e-06, "epoch": 1.945945945945946, "percentage": 38.92, "elapsed_time": "2:55:03", "remaining_time": "4:34:43"} {"current_steps": 730, "total_steps": 1850, "loss": 0.4845, "learning_rate": 5e-06, "epoch": 1.972972972972973, "percentage": 39.46, "elapsed_time": "2:57:27", "remaining_time": "4:32:15"} {"current_steps": 740, "total_steps": 1850, "loss": 0.4841, "learning_rate": 5e-06, "epoch": 2.0, "percentage": 40.0, "elapsed_time": "2:59:50", "remaining_time": "4:29:45"} {"current_steps": 740, "total_steps": 1850, "eval_loss": 0.2870478928089142, "epoch": 2.0, "percentage": 40.0, "elapsed_time": "3:01:26", "remaining_time": "4:32:10"} {"current_steps": 750, "total_steps": 1850, "loss": 0.3857, "learning_rate": 5e-06, "epoch": 2.027027027027027, "percentage": 40.54, "elapsed_time": "3:04:38", "remaining_time": "4:30:48"} {"current_steps": 760, "total_steps": 1850, "loss": 0.3828, "learning_rate": 5e-06, "epoch": 2.054054054054054, "percentage": 41.08, "elapsed_time": "3:07:02", "remaining_time": "4:28:15"} {"current_steps": 770, "total_steps": 1850, "loss": 0.3811, "learning_rate": 5e-06, "epoch": 2.081081081081081, "percentage": 41.62, "elapsed_time": "3:09:26", "remaining_time": "4:25:42"} {"current_steps": 780, "total_steps": 1850, "loss": 0.379, "learning_rate": 5e-06, "epoch": 2.108108108108108, "percentage": 42.16, "elapsed_time": "3:11:49", "remaining_time": "4:23:09"} {"current_steps": 790, "total_steps": 1850, "loss": 0.3804, "learning_rate": 5e-06, "epoch": 2.135135135135135, "percentage": 42.7, "elapsed_time": "3:14:13", "remaining_time": "4:20:36"} {"current_steps": 800, "total_steps": 1850, "loss": 0.3877, "learning_rate": 5e-06, "epoch": 2.1621621621621623, "percentage": 43.24, "elapsed_time": "3:16:37", "remaining_time": "4:18:04"} {"current_steps": 810, "total_steps": 1850, "loss": 0.3865, "learning_rate": 5e-06, "epoch": 2.189189189189189, "percentage": 43.78, "elapsed_time": "3:19:02", "remaining_time": "4:15:32"} {"current_steps": 820, "total_steps": 1850, "loss": 0.3847, "learning_rate": 5e-06, "epoch": 2.2162162162162162, "percentage": 44.32, "elapsed_time": "3:21:26", "remaining_time": "4:13:01"} {"current_steps": 830, "total_steps": 1850, "loss": 0.392, "learning_rate": 5e-06, "epoch": 2.2432432432432434, "percentage": 44.86, "elapsed_time": "3:23:50", "remaining_time": "4:10:29"} {"current_steps": 840, "total_steps": 1850, "loss": 0.394, "learning_rate": 5e-06, "epoch": 2.27027027027027, "percentage": 45.41, "elapsed_time": "3:26:14", "remaining_time": "4:07:58"} {"current_steps": 850, "total_steps": 1850, "loss": 0.3879, "learning_rate": 5e-06, "epoch": 2.2972972972972974, "percentage": 45.95, "elapsed_time": "3:28:38", "remaining_time": "4:05:27"} {"current_steps": 860, "total_steps": 1850, "loss": 0.3904, "learning_rate": 5e-06, "epoch": 2.3243243243243246, "percentage": 46.49, "elapsed_time": "3:31:02", "remaining_time": "4:02:56"} {"current_steps": 870, "total_steps": 1850, "loss": 0.397, "learning_rate": 5e-06, "epoch": 2.3513513513513513, "percentage": 47.03, "elapsed_time": "3:33:26", "remaining_time": "4:00:25"} {"current_steps": 880, "total_steps": 1850, "loss": 0.3931, "learning_rate": 5e-06, "epoch": 2.3783783783783785, "percentage": 47.57, "elapsed_time": "3:35:50", "remaining_time": "3:57:54"} {"current_steps": 890, "total_steps": 1850, "loss": 0.3938, "learning_rate": 5e-06, "epoch": 2.4054054054054053, "percentage": 48.11, "elapsed_time": "3:38:14", "remaining_time": "3:55:24"} {"current_steps": 900, "total_steps": 1850, "loss": 0.3916, "learning_rate": 5e-06, "epoch": 2.4324324324324325, "percentage": 48.65, "elapsed_time": "3:40:38", "remaining_time": "3:52:53"} {"current_steps": 910, "total_steps": 1850, "loss": 0.3881, "learning_rate": 5e-06, "epoch": 2.4594594594594597, "percentage": 49.19, "elapsed_time": "3:43:02", "remaining_time": "3:50:23"} {"current_steps": 920, "total_steps": 1850, "loss": 0.391, "learning_rate": 5e-06, "epoch": 2.4864864864864864, "percentage": 49.73, "elapsed_time": "3:45:26", "remaining_time": "3:47:53"} {"current_steps": 930, "total_steps": 1850, "loss": 0.391, "learning_rate": 5e-06, "epoch": 2.5135135135135136, "percentage": 50.27, "elapsed_time": "3:47:50", "remaining_time": "3:45:23"} {"current_steps": 940, "total_steps": 1850, "loss": 0.3979, "learning_rate": 5e-06, "epoch": 2.5405405405405403, "percentage": 50.81, "elapsed_time": "3:50:14", "remaining_time": "3:42:54"} {"current_steps": 950, "total_steps": 1850, "loss": 0.3963, "learning_rate": 5e-06, "epoch": 2.5675675675675675, "percentage": 51.35, "elapsed_time": "3:52:39", "remaining_time": "3:40:24"} {"current_steps": 960, "total_steps": 1850, "loss": 0.399, "learning_rate": 5e-06, "epoch": 2.5945945945945947, "percentage": 51.89, "elapsed_time": "3:55:03", "remaining_time": "3:37:54"} {"current_steps": 970, "total_steps": 1850, "loss": 0.4023, "learning_rate": 5e-06, "epoch": 2.6216216216216215, "percentage": 52.43, "elapsed_time": "3:57:27", "remaining_time": "3:35:25"} {"current_steps": 980, "total_steps": 1850, "loss": 0.4037, "learning_rate": 5e-06, "epoch": 2.6486486486486487, "percentage": 52.97, "elapsed_time": "3:59:51", "remaining_time": "3:32:56"} {"current_steps": 990, "total_steps": 1850, "loss": 0.4037, "learning_rate": 5e-06, "epoch": 2.6756756756756754, "percentage": 53.51, "elapsed_time": "4:02:15", "remaining_time": "3:30:26"} {"current_steps": 1000, "total_steps": 1850, "loss": 0.3945, "learning_rate": 5e-06, "epoch": 2.7027027027027026, "percentage": 54.05, "elapsed_time": "4:04:39", "remaining_time": "3:27:57"} {"current_steps": 1010, "total_steps": 1850, "loss": 0.4051, "learning_rate": 5e-06, "epoch": 2.72972972972973, "percentage": 54.59, "elapsed_time": "4:07:03", "remaining_time": "3:25:28"} {"current_steps": 1020, "total_steps": 1850, "loss": 0.406, "learning_rate": 5e-06, "epoch": 2.756756756756757, "percentage": 55.14, "elapsed_time": "4:09:26", "remaining_time": "3:22:58"} {"current_steps": 1030, "total_steps": 1850, "loss": 0.4029, "learning_rate": 5e-06, "epoch": 2.7837837837837838, "percentage": 55.68, "elapsed_time": "4:11:50", "remaining_time": "3:20:29"} {"current_steps": 1040, "total_steps": 1850, "loss": 0.4055, "learning_rate": 5e-06, "epoch": 2.810810810810811, "percentage": 56.22, "elapsed_time": "4:14:14", "remaining_time": "3:18:01"} {"current_steps": 1050, "total_steps": 1850, "loss": 0.4046, "learning_rate": 5e-06, "epoch": 2.8378378378378377, "percentage": 56.76, "elapsed_time": "4:16:38", "remaining_time": "3:15:32"} {"current_steps": 1060, "total_steps": 1850, "loss": 0.4016, "learning_rate": 5e-06, "epoch": 2.864864864864865, "percentage": 57.3, "elapsed_time": "4:19:02", "remaining_time": "3:13:03"} {"current_steps": 1070, "total_steps": 1850, "loss": 0.4079, "learning_rate": 5e-06, "epoch": 2.891891891891892, "percentage": 57.84, "elapsed_time": "4:21:26", "remaining_time": "3:10:35"} {"current_steps": 1080, "total_steps": 1850, "loss": 0.4049, "learning_rate": 5e-06, "epoch": 2.918918918918919, "percentage": 58.38, "elapsed_time": "4:23:51", "remaining_time": "3:08:07"} {"current_steps": 1090, "total_steps": 1850, "loss": 0.4065, "learning_rate": 5e-06, "epoch": 2.945945945945946, "percentage": 58.92, "elapsed_time": "4:26:15", "remaining_time": "3:05:38"} {"current_steps": 1100, "total_steps": 1850, "loss": 0.4066, "learning_rate": 5e-06, "epoch": 2.972972972972973, "percentage": 59.46, "elapsed_time": "4:28:39", "remaining_time": "3:03:10"} {"current_steps": 1110, "total_steps": 1850, "loss": 0.408, "learning_rate": 5e-06, "epoch": 3.0, "percentage": 60.0, "elapsed_time": "4:31:02", "remaining_time": "3:00:41"} {"current_steps": 1110, "total_steps": 1850, "eval_loss": 0.3071748912334442, "epoch": 3.0, "percentage": 60.0, "elapsed_time": "4:32:39", "remaining_time": "3:01:46"} {"current_steps": 1120, "total_steps": 1850, "loss": 0.2928, "learning_rate": 5e-06, "epoch": 3.027027027027027, "percentage": 60.54, "elapsed_time": "4:35:50", "remaining_time": "2:59:47"} {"current_steps": 1130, "total_steps": 1850, "loss": 0.2851, "learning_rate": 5e-06, "epoch": 3.054054054054054, "percentage": 61.08, "elapsed_time": "4:38:14", "remaining_time": "2:57:17"} {"current_steps": 1140, "total_steps": 1850, "loss": 0.2828, "learning_rate": 5e-06, "epoch": 3.081081081081081, "percentage": 61.62, "elapsed_time": "4:40:38", "remaining_time": "2:54:47"} {"current_steps": 1150, "total_steps": 1850, "loss": 0.2809, "learning_rate": 5e-06, "epoch": 3.108108108108108, "percentage": 62.16, "elapsed_time": "4:43:02", "remaining_time": "2:52:17"} {"current_steps": 1160, "total_steps": 1850, "loss": 0.2814, "learning_rate": 5e-06, "epoch": 3.135135135135135, "percentage": 62.7, "elapsed_time": "4:45:26", "remaining_time": "2:49:47"} {"current_steps": 1170, "total_steps": 1850, "loss": 0.2865, "learning_rate": 5e-06, "epoch": 3.1621621621621623, "percentage": 63.24, "elapsed_time": "4:47:50", "remaining_time": "2:47:17"} {"current_steps": 1180, "total_steps": 1850, "loss": 0.2851, "learning_rate": 5e-06, "epoch": 3.189189189189189, "percentage": 63.78, "elapsed_time": "4:50:14", "remaining_time": "2:44:47"} {"current_steps": 1190, "total_steps": 1850, "loss": 0.2874, "learning_rate": 5e-06, "epoch": 3.2162162162162162, "percentage": 64.32, "elapsed_time": "4:52:38", "remaining_time": "2:42:18"} {"current_steps": 1200, "total_steps": 1850, "loss": 0.2874, "learning_rate": 5e-06, "epoch": 3.2432432432432434, "percentage": 64.86, "elapsed_time": "4:55:03", "remaining_time": "2:39:49"} {"current_steps": 1210, "total_steps": 1850, "loss": 0.2921, "learning_rate": 5e-06, "epoch": 3.27027027027027, "percentage": 65.41, "elapsed_time": "4:57:27", "remaining_time": "2:37:19"} {"current_steps": 1220, "total_steps": 1850, "loss": 0.2891, "learning_rate": 5e-06, "epoch": 3.2972972972972974, "percentage": 65.95, "elapsed_time": "4:59:51", "remaining_time": "2:34:50"} {"current_steps": 1230, "total_steps": 1850, "loss": 0.287, "learning_rate": 5e-06, "epoch": 3.3243243243243246, "percentage": 66.49, "elapsed_time": "5:02:15", "remaining_time": "2:32:21"} {"current_steps": 1240, "total_steps": 1850, "loss": 0.2895, "learning_rate": 5e-06, "epoch": 3.3513513513513513, "percentage": 67.03, "elapsed_time": "5:04:39", "remaining_time": "2:29:52"} {"current_steps": 1250, "total_steps": 1850, "loss": 0.2865, "learning_rate": 5e-06, "epoch": 3.3783783783783785, "percentage": 67.57, "elapsed_time": "5:07:04", "remaining_time": "2:27:23"} {"current_steps": 1260, "total_steps": 1850, "loss": 0.2899, "learning_rate": 5e-06, "epoch": 3.4054054054054053, "percentage": 68.11, "elapsed_time": "5:09:28", "remaining_time": "2:24:54"} {"current_steps": 1270, "total_steps": 1850, "loss": 0.2907, "learning_rate": 5e-06, "epoch": 3.4324324324324325, "percentage": 68.65, "elapsed_time": "5:11:52", "remaining_time": "2:22:25"} {"current_steps": 1280, "total_steps": 1850, "loss": 0.291, "learning_rate": 5e-06, "epoch": 3.4594594594594597, "percentage": 69.19, "elapsed_time": "5:14:17", "remaining_time": "2:19:57"} {"current_steps": 1290, "total_steps": 1850, "loss": 0.2934, "learning_rate": 5e-06, "epoch": 3.4864864864864864, "percentage": 69.73, "elapsed_time": "5:16:41", "remaining_time": "2:17:28"} {"current_steps": 1300, "total_steps": 1850, "loss": 0.2878, "learning_rate": 5e-06, "epoch": 3.5135135135135136, "percentage": 70.27, "elapsed_time": "5:19:05", "remaining_time": "2:14:59"} {"current_steps": 1310, "total_steps": 1850, "loss": 0.2918, "learning_rate": 5e-06, "epoch": 3.5405405405405403, "percentage": 70.81, "elapsed_time": "5:21:28", "remaining_time": "2:12:31"} {"current_steps": 1320, "total_steps": 1850, "loss": 0.2943, "learning_rate": 5e-06, "epoch": 3.5675675675675675, "percentage": 71.35, "elapsed_time": "5:23:53", "remaining_time": "2:10:02"} {"current_steps": 1330, "total_steps": 1850, "loss": 0.2925, "learning_rate": 5e-06, "epoch": 3.5945945945945947, "percentage": 71.89, "elapsed_time": "5:26:17", "remaining_time": "2:07:34"} {"current_steps": 1340, "total_steps": 1850, "loss": 0.2955, "learning_rate": 5e-06, "epoch": 3.6216216216216215, "percentage": 72.43, "elapsed_time": "5:28:41", "remaining_time": "2:05:05"} {"current_steps": 1350, "total_steps": 1850, "loss": 0.2988, "learning_rate": 5e-06, "epoch": 3.6486486486486487, "percentage": 72.97, "elapsed_time": "5:31:05", "remaining_time": "2:02:37"} {"current_steps": 1360, "total_steps": 1850, "loss": 0.2954, "learning_rate": 5e-06, "epoch": 3.6756756756756754, "percentage": 73.51, "elapsed_time": "5:33:29", "remaining_time": "2:00:09"} {"current_steps": 1370, "total_steps": 1850, "loss": 0.2962, "learning_rate": 5e-06, "epoch": 3.7027027027027026, "percentage": 74.05, "elapsed_time": "5:35:52", "remaining_time": "1:57:40"} {"current_steps": 1380, "total_steps": 1850, "loss": 0.2991, "learning_rate": 5e-06, "epoch": 3.72972972972973, "percentage": 74.59, "elapsed_time": "5:38:16", "remaining_time": "1:55:12"} {"current_steps": 1390, "total_steps": 1850, "loss": 0.2997, "learning_rate": 5e-06, "epoch": 3.756756756756757, "percentage": 75.14, "elapsed_time": "5:40:41", "remaining_time": "1:52:44"} {"current_steps": 1400, "total_steps": 1850, "loss": 0.3012, "learning_rate": 5e-06, "epoch": 3.7837837837837838, "percentage": 75.68, "elapsed_time": "5:43:05", "remaining_time": "1:50:16"} {"current_steps": 1410, "total_steps": 1850, "loss": 0.3005, "learning_rate": 5e-06, "epoch": 3.810810810810811, "percentage": 76.22, "elapsed_time": "5:45:28", "remaining_time": "1:47:48"} {"current_steps": 1420, "total_steps": 1850, "loss": 0.3022, "learning_rate": 5e-06, "epoch": 3.8378378378378377, "percentage": 76.76, "elapsed_time": "5:47:52", "remaining_time": "1:45:20"} {"current_steps": 1430, "total_steps": 1850, "loss": 0.3018, "learning_rate": 5e-06, "epoch": 3.864864864864865, "percentage": 77.3, "elapsed_time": "5:50:16", "remaining_time": "1:42:52"} {"current_steps": 1440, "total_steps": 1850, "loss": 0.3019, "learning_rate": 5e-06, "epoch": 3.891891891891892, "percentage": 77.84, "elapsed_time": "5:52:41", "remaining_time": "1:40:25"} {"current_steps": 1450, "total_steps": 1850, "loss": 0.307, "learning_rate": 5e-06, "epoch": 3.918918918918919, "percentage": 78.38, "elapsed_time": "5:55:05", "remaining_time": "1:37:57"} {"current_steps": 1460, "total_steps": 1850, "loss": 0.3058, "learning_rate": 5e-06, "epoch": 3.945945945945946, "percentage": 78.92, "elapsed_time": "5:57:29", "remaining_time": "1:35:29"} {"current_steps": 1470, "total_steps": 1850, "loss": 0.3032, "learning_rate": 5e-06, "epoch": 3.972972972972973, "percentage": 79.46, "elapsed_time": "5:59:53", "remaining_time": "1:33:02"} {"current_steps": 1480, "total_steps": 1850, "loss": 0.3066, "learning_rate": 5e-06, "epoch": 4.0, "percentage": 80.0, "elapsed_time": "6:02:16", "remaining_time": "1:30:34"} {"current_steps": 1480, "total_steps": 1850, "eval_loss": 0.3498997688293457, "epoch": 4.0, "percentage": 80.0, "elapsed_time": "6:03:52", "remaining_time": "1:30:58"} {"current_steps": 1490, "total_steps": 1850, "loss": 0.1986, "learning_rate": 5e-06, "epoch": 4.027027027027027, "percentage": 80.54, "elapsed_time": "6:07:04", "remaining_time": "1:28:41"} {"current_steps": 1500, "total_steps": 1850, "loss": 0.1914, "learning_rate": 5e-06, "epoch": 4.054054054054054, "percentage": 81.08, "elapsed_time": "6:09:29", "remaining_time": "1:26:12"} {"current_steps": 1510, "total_steps": 1850, "loss": 0.1906, "learning_rate": 5e-06, "epoch": 4.081081081081081, "percentage": 81.62, "elapsed_time": "6:11:53", "remaining_time": "1:23:44"} {"current_steps": 1520, "total_steps": 1850, "loss": 0.1894, "learning_rate": 5e-06, "epoch": 4.108108108108108, "percentage": 82.16, "elapsed_time": "6:14:17", "remaining_time": "1:21:15"} {"current_steps": 1530, "total_steps": 1850, "loss": 0.1923, "learning_rate": 5e-06, "epoch": 4.135135135135135, "percentage": 82.7, "elapsed_time": "6:16:41", "remaining_time": "1:18:47"} {"current_steps": 1540, "total_steps": 1850, "loss": 0.1918, "learning_rate": 5e-06, "epoch": 4.162162162162162, "percentage": 83.24, "elapsed_time": "6:19:05", "remaining_time": "1:16:18"} {"current_steps": 1550, "total_steps": 1850, "loss": 0.1955, "learning_rate": 5e-06, "epoch": 4.1891891891891895, "percentage": 83.78, "elapsed_time": "6:21:29", "remaining_time": "1:13:50"} {"current_steps": 1560, "total_steps": 1850, "loss": 0.1967, "learning_rate": 5e-06, "epoch": 4.216216216216216, "percentage": 84.32, "elapsed_time": "6:23:53", "remaining_time": "1:11:21"} {"current_steps": 1570, "total_steps": 1850, "loss": 0.1973, "learning_rate": 5e-06, "epoch": 4.243243243243243, "percentage": 84.86, "elapsed_time": "6:26:18", "remaining_time": "1:08:53"} {"current_steps": 1580, "total_steps": 1850, "loss": 0.2001, "learning_rate": 5e-06, "epoch": 4.27027027027027, "percentage": 85.41, "elapsed_time": "6:28:41", "remaining_time": "1:06:25"} {"current_steps": 1590, "total_steps": 1850, "loss": 0.1999, "learning_rate": 5e-06, "epoch": 4.297297297297297, "percentage": 85.95, "elapsed_time": "6:31:05", "remaining_time": "1:03:57"} {"current_steps": 1600, "total_steps": 1850, "loss": 0.1977, "learning_rate": 5e-06, "epoch": 4.324324324324325, "percentage": 86.49, "elapsed_time": "6:33:29", "remaining_time": "1:01:29"} {"current_steps": 1610, "total_steps": 1850, "loss": 0.1988, "learning_rate": 5e-06, "epoch": 4.351351351351352, "percentage": 87.03, "elapsed_time": "6:35:53", "remaining_time": "0:59:00"} {"current_steps": 1620, "total_steps": 1850, "loss": 0.2016, "learning_rate": 5e-06, "epoch": 4.378378378378378, "percentage": 87.57, "elapsed_time": "6:38:17", "remaining_time": "0:56:32"} {"current_steps": 1630, "total_steps": 1850, "loss": 0.2045, "learning_rate": 5e-06, "epoch": 4.405405405405405, "percentage": 88.11, "elapsed_time": "6:40:41", "remaining_time": "0:54:04"} {"current_steps": 1640, "total_steps": 1850, "loss": 0.2049, "learning_rate": 5e-06, "epoch": 4.4324324324324325, "percentage": 88.65, "elapsed_time": "6:43:05", "remaining_time": "0:51:36"} {"current_steps": 1650, "total_steps": 1850, "loss": 0.2058, "learning_rate": 5e-06, "epoch": 4.45945945945946, "percentage": 89.19, "elapsed_time": "6:45:29", "remaining_time": "0:49:09"} {"current_steps": 1660, "total_steps": 1850, "loss": 0.2063, "learning_rate": 5e-06, "epoch": 4.486486486486487, "percentage": 89.73, "elapsed_time": "6:47:53", "remaining_time": "0:46:41"} {"current_steps": 1670, "total_steps": 1850, "loss": 0.2079, "learning_rate": 5e-06, "epoch": 4.513513513513513, "percentage": 90.27, "elapsed_time": "6:50:17", "remaining_time": "0:44:13"} {"current_steps": 1680, "total_steps": 1850, "loss": 0.2063, "learning_rate": 5e-06, "epoch": 4.54054054054054, "percentage": 90.81, "elapsed_time": "6:52:42", "remaining_time": "0:41:45"} {"current_steps": 1690, "total_steps": 1850, "loss": 0.2073, "learning_rate": 5e-06, "epoch": 4.5675675675675675, "percentage": 91.35, "elapsed_time": "6:55:05", "remaining_time": "0:39:17"} {"current_steps": 1700, "total_steps": 1850, "loss": 0.2064, "learning_rate": 5e-06, "epoch": 4.594594594594595, "percentage": 91.89, "elapsed_time": "6:57:29", "remaining_time": "0:36:50"} {"current_steps": 1710, "total_steps": 1850, "loss": 0.208, "learning_rate": 5e-06, "epoch": 4.621621621621622, "percentage": 92.43, "elapsed_time": "6:59:53", "remaining_time": "0:34:22"} {"current_steps": 1720, "total_steps": 1850, "loss": 0.2091, "learning_rate": 5e-06, "epoch": 4.648648648648649, "percentage": 92.97, "elapsed_time": "7:02:18", "remaining_time": "0:31:55"} {"current_steps": 1730, "total_steps": 1850, "loss": 0.2083, "learning_rate": 5e-06, "epoch": 4.675675675675675, "percentage": 93.51, "elapsed_time": "7:04:41", "remaining_time": "0:29:27"} {"current_steps": 1740, "total_steps": 1850, "loss": 0.2099, "learning_rate": 5e-06, "epoch": 4.702702702702703, "percentage": 94.05, "elapsed_time": "7:07:05", "remaining_time": "0:27:00"} {"current_steps": 1750, "total_steps": 1850, "loss": 0.2107, "learning_rate": 5e-06, "epoch": 4.72972972972973, "percentage": 94.59, "elapsed_time": "7:09:29", "remaining_time": "0:24:32"} {"current_steps": 1760, "total_steps": 1850, "loss": 0.2096, "learning_rate": 5e-06, "epoch": 4.756756756756757, "percentage": 95.14, "elapsed_time": "7:11:53", "remaining_time": "0:22:05"} {"current_steps": 1770, "total_steps": 1850, "loss": 0.2111, "learning_rate": 5e-06, "epoch": 4.783783783783784, "percentage": 95.68, "elapsed_time": "7:14:18", "remaining_time": "0:19:37"} {"current_steps": 1780, "total_steps": 1850, "loss": 0.2097, "learning_rate": 5e-06, "epoch": 4.8108108108108105, "percentage": 96.22, "elapsed_time": "7:16:42", "remaining_time": "0:17:10"} {"current_steps": 1790, "total_steps": 1850, "loss": 0.2132, "learning_rate": 5e-06, "epoch": 4.837837837837838, "percentage": 96.76, "elapsed_time": "7:19:06", "remaining_time": "0:14:43"} {"current_steps": 1800, "total_steps": 1850, "loss": 0.212, "learning_rate": 5e-06, "epoch": 4.864864864864865, "percentage": 97.3, "elapsed_time": "7:21:30", "remaining_time": "0:12:15"} {"current_steps": 1810, "total_steps": 1850, "loss": 0.2143, "learning_rate": 5e-06, "epoch": 4.891891891891892, "percentage": 97.84, "elapsed_time": "7:23:54", "remaining_time": "0:09:48"} {"current_steps": 1820, "total_steps": 1850, "loss": 0.2137, "learning_rate": 5e-06, "epoch": 4.918918918918919, "percentage": 98.38, "elapsed_time": "7:26:17", "remaining_time": "0:07:21"} {"current_steps": 1830, "total_steps": 1850, "loss": 0.2162, "learning_rate": 5e-06, "epoch": 4.945945945945946, "percentage": 98.92, "elapsed_time": "7:28:41", "remaining_time": "0:04:54"} {"current_steps": 1840, "total_steps": 1850, "loss": 0.215, "learning_rate": 5e-06, "epoch": 4.972972972972973, "percentage": 99.46, "elapsed_time": "7:31:06", "remaining_time": "0:02:27"} {"current_steps": 1850, "total_steps": 1850, "loss": 0.2144, "learning_rate": 5e-06, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "7:33:28", "remaining_time": "0:00:00"} {"current_steps": 1850, "total_steps": 1850, "eval_loss": 0.4100167155265808, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "7:35:51", "remaining_time": "0:00:00"} {"current_steps": 1850, "total_steps": 1850, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "7:36:34", "remaining_time": "0:00:00"}