Training in progress, epoch 4
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9794765bc3af9adb8ce0974ff7ed5e3e369f0b45fd2ba1b2c2635db42b41ac76
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9944277146fa6c909423248575399792ee6af650dbb31fb99396de30ef4106d2
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eccdb3b8a73684018b8b4d9abe1d4a1523398685ee736a76a854e989398bd2e2
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a35c1e9126588164fc165c97d2807bc5d4bfdca3b7f94dd1a5165e18caf83098
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -806,3 +806,250 @@
|
|
806 |
{"current_steps": 806, "total_steps": 1235, "loss": 0.0173, "lr": 1.2997471016172188e-05, "epoch": 3.263157894736842, "percentage": 65.26, "elapsed_time": "4:30:49", "remaining_time": "2:24:08"}
|
807 |
{"current_steps": 807, "total_steps": 1235, "loss": 0.0164, "lr": 1.2944524510000042e-05, "epoch": 3.2672064777327936, "percentage": 65.34, "elapsed_time": "4:31:12", "remaining_time": "2:23:50"}
|
808 |
{"current_steps": 808, "total_steps": 1235, "loss": 0.0145, "lr": 1.2891634419221908e-05, "epoch": 3.2712550607287447, "percentage": 65.43, "elapsed_time": "4:31:31", "remaining_time": "2:23:29"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
806 |
{"current_steps": 806, "total_steps": 1235, "loss": 0.0173, "lr": 1.2997471016172188e-05, "epoch": 3.263157894736842, "percentage": 65.26, "elapsed_time": "4:30:49", "remaining_time": "2:24:08"}
|
807 |
{"current_steps": 807, "total_steps": 1235, "loss": 0.0164, "lr": 1.2944524510000042e-05, "epoch": 3.2672064777327936, "percentage": 65.34, "elapsed_time": "4:31:12", "remaining_time": "2:23:50"}
|
808 |
{"current_steps": 808, "total_steps": 1235, "loss": 0.0145, "lr": 1.2891634419221908e-05, "epoch": 3.2712550607287447, "percentage": 65.43, "elapsed_time": "4:31:31", "remaining_time": "2:23:29"}
|
809 |
+
{"current_steps": 809, "total_steps": 1235, "loss": 0.0111, "lr": 1.2838801166745545e-05, "epoch": 3.2753036437246963, "percentage": 65.51, "elapsed_time": "4:31:53", "remaining_time": "2:23:10"}
|
810 |
+
{"current_steps": 810, "total_steps": 1235, "loss": 0.0119, "lr": 1.2786025175024216e-05, "epoch": 3.279352226720648, "percentage": 65.59, "elapsed_time": "4:32:15", "remaining_time": "2:22:51"}
|
811 |
+
{"current_steps": 811, "total_steps": 1235, "loss": 0.0105, "lr": 1.2733306866053357e-05, "epoch": 3.283400809716599, "percentage": 65.67, "elapsed_time": "4:32:32", "remaining_time": "2:22:29"}
|
812 |
+
{"current_steps": 812, "total_steps": 1235, "loss": 0.0144, "lr": 1.2680646661367163e-05, "epoch": 3.2874493927125505, "percentage": 65.75, "elapsed_time": "4:32:55", "remaining_time": "2:22:10"}
|
813 |
+
{"current_steps": 813, "total_steps": 1235, "loss": 0.0126, "lr": 1.2628044982035219e-05, "epoch": 3.291497975708502, "percentage": 65.83, "elapsed_time": "4:33:15", "remaining_time": "2:21:50"}
|
814 |
+
{"current_steps": 814, "total_steps": 1235, "loss": 0.0123, "lr": 1.2575502248659155e-05, "epoch": 3.2955465587044532, "percentage": 65.91, "elapsed_time": "4:33:37", "remaining_time": "2:21:31"}
|
815 |
+
{"current_steps": 815, "total_steps": 1235, "loss": 0.0128, "lr": 1.2523018881369269e-05, "epoch": 3.299595141700405, "percentage": 65.99, "elapsed_time": "4:33:56", "remaining_time": "2:21:10"}
|
816 |
+
{"current_steps": 816, "total_steps": 1235, "loss": 0.0116, "lr": 1.2470595299821176e-05, "epoch": 3.3036437246963564, "percentage": 66.07, "elapsed_time": "4:34:16", "remaining_time": "2:20:50"}
|
817 |
+
{"current_steps": 817, "total_steps": 1235, "loss": 0.0135, "lr": 1.2418231923192416e-05, "epoch": 3.3076923076923075, "percentage": 66.15, "elapsed_time": "4:34:37", "remaining_time": "2:20:30"}
|
818 |
+
{"current_steps": 818, "total_steps": 1235, "loss": 0.0125, "lr": 1.2365929170179165e-05, "epoch": 3.311740890688259, "percentage": 66.23, "elapsed_time": "4:34:57", "remaining_time": "2:20:10"}
|
819 |
+
{"current_steps": 819, "total_steps": 1235, "loss": 0.0142, "lr": 1.2313687458992848e-05, "epoch": 3.3157894736842106, "percentage": 66.32, "elapsed_time": "4:35:18", "remaining_time": "2:19:50"}
|
820 |
+
{"current_steps": 820, "total_steps": 1235, "loss": 0.0135, "lr": 1.2261507207356785e-05, "epoch": 3.3198380566801617, "percentage": 66.4, "elapsed_time": "4:35:36", "remaining_time": "2:19:29"}
|
821 |
+
{"current_steps": 821, "total_steps": 1235, "loss": 0.0121, "lr": 1.220938883250288e-05, "epoch": 3.3238866396761133, "percentage": 66.48, "elapsed_time": "4:35:54", "remaining_time": "2:19:07"}
|
822 |
+
{"current_steps": 822, "total_steps": 1235, "loss": 0.0099, "lr": 1.215733275116827e-05, "epoch": 3.327935222672065, "percentage": 66.56, "elapsed_time": "4:36:13", "remaining_time": "2:18:46"}
|
823 |
+
{"current_steps": 823, "total_steps": 1235, "loss": 0.0122, "lr": 1.2105339379592005e-05, "epoch": 3.331983805668016, "percentage": 66.64, "elapsed_time": "4:36:33", "remaining_time": "2:18:26"}
|
824 |
+
{"current_steps": 824, "total_steps": 1235, "loss": 0.0161, "lr": 1.2053409133511681e-05, "epoch": 3.3360323886639676, "percentage": 66.72, "elapsed_time": "4:36:55", "remaining_time": "2:18:07"}
|
825 |
+
{"current_steps": 825, "total_steps": 1235, "loss": 0.0107, "lr": 1.2001542428160173e-05, "epoch": 3.340080971659919, "percentage": 66.8, "elapsed_time": "4:37:16", "remaining_time": "2:17:47"}
|
826 |
+
{"current_steps": 826, "total_steps": 1235, "loss": 0.0097, "lr": 1.1949739678262278e-05, "epoch": 3.3441295546558703, "percentage": 66.88, "elapsed_time": "4:37:30", "remaining_time": "2:17:24"}
|
827 |
+
{"current_steps": 827, "total_steps": 1235, "loss": 0.0119, "lr": 1.189800129803139e-05, "epoch": 3.348178137651822, "percentage": 66.96, "elapsed_time": "4:37:49", "remaining_time": "2:17:03"}
|
828 |
+
{"current_steps": 828, "total_steps": 1235, "loss": 0.0108, "lr": 1.1846327701166228e-05, "epoch": 3.3522267206477734, "percentage": 67.04, "elapsed_time": "4:38:06", "remaining_time": "2:16:42"}
|
829 |
+
{"current_steps": 829, "total_steps": 1235, "loss": 0.0093, "lr": 1.1794719300847493e-05, "epoch": 3.3562753036437245, "percentage": 67.13, "elapsed_time": "4:38:24", "remaining_time": "2:16:21"}
|
830 |
+
{"current_steps": 830, "total_steps": 1235, "loss": 0.0147, "lr": 1.1743176509734582e-05, "epoch": 3.360323886639676, "percentage": 67.21, "elapsed_time": "4:38:44", "remaining_time": "2:16:00"}
|
831 |
+
{"current_steps": 831, "total_steps": 1235, "loss": 0.0107, "lr": 1.1691699739962275e-05, "epoch": 3.3643724696356276, "percentage": 67.29, "elapsed_time": "4:39:03", "remaining_time": "2:15:40"}
|
832 |
+
{"current_steps": 832, "total_steps": 1235, "loss": 0.0134, "lr": 1.1640289403137456e-05, "epoch": 3.3684210526315788, "percentage": 67.37, "elapsed_time": "4:39:22", "remaining_time": "2:15:19"}
|
833 |
+
{"current_steps": 833, "total_steps": 1235, "loss": 0.0133, "lr": 1.1588945910335802e-05, "epoch": 3.3724696356275303, "percentage": 67.45, "elapsed_time": "4:39:41", "remaining_time": "2:14:58"}
|
834 |
+
{"current_steps": 834, "total_steps": 1235, "loss": 0.0118, "lr": 1.1537669672098517e-05, "epoch": 3.376518218623482, "percentage": 67.53, "elapsed_time": "4:40:02", "remaining_time": "2:14:38"}
|
835 |
+
{"current_steps": 835, "total_steps": 1235, "loss": 0.0117, "lr": 1.1486461098429036e-05, "epoch": 3.380566801619433, "percentage": 67.61, "elapsed_time": "4:40:22", "remaining_time": "2:14:18"}
|
836 |
+
{"current_steps": 836, "total_steps": 1235, "loss": 0.0086, "lr": 1.1435320598789747e-05, "epoch": 3.3846153846153846, "percentage": 67.69, "elapsed_time": "4:40:41", "remaining_time": "2:13:58"}
|
837 |
+
{"current_steps": 837, "total_steps": 1235, "loss": 0.0118, "lr": 1.1384248582098736e-05, "epoch": 3.388663967611336, "percentage": 67.77, "elapsed_time": "4:41:00", "remaining_time": "2:13:37"}
|
838 |
+
{"current_steps": 838, "total_steps": 1235, "loss": 0.0128, "lr": 1.1333245456726467e-05, "epoch": 3.3927125506072873, "percentage": 67.85, "elapsed_time": "4:41:20", "remaining_time": "2:13:16"}
|
839 |
+
{"current_steps": 839, "total_steps": 1235, "loss": 0.0123, "lr": 1.128231163049258e-05, "epoch": 3.396761133603239, "percentage": 67.94, "elapsed_time": "4:41:40", "remaining_time": "2:12:56"}
|
840 |
+
{"current_steps": 840, "total_steps": 1235, "loss": 0.0132, "lr": 1.123144751066259e-05, "epoch": 3.4008097165991904, "percentage": 68.02, "elapsed_time": "4:42:01", "remaining_time": "2:12:37"}
|
841 |
+
{"current_steps": 841, "total_steps": 1235, "loss": 0.0057, "lr": 1.1180653503944657e-05, "epoch": 3.4048582995951415, "percentage": 68.1, "elapsed_time": "4:42:17", "remaining_time": "2:12:14"}
|
842 |
+
{"current_steps": 842, "total_steps": 1235, "loss": 0.0111, "lr": 1.1129930016486287e-05, "epoch": 3.408906882591093, "percentage": 68.18, "elapsed_time": "4:42:37", "remaining_time": "2:11:55"}
|
843 |
+
{"current_steps": 843, "total_steps": 1235, "loss": 0.0115, "lr": 1.107927745387114e-05, "epoch": 3.4129554655870447, "percentage": 68.26, "elapsed_time": "4:42:58", "remaining_time": "2:11:35"}
|
844 |
+
{"current_steps": 844, "total_steps": 1235, "loss": 0.0097, "lr": 1.1028696221115766e-05, "epoch": 3.417004048582996, "percentage": 68.34, "elapsed_time": "4:43:19", "remaining_time": "2:11:15"}
|
845 |
+
{"current_steps": 845, "total_steps": 1235, "loss": 0.0103, "lr": 1.0978186722666341e-05, "epoch": 3.4210526315789473, "percentage": 68.42, "elapsed_time": "4:43:41", "remaining_time": "2:10:56"}
|
846 |
+
{"current_steps": 846, "total_steps": 1235, "loss": 0.0107, "lr": 1.0927749362395475e-05, "epoch": 3.425101214574899, "percentage": 68.5, "elapsed_time": "4:44:01", "remaining_time": "2:10:35"}
|
847 |
+
{"current_steps": 847, "total_steps": 1235, "loss": 0.0121, "lr": 1.0877384543598954e-05, "epoch": 3.42914979757085, "percentage": 68.58, "elapsed_time": "4:44:20", "remaining_time": "2:10:15"}
|
848 |
+
{"current_steps": 848, "total_steps": 1235, "loss": 0.0098, "lr": 1.0827092668992529e-05, "epoch": 3.4331983805668016, "percentage": 68.66, "elapsed_time": "4:44:41", "remaining_time": "2:09:55"}
|
849 |
+
{"current_steps": 849, "total_steps": 1235, "loss": 0.0124, "lr": 1.077687414070869e-05, "epoch": 3.437246963562753, "percentage": 68.74, "elapsed_time": "4:44:57", "remaining_time": "2:09:33"}
|
850 |
+
{"current_steps": 850, "total_steps": 1235, "loss": 0.0113, "lr": 1.0726729360293451e-05, "epoch": 3.4412955465587043, "percentage": 68.83, "elapsed_time": "4:45:20", "remaining_time": "2:09:14"}
|
851 |
+
{"current_steps": 851, "total_steps": 1235, "loss": 0.0123, "lr": 1.0676658728703147e-05, "epoch": 3.445344129554656, "percentage": 68.91, "elapsed_time": "4:45:41", "remaining_time": "2:08:54"}
|
852 |
+
{"current_steps": 852, "total_steps": 1235, "loss": 0.0105, "lr": 1.0626662646301198e-05, "epoch": 3.4493927125506074, "percentage": 68.99, "elapsed_time": "4:46:01", "remaining_time": "2:08:34"}
|
853 |
+
{"current_steps": 853, "total_steps": 1235, "loss": 0.0097, "lr": 1.0576741512854958e-05, "epoch": 3.4534412955465585, "percentage": 69.07, "elapsed_time": "4:46:20", "remaining_time": "2:08:14"}
|
854 |
+
{"current_steps": 854, "total_steps": 1235, "loss": 0.0108, "lr": 1.052689572753247e-05, "epoch": 3.45748987854251, "percentage": 69.15, "elapsed_time": "4:46:40", "remaining_time": "2:07:53"}
|
855 |
+
{"current_steps": 855, "total_steps": 1235, "loss": 0.0106, "lr": 1.0477125688899328e-05, "epoch": 3.4615384615384617, "percentage": 69.23, "elapsed_time": "4:47:01", "remaining_time": "2:07:34"}
|
856 |
+
{"current_steps": 856, "total_steps": 1235, "loss": 0.0077, "lr": 1.0427431794915406e-05, "epoch": 3.465587044534413, "percentage": 69.31, "elapsed_time": "4:47:21", "remaining_time": "2:07:13"}
|
857 |
+
{"current_steps": 857, "total_steps": 1235, "loss": 0.0119, "lr": 1.0377814442931769e-05, "epoch": 3.4696356275303644, "percentage": 69.39, "elapsed_time": "4:47:42", "remaining_time": "2:06:54"}
|
858 |
+
{"current_steps": 858, "total_steps": 1235, "loss": 0.0109, "lr": 1.0328274029687439e-05, "epoch": 3.473684210526316, "percentage": 69.47, "elapsed_time": "4:48:02", "remaining_time": "2:06:33"}
|
859 |
+
{"current_steps": 859, "total_steps": 1235, "loss": 0.0108, "lr": 1.0278810951306253e-05, "epoch": 3.477732793522267, "percentage": 69.55, "elapsed_time": "4:48:24", "remaining_time": "2:06:14"}
|
860 |
+
{"current_steps": 860, "total_steps": 1235, "loss": 0.0094, "lr": 1.0229425603293647e-05, "epoch": 3.4817813765182186, "percentage": 69.64, "elapsed_time": "4:48:41", "remaining_time": "2:05:52"}
|
861 |
+
{"current_steps": 861, "total_steps": 1235, "loss": 0.0102, "lr": 1.0180118380533558e-05, "epoch": 3.48582995951417, "percentage": 69.72, "elapsed_time": "4:48:59", "remaining_time": "2:05:31"}
|
862 |
+
{"current_steps": 862, "total_steps": 1235, "loss": 0.0124, "lr": 1.0130889677285225e-05, "epoch": 3.4898785425101213, "percentage": 69.8, "elapsed_time": "4:49:20", "remaining_time": "2:05:12"}
|
863 |
+
{"current_steps": 863, "total_steps": 1235, "loss": 0.0095, "lr": 1.008173988718005e-05, "epoch": 3.493927125506073, "percentage": 69.88, "elapsed_time": "4:49:40", "remaining_time": "2:04:52"}
|
864 |
+
{"current_steps": 864, "total_steps": 1235, "loss": 0.0068, "lr": 1.0032669403218439e-05, "epoch": 3.4979757085020244, "percentage": 69.96, "elapsed_time": "4:49:58", "remaining_time": "2:04:30"}
|
865 |
+
{"current_steps": 865, "total_steps": 1235, "loss": 0.009, "lr": 9.983678617766677e-06, "epoch": 3.5020242914979756, "percentage": 70.04, "elapsed_time": "4:50:18", "remaining_time": "2:04:10"}
|
866 |
+
{"current_steps": 866, "total_steps": 1235, "loss": 0.0111, "lr": 9.934767922553788e-06, "epoch": 3.506072874493927, "percentage": 70.12, "elapsed_time": "4:50:39", "remaining_time": "2:03:50"}
|
867 |
+
{"current_steps": 867, "total_steps": 1235, "loss": 0.0082, "lr": 9.885937708668371e-06, "epoch": 3.5101214574898787, "percentage": 70.2, "elapsed_time": "4:50:58", "remaining_time": "2:03:30"}
|
868 |
+
{"current_steps": 868, "total_steps": 1235, "loss": 0.0134, "lr": 9.837188366555524e-06, "epoch": 3.51417004048583, "percentage": 70.28, "elapsed_time": "4:51:20", "remaining_time": "2:03:10"}
|
869 |
+
{"current_steps": 869, "total_steps": 1235, "loss": 0.0111, "lr": 9.788520286013691e-06, "epoch": 3.5182186234817814, "percentage": 70.36, "elapsed_time": "4:51:41", "remaining_time": "2:02:51"}
|
870 |
+
{"current_steps": 870, "total_steps": 1235, "loss": 0.0055, "lr": 9.739933856191537e-06, "epoch": 3.522267206477733, "percentage": 70.45, "elapsed_time": "4:52:00", "remaining_time": "2:02:30"}
|
871 |
+
{"current_steps": 871, "total_steps": 1235, "loss": 0.0084, "lr": 9.691429465584866e-06, "epoch": 3.526315789473684, "percentage": 70.53, "elapsed_time": "4:52:18", "remaining_time": "2:02:09"}
|
872 |
+
{"current_steps": 872, "total_steps": 1235, "loss": 0.0082, "lr": 9.643007502033492e-06, "epoch": 3.5303643724696356, "percentage": 70.61, "elapsed_time": "4:52:37", "remaining_time": "2:01:49"}
|
873 |
+
{"current_steps": 873, "total_steps": 1235, "loss": 0.0092, "lr": 9.594668352718152e-06, "epoch": 3.534412955465587, "percentage": 70.69, "elapsed_time": "4:52:56", "remaining_time": "2:01:28"}
|
874 |
+
{"current_steps": 874, "total_steps": 1235, "loss": 0.0108, "lr": 9.546412404157383e-06, "epoch": 3.5384615384615383, "percentage": 70.77, "elapsed_time": "4:53:17", "remaining_time": "2:01:08"}
|
875 |
+
{"current_steps": 875, "total_steps": 1235, "loss": 0.0088, "lr": 9.498240042204471e-06, "epoch": 3.54251012145749, "percentage": 70.85, "elapsed_time": "4:53:38", "remaining_time": "2:00:48"}
|
876 |
+
{"current_steps": 876, "total_steps": 1235, "loss": 0.0102, "lr": 9.450151652044339e-06, "epoch": 3.5465587044534415, "percentage": 70.93, "elapsed_time": "4:53:56", "remaining_time": "2:00:27"}
|
877 |
+
{"current_steps": 877, "total_steps": 1235, "loss": 0.009, "lr": 9.402147618190472e-06, "epoch": 3.5506072874493926, "percentage": 71.01, "elapsed_time": "4:54:17", "remaining_time": "2:00:07"}
|
878 |
+
{"current_steps": 878, "total_steps": 1235, "loss": 0.0095, "lr": 9.354228324481841e-06, "epoch": 3.554655870445344, "percentage": 71.09, "elapsed_time": "4:54:36", "remaining_time": "1:59:47"}
|
879 |
+
{"current_steps": 879, "total_steps": 1235, "loss": 0.0059, "lr": 9.306394154079852e-06, "epoch": 3.5587044534412957, "percentage": 71.17, "elapsed_time": "4:54:54", "remaining_time": "1:59:26"}
|
880 |
+
{"current_steps": 880, "total_steps": 1235, "loss": 0.0124, "lr": 9.258645489465254e-06, "epoch": 3.562753036437247, "percentage": 71.26, "elapsed_time": "4:55:15", "remaining_time": "1:59:06"}
|
881 |
+
{"current_steps": 881, "total_steps": 1235, "loss": 0.0086, "lr": 9.21098271243509e-06, "epoch": 3.5668016194331984, "percentage": 71.34, "elapsed_time": "4:55:32", "remaining_time": "1:58:45"}
|
882 |
+
{"current_steps": 882, "total_steps": 1235, "loss": 0.009, "lr": 9.163406204099659e-06, "epoch": 3.57085020242915, "percentage": 71.42, "elapsed_time": "4:55:52", "remaining_time": "1:58:25"}
|
883 |
+
{"current_steps": 883, "total_steps": 1235, "loss": 0.0092, "lr": 9.115916344879452e-06, "epoch": 3.574898785425101, "percentage": 71.5, "elapsed_time": "4:56:13", "remaining_time": "1:58:05"}
|
884 |
+
{"current_steps": 884, "total_steps": 1235, "loss": 0.0119, "lr": 9.068513514502126e-06, "epoch": 3.5789473684210527, "percentage": 71.58, "elapsed_time": "4:56:33", "remaining_time": "1:57:45"}
|
885 |
+
{"current_steps": 885, "total_steps": 1235, "loss": 0.0095, "lr": 9.021198091999439e-06, "epoch": 3.582995951417004, "percentage": 71.66, "elapsed_time": "4:56:54", "remaining_time": "1:57:25"}
|
886 |
+
{"current_steps": 886, "total_steps": 1235, "loss": 0.0073, "lr": 8.973970455704251e-06, "epoch": 3.5870445344129553, "percentage": 71.74, "elapsed_time": "4:57:13", "remaining_time": "1:57:04"}
|
887 |
+
{"current_steps": 887, "total_steps": 1235, "loss": 0.0082, "lr": 8.926830983247495e-06, "epoch": 3.591093117408907, "percentage": 71.82, "elapsed_time": "4:57:33", "remaining_time": "1:56:44"}
|
888 |
+
{"current_steps": 888, "total_steps": 1235, "loss": 0.0107, "lr": 8.879780051555116e-06, "epoch": 3.5951417004048585, "percentage": 71.9, "elapsed_time": "4:57:54", "remaining_time": "1:56:24"}
|
889 |
+
{"current_steps": 889, "total_steps": 1235, "loss": 0.0078, "lr": 8.83281803684512e-06, "epoch": 3.5991902834008096, "percentage": 71.98, "elapsed_time": "4:58:13", "remaining_time": "1:56:04"}
|
890 |
+
{"current_steps": 890, "total_steps": 1235, "loss": 0.0081, "lr": 8.785945314624532e-06, "epoch": 3.603238866396761, "percentage": 72.06, "elapsed_time": "4:58:33", "remaining_time": "1:55:43"}
|
891 |
+
{"current_steps": 891, "total_steps": 1235, "loss": 0.0052, "lr": 8.739162259686385e-06, "epoch": 3.6072874493927127, "percentage": 72.15, "elapsed_time": "4:58:48", "remaining_time": "1:55:21"}
|
892 |
+
{"current_steps": 892, "total_steps": 1235, "loss": 0.0064, "lr": 8.692469246106734e-06, "epoch": 3.611336032388664, "percentage": 72.23, "elapsed_time": "4:59:07", "remaining_time": "1:55:01"}
|
893 |
+
{"current_steps": 893, "total_steps": 1235, "loss": 0.0063, "lr": 8.645866647241677e-06, "epoch": 3.6153846153846154, "percentage": 72.31, "elapsed_time": "4:59:26", "remaining_time": "1:54:40"}
|
894 |
+
{"current_steps": 894, "total_steps": 1235, "loss": 0.0121, "lr": 8.599354835724348e-06, "epoch": 3.619433198380567, "percentage": 72.39, "elapsed_time": "4:59:46", "remaining_time": "1:54:20"}
|
895 |
+
{"current_steps": 895, "total_steps": 1235, "loss": 0.0086, "lr": 8.552934183461958e-06, "epoch": 3.623481781376518, "percentage": 72.47, "elapsed_time": "5:00:07", "remaining_time": "1:54:00"}
|
896 |
+
{"current_steps": 896, "total_steps": 1235, "loss": 0.0048, "lr": 8.506605061632805e-06, "epoch": 3.6275303643724697, "percentage": 72.55, "elapsed_time": "5:00:25", "remaining_time": "1:53:40"}
|
897 |
+
{"current_steps": 897, "total_steps": 1235, "loss": 0.006, "lr": 8.460367840683308e-06, "epoch": 3.6315789473684212, "percentage": 72.63, "elapsed_time": "5:00:45", "remaining_time": "1:53:19"}
|
898 |
+
{"current_steps": 898, "total_steps": 1235, "loss": 0.0059, "lr": 8.414222890325065e-06, "epoch": 3.6356275303643724, "percentage": 72.71, "elapsed_time": "5:01:05", "remaining_time": "1:52:59"}
|
899 |
+
{"current_steps": 899, "total_steps": 1235, "loss": 0.008, "lr": 8.368170579531855e-06, "epoch": 3.639676113360324, "percentage": 72.79, "elapsed_time": "5:01:27", "remaining_time": "1:52:40"}
|
900 |
+
{"current_steps": 900, "total_steps": 1235, "loss": 0.0081, "lr": 8.322211276536733e-06, "epoch": 3.6437246963562755, "percentage": 72.87, "elapsed_time": "5:01:46", "remaining_time": "1:52:19"}
|
901 |
+
{"current_steps": 901, "total_steps": 1235, "loss": 0.0096, "lr": 8.27634534882907e-06, "epoch": 3.6477732793522266, "percentage": 72.96, "elapsed_time": "5:02:07", "remaining_time": "1:51:59"}
|
902 |
+
{"current_steps": 902, "total_steps": 1235, "loss": 0.0063, "lr": 8.230573163151585e-06, "epoch": 3.651821862348178, "percentage": 73.04, "elapsed_time": "5:02:28", "remaining_time": "1:51:40"}
|
903 |
+
{"current_steps": 903, "total_steps": 1235, "loss": 0.007, "lr": 8.184895085497466e-06, "epoch": 3.6558704453441297, "percentage": 73.12, "elapsed_time": "5:02:48", "remaining_time": "1:51:20"}
|
904 |
+
{"current_steps": 904, "total_steps": 1235, "loss": 0.0064, "lr": 8.139311481107401e-06, "epoch": 3.659919028340081, "percentage": 73.2, "elapsed_time": "5:03:08", "remaining_time": "1:50:59"}
|
905 |
+
{"current_steps": 905, "total_steps": 1235, "loss": 0.0062, "lr": 8.093822714466686e-06, "epoch": 3.6639676113360324, "percentage": 73.28, "elapsed_time": "5:03:27", "remaining_time": "1:50:39"}
|
906 |
+
{"current_steps": 906, "total_steps": 1235, "loss": 0.0056, "lr": 8.048429149302271e-06, "epoch": 3.668016194331984, "percentage": 73.36, "elapsed_time": "5:03:46", "remaining_time": "1:50:18"}
|
907 |
+
{"current_steps": 907, "total_steps": 1235, "loss": 0.0067, "lr": 8.003131148579902e-06, "epoch": 3.672064777327935, "percentage": 73.44, "elapsed_time": "5:04:06", "remaining_time": "1:49:58"}
|
908 |
+
{"current_steps": 908, "total_steps": 1235, "loss": 0.0075, "lr": 7.957929074501182e-06, "epoch": 3.6761133603238867, "percentage": 73.52, "elapsed_time": "5:04:24", "remaining_time": "1:49:37"}
|
909 |
+
{"current_steps": 909, "total_steps": 1235, "loss": 0.0056, "lr": 7.912823288500695e-06, "epoch": 3.6801619433198383, "percentage": 73.6, "elapsed_time": "5:04:43", "remaining_time": "1:49:17"}
|
910 |
+
{"current_steps": 910, "total_steps": 1235, "loss": 0.0053, "lr": 7.867814151243102e-06, "epoch": 3.6842105263157894, "percentage": 73.68, "elapsed_time": "5:05:03", "remaining_time": "1:48:57"}
|
911 |
+
{"current_steps": 911, "total_steps": 1235, "loss": 0.0083, "lr": 7.822902022620267e-06, "epoch": 3.688259109311741, "percentage": 73.77, "elapsed_time": "5:05:22", "remaining_time": "1:48:36"}
|
912 |
+
{"current_steps": 912, "total_steps": 1235, "loss": 0.006, "lr": 7.778087261748377e-06, "epoch": 3.6923076923076925, "percentage": 73.85, "elapsed_time": "5:05:41", "remaining_time": "1:48:16"}
|
913 |
+
{"current_steps": 913, "total_steps": 1235, "loss": 0.0057, "lr": 7.733370226965056e-06, "epoch": 3.6963562753036436, "percentage": 73.93, "elapsed_time": "5:06:02", "remaining_time": "1:47:56"}
|
914 |
+
{"current_steps": 914, "total_steps": 1235, "loss": 0.0069, "lr": 7.688751275826527e-06, "epoch": 3.700404858299595, "percentage": 74.01, "elapsed_time": "5:06:22", "remaining_time": "1:47:35"}
|
915 |
+
{"current_steps": 915, "total_steps": 1235, "loss": 0.0059, "lr": 7.644230765104735e-06, "epoch": 3.7044534412955468, "percentage": 74.09, "elapsed_time": "5:06:42", "remaining_time": "1:47:15"}
|
916 |
+
{"current_steps": 916, "total_steps": 1235, "loss": 0.0063, "lr": 7.599809050784502e-06, "epoch": 3.708502024291498, "percentage": 74.17, "elapsed_time": "5:07:01", "remaining_time": "1:46:55"}
|
917 |
+
{"current_steps": 917, "total_steps": 1235, "loss": 0.0056, "lr": 7.555486488060661e-06, "epoch": 3.7125506072874495, "percentage": 74.25, "elapsed_time": "5:07:20", "remaining_time": "1:46:34"}
|
918 |
+
{"current_steps": 918, "total_steps": 1235, "loss": 0.0086, "lr": 7.511263431335249e-06, "epoch": 3.716599190283401, "percentage": 74.33, "elapsed_time": "5:07:42", "remaining_time": "1:46:15"}
|
919 |
+
{"current_steps": 919, "total_steps": 1235, "loss": 0.0066, "lr": 7.467140234214656e-06, "epoch": 3.720647773279352, "percentage": 74.41, "elapsed_time": "5:08:03", "remaining_time": "1:45:55"}
|
920 |
+
{"current_steps": 920, "total_steps": 1235, "loss": 0.0075, "lr": 7.423117249506777e-06, "epoch": 3.7246963562753037, "percentage": 74.49, "elapsed_time": "5:08:23", "remaining_time": "1:45:35"}
|
921 |
+
{"current_steps": 921, "total_steps": 1235, "loss": 0.006, "lr": 7.379194829218231e-06, "epoch": 3.7287449392712553, "percentage": 74.57, "elapsed_time": "5:08:43", "remaining_time": "1:45:15"}
|
922 |
+
{"current_steps": 922, "total_steps": 1235, "loss": 0.0063, "lr": 7.335373324551518e-06, "epoch": 3.7327935222672064, "percentage": 74.66, "elapsed_time": "5:09:03", "remaining_time": "1:44:55"}
|
923 |
+
{"current_steps": 923, "total_steps": 1235, "loss": 0.004, "lr": 7.291653085902224e-06, "epoch": 3.736842105263158, "percentage": 74.74, "elapsed_time": "5:09:20", "remaining_time": "1:44:33"}
|
924 |
+
{"current_steps": 924, "total_steps": 1235, "loss": 0.0062, "lr": 7.248034462856213e-06, "epoch": 3.7408906882591095, "percentage": 74.82, "elapsed_time": "5:09:40", "remaining_time": "1:44:13"}
|
925 |
+
{"current_steps": 925, "total_steps": 1235, "loss": 0.0049, "lr": 7.20451780418683e-06, "epoch": 3.7449392712550607, "percentage": 74.9, "elapsed_time": "5:10:00", "remaining_time": "1:43:53"}
|
926 |
+
{"current_steps": 926, "total_steps": 1235, "loss": 0.0051, "lr": 7.161103457852128e-06, "epoch": 3.748987854251012, "percentage": 74.98, "elapsed_time": "5:10:19", "remaining_time": "1:43:33"}
|
927 |
+
{"current_steps": 927, "total_steps": 1235, "loss": 0.0103, "lr": 7.117791770992046e-06, "epoch": 3.753036437246964, "percentage": 75.06, "elapsed_time": "5:10:39", "remaining_time": "1:43:13"}
|
928 |
+
{"current_steps": 928, "total_steps": 1235, "loss": 0.0048, "lr": 7.074583089925688e-06, "epoch": 3.757085020242915, "percentage": 75.14, "elapsed_time": "5:10:59", "remaining_time": "1:42:52"}
|
929 |
+
{"current_steps": 929, "total_steps": 1235, "loss": 0.0053, "lr": 7.0314777601485155e-06, "epoch": 3.7611336032388665, "percentage": 75.22, "elapsed_time": "5:11:19", "remaining_time": "1:42:32"}
|
930 |
+
{"current_steps": 930, "total_steps": 1235, "loss": 0.005, "lr": 6.988476126329604e-06, "epoch": 3.765182186234818, "percentage": 75.3, "elapsed_time": "5:11:39", "remaining_time": "1:42:12"}
|
931 |
+
{"current_steps": 931, "total_steps": 1235, "loss": 0.0055, "lr": 6.945578532308857e-06, "epoch": 3.769230769230769, "percentage": 75.38, "elapsed_time": "5:12:00", "remaining_time": "1:41:52"}
|
932 |
+
{"current_steps": 932, "total_steps": 1235, "loss": 0.0048, "lr": 6.902785321094301e-06, "epoch": 3.7732793522267207, "percentage": 75.47, "elapsed_time": "5:12:20", "remaining_time": "1:41:32"}
|
933 |
+
{"current_steps": 933, "total_steps": 1235, "loss": 0.0045, "lr": 6.8600968348593115e-06, "epoch": 3.7773279352226723, "percentage": 75.55, "elapsed_time": "5:12:41", "remaining_time": "1:41:12"}
|
934 |
+
{"current_steps": 934, "total_steps": 1235, "loss": 0.0043, "lr": 6.817513414939892e-06, "epoch": 3.7813765182186234, "percentage": 75.63, "elapsed_time": "5:13:01", "remaining_time": "1:40:52"}
|
935 |
+
{"current_steps": 935, "total_steps": 1235, "loss": 0.0051, "lr": 6.775035401831924e-06, "epoch": 3.785425101214575, "percentage": 75.71, "elapsed_time": "5:13:19", "remaining_time": "1:40:31"}
|
936 |
+
{"current_steps": 936, "total_steps": 1235, "loss": 0.0069, "lr": 6.732663135188473e-06, "epoch": 3.7894736842105265, "percentage": 75.79, "elapsed_time": "5:13:39", "remaining_time": "1:40:11"}
|
937 |
+
{"current_steps": 937, "total_steps": 1235, "loss": 0.0041, "lr": 6.690396953817055e-06, "epoch": 3.7935222672064777, "percentage": 75.87, "elapsed_time": "5:13:59", "remaining_time": "1:39:51"}
|
938 |
+
{"current_steps": 938, "total_steps": 1235, "loss": 0.0055, "lr": 6.648237195676927e-06, "epoch": 3.7975708502024292, "percentage": 75.95, "elapsed_time": "5:14:19", "remaining_time": "1:39:31"}
|
939 |
+
{"current_steps": 939, "total_steps": 1235, "loss": 0.005, "lr": 6.606184197876395e-06, "epoch": 3.801619433198381, "percentage": 76.03, "elapsed_time": "5:14:39", "remaining_time": "1:39:11"}
|
940 |
+
{"current_steps": 940, "total_steps": 1235, "loss": 0.005, "lr": 6.564238296670109e-06, "epoch": 3.805668016194332, "percentage": 76.11, "elapsed_time": "5:15:00", "remaining_time": "1:38:51"}
|
941 |
+
{"current_steps": 941, "total_steps": 1235, "loss": 0.0053, "lr": 6.52239982745638e-06, "epoch": 3.8097165991902835, "percentage": 76.19, "elapsed_time": "5:15:20", "remaining_time": "1:38:31"}
|
942 |
+
{"current_steps": 942, "total_steps": 1235, "loss": 0.0048, "lr": 6.480669124774484e-06, "epoch": 3.813765182186235, "percentage": 76.28, "elapsed_time": "5:15:39", "remaining_time": "1:38:11"}
|
943 |
+
{"current_steps": 943, "total_steps": 1235, "loss": 0.0048, "lr": 6.439046522302013e-06, "epoch": 3.817813765182186, "percentage": 76.36, "elapsed_time": "5:15:59", "remaining_time": "1:37:50"}
|
944 |
+
{"current_steps": 944, "total_steps": 1235, "loss": 0.0053, "lr": 6.397532352852191e-06, "epoch": 3.8218623481781377, "percentage": 76.44, "elapsed_time": "5:16:19", "remaining_time": "1:37:30"}
|
945 |
+
{"current_steps": 945, "total_steps": 1235, "loss": 0.0057, "lr": 6.356126948371202e-06, "epoch": 3.8259109311740893, "percentage": 76.52, "elapsed_time": "5:16:40", "remaining_time": "1:37:10"}
|
946 |
+
{"current_steps": 946, "total_steps": 1235, "loss": 0.0063, "lr": 6.314830639935559e-06, "epoch": 3.8299595141700404, "percentage": 76.6, "elapsed_time": "5:17:01", "remaining_time": "1:36:50"}
|
947 |
+
{"current_steps": 947, "total_steps": 1235, "loss": 0.0052, "lr": 6.273643757749448e-06, "epoch": 3.834008097165992, "percentage": 76.68, "elapsed_time": "5:17:20", "remaining_time": "1:36:30"}
|
948 |
+
{"current_steps": 948, "total_steps": 1235, "loss": 0.0041, "lr": 6.2325666311420856e-06, "epoch": 3.8380566801619436, "percentage": 76.76, "elapsed_time": "5:17:39", "remaining_time": "1:36:10"}
|
949 |
+
{"current_steps": 949, "total_steps": 1235, "loss": 0.005, "lr": 6.1915995885650675e-06, "epoch": 3.8421052631578947, "percentage": 76.84, "elapsed_time": "5:18:00", "remaining_time": "1:35:50"}
|
950 |
+
{"current_steps": 950, "total_steps": 1235, "loss": 0.0038, "lr": 6.150742957589784e-06, "epoch": 3.8461538461538463, "percentage": 76.92, "elapsed_time": "5:18:19", "remaining_time": "1:35:29"}
|
951 |
+
{"current_steps": 951, "total_steps": 1235, "loss": 0.0073, "lr": 6.109997064904774e-06, "epoch": 3.850202429149798, "percentage": 77.0, "elapsed_time": "5:18:41", "remaining_time": "1:35:10"}
|
952 |
+
{"current_steps": 952, "total_steps": 1235, "loss": 0.0042, "lr": 6.069362236313092e-06, "epoch": 3.854251012145749, "percentage": 77.09, "elapsed_time": "5:18:58", "remaining_time": "1:34:49"}
|
953 |
+
{"current_steps": 953, "total_steps": 1235, "loss": 0.0057, "lr": 6.0288387967297565e-06, "epoch": 3.8582995951417005, "percentage": 77.17, "elapsed_time": "5:19:17", "remaining_time": "1:34:28"}
|
954 |
+
{"current_steps": 954, "total_steps": 1235, "loss": 0.0041, "lr": 5.988427070179108e-06, "epoch": 3.862348178137652, "percentage": 77.25, "elapsed_time": "5:19:36", "remaining_time": "1:34:08"}
|
955 |
+
{"current_steps": 955, "total_steps": 1235, "loss": 0.003, "lr": 5.948127379792234e-06, "epoch": 3.866396761133603, "percentage": 77.33, "elapsed_time": "5:19:53", "remaining_time": "1:33:47"}
|
956 |
+
{"current_steps": 956, "total_steps": 1235, "loss": 0.0056, "lr": 5.90794004780439e-06, "epoch": 3.8704453441295548, "percentage": 77.41, "elapsed_time": "5:20:13", "remaining_time": "1:33:27"}
|
957 |
+
{"current_steps": 957, "total_steps": 1235, "loss": 0.0039, "lr": 5.867865395552405e-06, "epoch": 3.8744939271255063, "percentage": 77.49, "elapsed_time": "5:20:35", "remaining_time": "1:33:07"}
|
958 |
+
{"current_steps": 958, "total_steps": 1235, "loss": 0.0035, "lr": 5.8279037434721364e-06, "epoch": 3.8785425101214575, "percentage": 77.57, "elapsed_time": "5:20:55", "remaining_time": "1:32:47"}
|
959 |
+
{"current_steps": 959, "total_steps": 1235, "loss": 0.0042, "lr": 5.788055411095892e-06, "epoch": 3.882591093117409, "percentage": 77.65, "elapsed_time": "5:21:15", "remaining_time": "1:32:27"}
|
960 |
+
{"current_steps": 960, "total_steps": 1235, "loss": 0.0035, "lr": 5.7483207170498625e-06, "epoch": 3.8866396761133606, "percentage": 77.73, "elapsed_time": "5:21:33", "remaining_time": "1:32:06"}
|
961 |
+
{"current_steps": 961, "total_steps": 1235, "loss": 0.007, "lr": 5.708699979051613e-06, "epoch": 3.8906882591093117, "percentage": 77.81, "elapsed_time": "5:21:55", "remaining_time": "1:31:47"}
|
962 |
+
{"current_steps": 962, "total_steps": 1235, "loss": 0.0041, "lr": 5.66919351390751e-06, "epoch": 3.8947368421052633, "percentage": 77.89, "elapsed_time": "5:22:14", "remaining_time": "1:31:26"}
|
963 |
+
{"current_steps": 963, "total_steps": 1235, "loss": 0.0047, "lr": 5.629801637510188e-06, "epoch": 3.898785425101215, "percentage": 77.98, "elapsed_time": "5:22:35", "remaining_time": "1:31:06"}
|
964 |
+
{"current_steps": 964, "total_steps": 1235, "loss": 0.0041, "lr": 5.590524664836043e-06, "epoch": 3.902834008097166, "percentage": 78.06, "elapsed_time": "5:22:54", "remaining_time": "1:30:46"}
|
965 |
+
{"current_steps": 965, "total_steps": 1235, "loss": 0.0038, "lr": 5.551362909942708e-06, "epoch": 3.9068825910931175, "percentage": 78.14, "elapsed_time": "5:23:15", "remaining_time": "1:30:26"}
|
966 |
+
{"current_steps": 966, "total_steps": 1235, "loss": 0.0053, "lr": 5.51231668596653e-06, "epoch": 3.910931174089069, "percentage": 78.22, "elapsed_time": "5:23:35", "remaining_time": "1:30:06"}
|
967 |
+
{"current_steps": 967, "total_steps": 1235, "loss": 0.0036, "lr": 5.47338630512007e-06, "epoch": 3.91497975708502, "percentage": 78.3, "elapsed_time": "5:23:55", "remaining_time": "1:29:46"}
|
968 |
+
{"current_steps": 968, "total_steps": 1235, "loss": 0.0037, "lr": 5.434572078689617e-06, "epoch": 3.919028340080972, "percentage": 78.38, "elapsed_time": "5:24:15", "remaining_time": "1:29:26"}
|
969 |
+
{"current_steps": 969, "total_steps": 1235, "loss": 0.0051, "lr": 5.395874317032694e-06, "epoch": 3.9230769230769234, "percentage": 78.46, "elapsed_time": "5:24:34", "remaining_time": "1:29:05"}
|
970 |
+
{"current_steps": 970, "total_steps": 1235, "loss": 0.0035, "lr": 5.357293329575573e-06, "epoch": 3.9271255060728745, "percentage": 78.54, "elapsed_time": "5:24:51", "remaining_time": "1:28:45"}
|
971 |
+
{"current_steps": 971, "total_steps": 1235, "loss": 0.0045, "lr": 5.318829424810797e-06, "epoch": 3.931174089068826, "percentage": 78.62, "elapsed_time": "5:25:11", "remaining_time": "1:28:24"}
|
972 |
+
{"current_steps": 972, "total_steps": 1235, "loss": 0.0058, "lr": 5.280482910294728e-06, "epoch": 3.9352226720647776, "percentage": 78.7, "elapsed_time": "5:25:34", "remaining_time": "1:28:05"}
|
973 |
+
{"current_steps": 973, "total_steps": 1235, "loss": 0.0035, "lr": 5.242254092645078e-06, "epoch": 3.9392712550607287, "percentage": 78.79, "elapsed_time": "5:25:54", "remaining_time": "1:27:45"}
|
974 |
+
{"current_steps": 974, "total_steps": 1235, "loss": 0.0031, "lr": 5.2041432775384445e-06, "epoch": 3.9433198380566803, "percentage": 78.87, "elapsed_time": "5:26:13", "remaining_time": "1:27:25"}
|
975 |
+
{"current_steps": 975, "total_steps": 1235, "loss": 0.0033, "lr": 5.166150769707892e-06, "epoch": 3.9473684210526314, "percentage": 78.95, "elapsed_time": "5:26:30", "remaining_time": "1:27:04"}
|
976 |
+
{"current_steps": 976, "total_steps": 1235, "loss": 0.0042, "lr": 5.128276872940503e-06, "epoch": 3.951417004048583, "percentage": 79.03, "elapsed_time": "5:26:51", "remaining_time": "1:26:44"}
|
977 |
+
{"current_steps": 977, "total_steps": 1235, "loss": 0.0033, "lr": 5.090521890074953e-06, "epoch": 3.9554655870445345, "percentage": 79.11, "elapsed_time": "5:27:12", "remaining_time": "1:26:24"}
|
978 |
+
{"current_steps": 978, "total_steps": 1235, "loss": 0.0028, "lr": 5.0528861229990675e-06, "epoch": 3.9595141700404857, "percentage": 79.19, "elapsed_time": "5:27:32", "remaining_time": "1:26:04"}
|
979 |
+
{"current_steps": 979, "total_steps": 1235, "loss": 0.0032, "lr": 5.015369872647442e-06, "epoch": 3.9635627530364372, "percentage": 79.27, "elapsed_time": "5:27:51", "remaining_time": "1:25:44"}
|
980 |
+
{"current_steps": 980, "total_steps": 1235, "loss": 0.003, "lr": 4.9779734389990195e-06, "epoch": 3.967611336032389, "percentage": 79.35, "elapsed_time": "5:28:11", "remaining_time": "1:25:23"}
|
981 |
+
{"current_steps": 981, "total_steps": 1235, "loss": 0.0042, "lr": 4.940697121074675e-06, "epoch": 3.97165991902834, "percentage": 79.43, "elapsed_time": "5:28:33", "remaining_time": "1:25:04"}
|
982 |
+
{"current_steps": 982, "total_steps": 1235, "loss": 0.0036, "lr": 4.903541216934864e-06, "epoch": 3.9757085020242915, "percentage": 79.51, "elapsed_time": "5:28:52", "remaining_time": "1:24:43"}
|
983 |
+
{"current_steps": 983, "total_steps": 1235, "loss": 0.0036, "lr": 4.8665060236772e-06, "epoch": 3.979757085020243, "percentage": 79.6, "elapsed_time": "5:29:13", "remaining_time": "1:24:24"}
|
984 |
+
{"current_steps": 984, "total_steps": 1235, "loss": 0.0028, "lr": 4.829591837434102e-06, "epoch": 3.983805668016194, "percentage": 79.68, "elapsed_time": "5:29:31", "remaining_time": "1:24:03"}
|
985 |
+
{"current_steps": 985, "total_steps": 1235, "loss": 0.0035, "lr": 4.792798953370424e-06, "epoch": 3.9878542510121457, "percentage": 79.76, "elapsed_time": "5:29:48", "remaining_time": "1:23:42"}
|
986 |
+
{"current_steps": 986, "total_steps": 1235, "loss": 0.0023, "lr": 4.756127665681083e-06, "epoch": 3.9919028340080973, "percentage": 79.84, "elapsed_time": "5:30:07", "remaining_time": "1:23:22"}
|
987 |
+
{"current_steps": 987, "total_steps": 1235, "loss": 0.0033, "lr": 4.719578267588725e-06, "epoch": 3.9959514170040484, "percentage": 79.92, "elapsed_time": "5:30:27", "remaining_time": "1:23:02"}
|
988 |
+
{"current_steps": 988, "total_steps": 1235, "loss": 0.0026, "lr": 4.6831510513413525e-06, "epoch": 4.0, "percentage": 80.0, "elapsed_time": "5:30:47", "remaining_time": "1:22:41"}
|
989 |
+
{"current_steps": 989, "total_steps": 1235, "loss": 0.0016, "lr": 4.6468463082100176e-06, "epoch": 4.004048582995951, "percentage": 80.08, "elapsed_time": "5:32:43", "remaining_time": "1:22:45"}
|
990 |
+
{"current_steps": 990, "total_steps": 1235, "loss": 0.0018, "lr": 4.610664328486485e-06, "epoch": 4.008097165991903, "percentage": 80.16, "elapsed_time": "5:33:03", "remaining_time": "1:22:25"}
|
991 |
+
{"current_steps": 991, "total_steps": 1235, "loss": 0.0017, "lr": 4.5746054014809e-06, "epoch": 4.012145748987854, "percentage": 80.24, "elapsed_time": "5:33:25", "remaining_time": "1:22:05"}
|
992 |
+
{"current_steps": 992, "total_steps": 1235, "loss": 0.0021, "lr": 4.5386698155194766e-06, "epoch": 4.016194331983805, "percentage": 80.32, "elapsed_time": "5:33:44", "remaining_time": "1:21:45"}
|
993 |
+
{"current_steps": 993, "total_steps": 1235, "loss": 0.0022, "lr": 4.502857857942204e-06, "epoch": 4.020242914979757, "percentage": 80.4, "elapsed_time": "5:34:05", "remaining_time": "1:21:25"}
|
994 |
+
{"current_steps": 994, "total_steps": 1235, "loss": 0.0018, "lr": 4.467169815100549e-06, "epoch": 4.0242914979757085, "percentage": 80.49, "elapsed_time": "5:34:27", "remaining_time": "1:21:05"}
|
995 |
+
{"current_steps": 995, "total_steps": 1235, "loss": 0.0021, "lr": 4.431605972355137e-06, "epoch": 4.02834008097166, "percentage": 80.57, "elapsed_time": "5:34:47", "remaining_time": "1:20:45"}
|
996 |
+
{"current_steps": 996, "total_steps": 1235, "loss": 0.0012, "lr": 4.396166614073516e-06, "epoch": 4.032388663967612, "percentage": 80.65, "elapsed_time": "5:35:04", "remaining_time": "1:20:24"}
|
997 |
+
{"current_steps": 997, "total_steps": 1235, "loss": 0.0015, "lr": 4.360852023627846e-06, "epoch": 4.036437246963563, "percentage": 80.73, "elapsed_time": "5:35:22", "remaining_time": "1:20:03"}
|
998 |
+
{"current_steps": 998, "total_steps": 1235, "loss": 0.0012, "lr": 4.325662483392656e-06, "epoch": 4.040485829959514, "percentage": 80.81, "elapsed_time": "5:35:40", "remaining_time": "1:19:42"}
|
999 |
+
{"current_steps": 999, "total_steps": 1235, "loss": 0.0015, "lr": 4.29059827474257e-06, "epoch": 4.044534412955466, "percentage": 80.89, "elapsed_time": "5:36:01", "remaining_time": "1:19:22"}
|
1000 |
+
{"current_steps": 1000, "total_steps": 1235, "loss": 0.0021, "lr": 4.255659678050063e-06, "epoch": 4.048582995951417, "percentage": 80.97, "elapsed_time": "5:36:21", "remaining_time": "1:19:02"}
|
1001 |
+
{"current_steps": 1001, "total_steps": 1235, "loss": 0.0019, "lr": 4.22084697268323e-06, "epoch": 4.052631578947368, "percentage": 81.05, "elapsed_time": "5:36:42", "remaining_time": "1:18:42"}
|
1002 |
+
{"current_steps": 1002, "total_steps": 1235, "loss": 0.0014, "lr": 4.186160437003535e-06, "epoch": 4.05668016194332, "percentage": 81.13, "elapsed_time": "5:37:05", "remaining_time": "1:18:23"}
|
1003 |
+
{"current_steps": 1003, "total_steps": 1235, "loss": 0.0017, "lr": 4.151600348363582e-06, "epoch": 4.060728744939271, "percentage": 81.21, "elapsed_time": "5:37:25", "remaining_time": "1:18:02"}
|
1004 |
+
{"current_steps": 1004, "total_steps": 1235, "loss": 0.0016, "lr": 4.11716698310493e-06, "epoch": 4.064777327935222, "percentage": 81.3, "elapsed_time": "5:37:45", "remaining_time": "1:17:42"}
|
1005 |
+
{"current_steps": 1005, "total_steps": 1235, "loss": 0.0017, "lr": 4.082860616555848e-06, "epoch": 4.068825910931174, "percentage": 81.38, "elapsed_time": "5:38:03", "remaining_time": "1:17:21"}
|
1006 |
+
{"current_steps": 1006, "total_steps": 1235, "loss": 0.0017, "lr": 4.048681523029125e-06, "epoch": 4.0728744939271255, "percentage": 81.46, "elapsed_time": "5:38:25", "remaining_time": "1:17:02"}
|
1007 |
+
{"current_steps": 1007, "total_steps": 1235, "loss": 0.0015, "lr": 4.014629975819882e-06, "epoch": 4.076923076923077, "percentage": 81.54, "elapsed_time": "5:38:45", "remaining_time": "1:16:41"}
|
1008 |
+
{"current_steps": 1008, "total_steps": 1235, "loss": 0.0014, "lr": 3.9807062472033855e-06, "epoch": 4.080971659919029, "percentage": 81.62, "elapsed_time": "5:39:07", "remaining_time": "1:16:22"}
|
1009 |
+
{"current_steps": 1009, "total_steps": 1235, "loss": 0.0017, "lr": 3.94691060843287e-06, "epoch": 4.08502024291498, "percentage": 81.7, "elapsed_time": "5:39:27", "remaining_time": "1:16:02"}
|
1010 |
+
{"current_steps": 1010, "total_steps": 1235, "loss": 0.0016, "lr": 3.913243329737353e-06, "epoch": 4.089068825910931, "percentage": 81.78, "elapsed_time": "5:39:46", "remaining_time": "1:15:41"}
|
1011 |
+
{"current_steps": 1011, "total_steps": 1235, "loss": 0.0012, "lr": 3.879704680319503e-06, "epoch": 4.093117408906883, "percentage": 81.86, "elapsed_time": "5:40:06", "remaining_time": "1:15:21"}
|
1012 |
+
{"current_steps": 1012, "total_steps": 1235, "loss": 0.0016, "lr": 3.846294928353471e-06, "epoch": 4.097165991902834, "percentage": 81.94, "elapsed_time": "5:40:26", "remaining_time": "1:15:01"}
|
1013 |
+
{"current_steps": 1013, "total_steps": 1235, "loss": 0.0012, "lr": 3.8130143409827345e-06, "epoch": 4.101214574898785, "percentage": 82.02, "elapsed_time": "5:40:44", "remaining_time": "1:14:40"}
|
1014 |
+
{"current_steps": 1014, "total_steps": 1235, "loss": 0.0016, "lr": 3.7798631843179887e-06, "epoch": 4.105263157894737, "percentage": 82.11, "elapsed_time": "5:41:00", "remaining_time": "1:14:19"}
|
1015 |
+
{"current_steps": 1015, "total_steps": 1235, "loss": 0.0017, "lr": 3.7468417234349973e-06, "epoch": 4.109311740890688, "percentage": 82.19, "elapsed_time": "5:41:24", "remaining_time": "1:13:59"}
|
1016 |
+
{"current_steps": 1016, "total_steps": 1235, "loss": 0.0017, "lr": 3.7139502223724823e-06, "epoch": 4.113360323886639, "percentage": 82.27, "elapsed_time": "5:41:43", "remaining_time": "1:13:39"}
|
1017 |
+
{"current_steps": 1017, "total_steps": 1235, "loss": 0.0012, "lr": 3.6811889441300095e-06, "epoch": 4.117408906882591, "percentage": 82.35, "elapsed_time": "5:42:01", "remaining_time": "1:13:18"}
|
1018 |
+
{"current_steps": 1018, "total_steps": 1235, "loss": 0.0016, "lr": 3.648558150665886e-06, "epoch": 4.1214574898785425, "percentage": 82.43, "elapsed_time": "5:42:22", "remaining_time": "1:12:58"}
|
1019 |
+
{"current_steps": 1019, "total_steps": 1235, "loss": 0.0013, "lr": 3.616058102895075e-06, "epoch": 4.125506072874494, "percentage": 82.51, "elapsed_time": "5:42:41", "remaining_time": "1:12:38"}
|
1020 |
+
{"current_steps": 1020, "total_steps": 1235, "loss": 0.0014, "lr": 3.583689060687079e-06, "epoch": 4.129554655870446, "percentage": 82.59, "elapsed_time": "5:42:59", "remaining_time": "1:12:17"}
|
1021 |
+
{"current_steps": 1021, "total_steps": 1235, "loss": 0.0011, "lr": 3.5514512828639023e-06, "epoch": 4.133603238866397, "percentage": 82.67, "elapsed_time": "5:43:18", "remaining_time": "1:11:57"}
|
1022 |
+
{"current_steps": 1022, "total_steps": 1235, "loss": 0.0023, "lr": 3.51934502719796e-06, "epoch": 4.137651821862348, "percentage": 82.75, "elapsed_time": "5:43:40", "remaining_time": "1:11:37"}
|
1023 |
+
{"current_steps": 1023, "total_steps": 1235, "loss": 0.0011, "lr": 3.4873705504100185e-06, "epoch": 4.1417004048583, "percentage": 82.83, "elapsed_time": "5:44:00", "remaining_time": "1:11:17"}
|
1024 |
+
{"current_steps": 1024, "total_steps": 1235, "loss": 0.0013, "lr": 3.4555281081671345e-06, "epoch": 4.145748987854251, "percentage": 82.91, "elapsed_time": "5:44:22", "remaining_time": "1:10:57"}
|
1025 |
+
{"current_steps": 1025, "total_steps": 1235, "loss": 0.0014, "lr": 3.4238179550806326e-06, "epoch": 4.149797570850202, "percentage": 83.0, "elapsed_time": "5:44:43", "remaining_time": "1:10:37"}
|
1026 |
+
{"current_steps": 1026, "total_steps": 1235, "loss": 0.0011, "lr": 3.3922403447040497e-06, "epoch": 4.153846153846154, "percentage": 83.08, "elapsed_time": "5:45:01", "remaining_time": "1:10:17"}
|
1027 |
+
{"current_steps": 1027, "total_steps": 1235, "loss": 0.0015, "lr": 3.3607955295311247e-06, "epoch": 4.157894736842105, "percentage": 83.16, "elapsed_time": "5:45:21", "remaining_time": "1:09:56"}
|
1028 |
+
{"current_steps": 1028, "total_steps": 1235, "loss": 0.0013, "lr": 3.32948376099375e-06, "epoch": 4.161943319838056, "percentage": 83.24, "elapsed_time": "5:45:41", "remaining_time": "1:09:36"}
|
1029 |
+
{"current_steps": 1029, "total_steps": 1235, "loss": 0.001, "lr": 3.2983052894599976e-06, "epoch": 4.165991902834008, "percentage": 83.32, "elapsed_time": "5:46:02", "remaining_time": "1:09:16"}
|
1030 |
+
{"current_steps": 1030, "total_steps": 1235, "loss": 0.0019, "lr": 3.2672603642320945e-06, "epoch": 4.17004048582996, "percentage": 83.4, "elapsed_time": "5:46:22", "remaining_time": "1:08:56"}
|
1031 |
+
{"current_steps": 1031, "total_steps": 1235, "loss": 0.0012, "lr": 3.236349233544438e-06, "epoch": 4.174089068825911, "percentage": 83.48, "elapsed_time": "5:46:44", "remaining_time": "1:08:36"}
|
1032 |
+
{"current_steps": 1032, "total_steps": 1235, "loss": 0.0016, "lr": 3.205572144561604e-06, "epoch": 4.178137651821863, "percentage": 83.56, "elapsed_time": "5:47:03", "remaining_time": "1:08:16"}
|
1033 |
+
{"current_steps": 1033, "total_steps": 1235, "loss": 0.0013, "lr": 3.174929343376374e-06, "epoch": 4.182186234817814, "percentage": 83.64, "elapsed_time": "5:47:22", "remaining_time": "1:07:55"}
|
1034 |
+
{"current_steps": 1034, "total_steps": 1235, "loss": 0.0015, "lr": 3.1444210750077777e-06, "epoch": 4.186234817813765, "percentage": 83.72, "elapsed_time": "5:47:43", "remaining_time": "1:07:35"}
|
1035 |
+
{"current_steps": 1035, "total_steps": 1235, "loss": 0.0013, "lr": 3.1140475833991046e-06, "epoch": 4.190283400809717, "percentage": 83.81, "elapsed_time": "5:48:04", "remaining_time": "1:07:15"}
|
1036 |
+
{"current_steps": 1036, "total_steps": 1235, "loss": 0.0017, "lr": 3.0838091114159895e-06, "epoch": 4.194331983805668, "percentage": 83.89, "elapsed_time": "5:48:25", "remaining_time": "1:06:55"}
|
1037 |
+
{"current_steps": 1037, "total_steps": 1235, "loss": 0.0017, "lr": 3.0537059008444524e-06, "epoch": 4.198380566801619, "percentage": 83.97, "elapsed_time": "5:48:45", "remaining_time": "1:06:35"}
|
1038 |
+
{"current_steps": 1038, "total_steps": 1235, "loss": 0.0012, "lr": 3.0237381923889563e-06, "epoch": 4.202429149797571, "percentage": 84.05, "elapsed_time": "5:49:03", "remaining_time": "1:06:14"}
|
1039 |
+
{"current_steps": 1039, "total_steps": 1235, "loss": 0.0012, "lr": 2.9939062256704997e-06, "epoch": 4.206477732793522, "percentage": 84.13, "elapsed_time": "5:49:22", "remaining_time": "1:05:54"}
|
1040 |
+
{"current_steps": 1040, "total_steps": 1235, "loss": 0.0019, "lr": 2.964210239224696e-06, "epoch": 4.2105263157894735, "percentage": 84.21, "elapsed_time": "5:49:41", "remaining_time": "1:05:34"}
|
1041 |
+
{"current_steps": 1041, "total_steps": 1235, "loss": 0.0016, "lr": 2.934650470499869e-06, "epoch": 4.2145748987854255, "percentage": 84.29, "elapsed_time": "5:50:01", "remaining_time": "1:05:13"}
|
1042 |
+
{"current_steps": 1042, "total_steps": 1235, "loss": 0.0015, "lr": 2.905227155855128e-06, "epoch": 4.218623481781377, "percentage": 84.37, "elapsed_time": "5:50:19", "remaining_time": "1:04:53"}
|
1043 |
+
{"current_steps": 1043, "total_steps": 1235, "loss": 0.0014, "lr": 2.875940530558519e-06, "epoch": 4.222672064777328, "percentage": 84.45, "elapsed_time": "5:50:40", "remaining_time": "1:04:33"}
|
1044 |
+
{"current_steps": 1044, "total_steps": 1235, "loss": 0.0008, "lr": 2.8467908287851154e-06, "epoch": 4.22672064777328, "percentage": 84.53, "elapsed_time": "5:50:58", "remaining_time": "1:04:12"}
|
1045 |
+
{"current_steps": 1045, "total_steps": 1235, "loss": 0.0014, "lr": 2.8177782836151603e-06, "epoch": 4.230769230769231, "percentage": 84.62, "elapsed_time": "5:51:20", "remaining_time": "1:03:52"}
|
1046 |
+
{"current_steps": 1046, "total_steps": 1235, "loss": 0.0014, "lr": 2.7889031270321874e-06, "epoch": 4.234817813765182, "percentage": 84.7, "elapsed_time": "5:51:38", "remaining_time": "1:03:32"}
|
1047 |
+
{"current_steps": 1047, "total_steps": 1235, "loss": 0.0009, "lr": 2.760165589921184e-06, "epoch": 4.238866396761134, "percentage": 84.78, "elapsed_time": "5:51:58", "remaining_time": "1:03:11"}
|
1048 |
+
{"current_steps": 1048, "total_steps": 1235, "loss": 0.0013, "lr": 2.7315659020667305e-06, "epoch": 4.242914979757085, "percentage": 84.86, "elapsed_time": "5:52:17", "remaining_time": "1:02:51"}
|
1049 |
+
{"current_steps": 1049, "total_steps": 1235, "loss": 0.0015, "lr": 2.703104292151164e-06, "epoch": 4.246963562753036, "percentage": 84.94, "elapsed_time": "5:52:39", "remaining_time": "1:02:31"}
|
1050 |
+
{"current_steps": 1050, "total_steps": 1235, "loss": 0.0019, "lr": 2.6747809877527607e-06, "epoch": 4.251012145748988, "percentage": 85.02, "elapsed_time": "5:52:59", "remaining_time": "1:02:11"}
|
1051 |
+
{"current_steps": 1051, "total_steps": 1235, "loss": 0.0012, "lr": 2.6465962153439082e-06, "epoch": 4.255060728744939, "percentage": 85.1, "elapsed_time": "5:53:17", "remaining_time": "1:01:51"}
|
1052 |
+
{"current_steps": 1052, "total_steps": 1235, "loss": 0.0014, "lr": 2.618550200289303e-06, "epoch": 4.2591093117408905, "percentage": 85.18, "elapsed_time": "5:53:34", "remaining_time": "1:01:30"}
|
1053 |
+
{"current_steps": 1053, "total_steps": 1235, "loss": 0.001, "lr": 2.59064316684412e-06, "epoch": 4.2631578947368425, "percentage": 85.26, "elapsed_time": "5:53:52", "remaining_time": "1:01:09"}
|
1054 |
+
{"current_steps": 1054, "total_steps": 1235, "loss": 0.0016, "lr": 2.562875338152264e-06, "epoch": 4.267206477732794, "percentage": 85.34, "elapsed_time": "5:54:13", "remaining_time": "1:00:49"}
|
1055 |
+
{"current_steps": 1055, "total_steps": 1235, "loss": 0.0014, "lr": 2.5352469362445552e-06, "epoch": 4.271255060728745, "percentage": 85.43, "elapsed_time": "5:54:31", "remaining_time": "1:00:29"}
|