Training in progress, step 600
Browse files- model-00001-of-00006.safetensors +1 -1
- model-00002-of-00006.safetensors +1 -1
- model-00003-of-00006.safetensors +1 -1
- model-00004-of-00006.safetensors +1 -1
- model-00005-of-00006.safetensors +1 -1
- model-00006-of-00006.safetensors +1 -1
- trainer_log.jsonl +51 -251
- training_args.bin +1 -1
model-00001-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4933656472
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f2777087bbcd133c6e507c2669ceaffd7a3cb3bb12c12286fe93cb1765f029f
|
3 |
size 4933656472
|
model-00002-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4954690712
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03b17d3bb165127e2c8a824b11b2fcf9495696900e53cd809421ba0aaa3a7443
|
3 |
size 4954690712
|
model-00003-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4902241352
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:298c26ed2b3898ab3416ca53c67b73f198b06074b5861c7215a071159c703218
|
3 |
size 4902241352
|
model-00004-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4771169120
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6adf1ad69c7689be879be78b514105e062f4bc01b78199b462692190a1a3cbc
|
3 |
size 4771169120
|
model-00005-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4771169120
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a77a448273a4f1ae0309e1a0cf13ef22e13a5219068768bbac7c54026d94c0a3
|
3 |
size 4771169120
|
model-00006-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4986116216
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e772c73805283d90e378e998fef03495c960a32c2e787f029936fbf998e0a25
|
3 |
size 4986116216
|
trainer_log.jsonl
CHANGED
@@ -1,251 +1,51 @@
|
|
1 |
-
{"current_steps":
|
2 |
-
{"current_steps":
|
3 |
-
{"current_steps":
|
4 |
-
{"current_steps":
|
5 |
-
{"current_steps":
|
6 |
-
{"current_steps":
|
7 |
-
{"current_steps":
|
8 |
-
{"current_steps":
|
9 |
-
{"current_steps":
|
10 |
-
{"current_steps":
|
11 |
-
{"current_steps":
|
12 |
-
{"current_steps":
|
13 |
-
{"current_steps":
|
14 |
-
{"current_steps":
|
15 |
-
{"current_steps":
|
16 |
-
{"current_steps":
|
17 |
-
{"current_steps":
|
18 |
-
{"current_steps":
|
19 |
-
{"current_steps":
|
20 |
-
{"current_steps":
|
21 |
-
{"current_steps":
|
22 |
-
{"current_steps":
|
23 |
-
{"current_steps":
|
24 |
-
{"current_steps":
|
25 |
-
{"current_steps":
|
26 |
-
{"current_steps":
|
27 |
-
{"current_steps":
|
28 |
-
{"current_steps":
|
29 |
-
{"current_steps":
|
30 |
-
{"current_steps":
|
31 |
-
{"current_steps":
|
32 |
-
{"current_steps":
|
33 |
-
{"current_steps":
|
34 |
-
{"current_steps":
|
35 |
-
{"current_steps":
|
36 |
-
{"current_steps":
|
37 |
-
{"current_steps":
|
38 |
-
{"current_steps":
|
39 |
-
{"current_steps":
|
40 |
-
{"current_steps":
|
41 |
-
{"current_steps":
|
42 |
-
{"current_steps":
|
43 |
-
{"current_steps":
|
44 |
-
{"current_steps":
|
45 |
-
{"current_steps":
|
46 |
-
{"current_steps":
|
47 |
-
{"current_steps":
|
48 |
-
{"current_steps":
|
49 |
-
{"current_steps":
|
50 |
-
{"current_steps":
|
51 |
-
{"current_steps":
|
52 |
-
{"current_steps": 352, "total_steps": 550, "loss": 1.7456, "lr": 1e-05, "epoch": 0.6398545785048853, "percentage": 64.0, "elapsed_time": "2:44:32", "remaining_time": "1:32:33"}
|
53 |
-
{"current_steps": 353, "total_steps": 550, "loss": 1.7494, "lr": 1e-05, "epoch": 0.6416723471938196, "percentage": 64.18, "elapsed_time": "2:47:41", "remaining_time": "1:33:34"}
|
54 |
-
{"current_steps": 354, "total_steps": 550, "loss": 1.743, "lr": 1e-05, "epoch": 0.643490115882754, "percentage": 64.36, "elapsed_time": "2:50:50", "remaining_time": "1:34:35"}
|
55 |
-
{"current_steps": 355, "total_steps": 550, "loss": 1.7478, "lr": 1e-05, "epoch": 0.6453078845716883, "percentage": 64.55, "elapsed_time": "2:53:58", "remaining_time": "1:35:34"}
|
56 |
-
{"current_steps": 356, "total_steps": 550, "loss": 1.7535, "lr": 1e-05, "epoch": 0.6471256532606225, "percentage": 64.73, "elapsed_time": "2:57:08", "remaining_time": "1:36:31"}
|
57 |
-
{"current_steps": 357, "total_steps": 550, "loss": 1.759, "lr": 1e-05, "epoch": 0.6489434219495569, "percentage": 64.91, "elapsed_time": "3:00:17", "remaining_time": "1:37:28"}
|
58 |
-
{"current_steps": 358, "total_steps": 550, "loss": 1.755, "lr": 1e-05, "epoch": 0.6507611906384912, "percentage": 65.09, "elapsed_time": "3:03:27", "remaining_time": "1:38:23"}
|
59 |
-
{"current_steps": 359, "total_steps": 550, "loss": 1.7597, "lr": 1e-05, "epoch": 0.6525789593274256, "percentage": 65.27, "elapsed_time": "3:06:36", "remaining_time": "1:39:16"}
|
60 |
-
{"current_steps": 360, "total_steps": 550, "loss": 1.7468, "lr": 1e-05, "epoch": 0.65439672801636, "percentage": 65.45, "elapsed_time": "3:09:47", "remaining_time": "1:40:10"}
|
61 |
-
{"current_steps": 361, "total_steps": 550, "loss": 1.7468, "lr": 1e-05, "epoch": 0.6562144967052943, "percentage": 65.64, "elapsed_time": "3:12:57", "remaining_time": "1:41:01"}
|
62 |
-
{"current_steps": 362, "total_steps": 550, "loss": 1.7477, "lr": 1e-05, "epoch": 0.6580322653942285, "percentage": 65.82, "elapsed_time": "3:16:07", "remaining_time": "1:41:51"}
|
63 |
-
{"current_steps": 363, "total_steps": 550, "loss": 1.7643, "lr": 1e-05, "epoch": 0.6598500340831629, "percentage": 66.0, "elapsed_time": "3:19:17", "remaining_time": "1:42:40"}
|
64 |
-
{"current_steps": 364, "total_steps": 550, "loss": 1.7514, "lr": 1e-05, "epoch": 0.6616678027720972, "percentage": 66.18, "elapsed_time": "3:22:28", "remaining_time": "1:43:27"}
|
65 |
-
{"current_steps": 365, "total_steps": 550, "loss": 1.7581, "lr": 1e-05, "epoch": 0.6634855714610316, "percentage": 66.36, "elapsed_time": "3:25:38", "remaining_time": "1:44:13"}
|
66 |
-
{"current_steps": 366, "total_steps": 550, "loss": 1.7455, "lr": 1e-05, "epoch": 0.665303340149966, "percentage": 66.55, "elapsed_time": "3:28:47", "remaining_time": "1:44:57"}
|
67 |
-
{"current_steps": 367, "total_steps": 550, "loss": 1.7483, "lr": 1e-05, "epoch": 0.6671211088389003, "percentage": 66.73, "elapsed_time": "3:31:55", "remaining_time": "1:45:40"}
|
68 |
-
{"current_steps": 368, "total_steps": 550, "loss": 1.7512, "lr": 1e-05, "epoch": 0.6689388775278345, "percentage": 66.91, "elapsed_time": "3:35:04", "remaining_time": "1:46:22"}
|
69 |
-
{"current_steps": 369, "total_steps": 550, "loss": 1.7528, "lr": 1e-05, "epoch": 0.6707566462167689, "percentage": 67.09, "elapsed_time": "3:38:14", "remaining_time": "1:47:03"}
|
70 |
-
{"current_steps": 370, "total_steps": 550, "loss": 1.7446, "lr": 1e-05, "epoch": 0.6725744149057032, "percentage": 67.27, "elapsed_time": "3:41:24", "remaining_time": "1:47:42"}
|
71 |
-
{"current_steps": 371, "total_steps": 550, "loss": 1.7533, "lr": 1e-05, "epoch": 0.6743921835946376, "percentage": 67.45, "elapsed_time": "3:44:33", "remaining_time": "1:48:20"}
|
72 |
-
{"current_steps": 372, "total_steps": 550, "loss": 1.7512, "lr": 1e-05, "epoch": 0.676209952283572, "percentage": 67.64, "elapsed_time": "3:47:44", "remaining_time": "1:48:58"}
|
73 |
-
{"current_steps": 373, "total_steps": 550, "loss": 1.7533, "lr": 1e-05, "epoch": 0.6780277209725063, "percentage": 67.82, "elapsed_time": "3:50:53", "remaining_time": "1:49:33"}
|
74 |
-
{"current_steps": 374, "total_steps": 550, "loss": 1.7468, "lr": 1e-05, "epoch": 0.6798454896614405, "percentage": 68.0, "elapsed_time": "3:54:01", "remaining_time": "1:50:07"}
|
75 |
-
{"current_steps": 375, "total_steps": 550, "loss": 1.7514, "lr": 1e-05, "epoch": 0.6816632583503749, "percentage": 68.18, "elapsed_time": "3:57:10", "remaining_time": "1:50:40"}
|
76 |
-
{"current_steps": 376, "total_steps": 550, "loss": 1.746, "lr": 1e-05, "epoch": 0.6834810270393092, "percentage": 68.36, "elapsed_time": "4:00:19", "remaining_time": "1:51:12"}
|
77 |
-
{"current_steps": 377, "total_steps": 550, "loss": 1.7472, "lr": 1e-05, "epoch": 0.6852987957282436, "percentage": 68.55, "elapsed_time": "4:03:27", "remaining_time": "1:51:43"}
|
78 |
-
{"current_steps": 378, "total_steps": 550, "loss": 1.7445, "lr": 1e-05, "epoch": 0.6871165644171779, "percentage": 68.73, "elapsed_time": "4:06:37", "remaining_time": "1:52:13"}
|
79 |
-
{"current_steps": 379, "total_steps": 550, "loss": 1.7575, "lr": 1e-05, "epoch": 0.6889343331061123, "percentage": 68.91, "elapsed_time": "4:09:47", "remaining_time": "1:52:42"}
|
80 |
-
{"current_steps": 380, "total_steps": 550, "loss": 1.7478, "lr": 1e-05, "epoch": 0.6907521017950465, "percentage": 69.09, "elapsed_time": "4:12:56", "remaining_time": "1:53:09"}
|
81 |
-
{"current_steps": 381, "total_steps": 550, "loss": 1.7577, "lr": 1e-05, "epoch": 0.6925698704839809, "percentage": 69.27, "elapsed_time": "4:16:06", "remaining_time": "1:53:36"}
|
82 |
-
{"current_steps": 382, "total_steps": 550, "loss": 1.7516, "lr": 1e-05, "epoch": 0.6943876391729152, "percentage": 69.45, "elapsed_time": "4:19:16", "remaining_time": "1:54:01"}
|
83 |
-
{"current_steps": 383, "total_steps": 550, "loss": 1.7488, "lr": 1e-05, "epoch": 0.6962054078618496, "percentage": 69.64, "elapsed_time": "4:22:25", "remaining_time": "1:54:25"}
|
84 |
-
{"current_steps": 384, "total_steps": 550, "loss": 1.7545, "lr": 1e-05, "epoch": 0.6980231765507839, "percentage": 69.82, "elapsed_time": "4:25:35", "remaining_time": "1:54:48"}
|
85 |
-
{"current_steps": 385, "total_steps": 550, "loss": 1.7533, "lr": 1e-05, "epoch": 0.6998409452397183, "percentage": 70.0, "elapsed_time": "4:28:45", "remaining_time": "1:55:11"}
|
86 |
-
{"current_steps": 386, "total_steps": 550, "loss": 1.7521, "lr": 1e-05, "epoch": 0.7016587139286525, "percentage": 70.18, "elapsed_time": "4:31:55", "remaining_time": "1:55:31"}
|
87 |
-
{"current_steps": 387, "total_steps": 550, "loss": 1.7548, "lr": 1e-05, "epoch": 0.7034764826175869, "percentage": 70.36, "elapsed_time": "4:35:03", "remaining_time": "1:55:51"}
|
88 |
-
{"current_steps": 388, "total_steps": 550, "loss": 1.7443, "lr": 1e-05, "epoch": 0.7052942513065212, "percentage": 70.55, "elapsed_time": "4:38:13", "remaining_time": "1:56:09"}
|
89 |
-
{"current_steps": 389, "total_steps": 550, "loss": 1.7515, "lr": 1e-05, "epoch": 0.7071120199954556, "percentage": 70.73, "elapsed_time": "4:41:22", "remaining_time": "1:56:27"}
|
90 |
-
{"current_steps": 390, "total_steps": 550, "loss": 1.7478, "lr": 1e-05, "epoch": 0.7089297886843899, "percentage": 70.91, "elapsed_time": "4:44:32", "remaining_time": "1:56:44"}
|
91 |
-
{"current_steps": 391, "total_steps": 550, "loss": 1.7487, "lr": 1e-05, "epoch": 0.7107475573733243, "percentage": 71.09, "elapsed_time": "4:47:41", "remaining_time": "1:56:59"}
|
92 |
-
{"current_steps": 392, "total_steps": 550, "loss": 1.7539, "lr": 1e-05, "epoch": 0.7125653260622585, "percentage": 71.27, "elapsed_time": "4:50:50", "remaining_time": "1:57:13"}
|
93 |
-
{"current_steps": 393, "total_steps": 550, "loss": 1.7488, "lr": 1e-05, "epoch": 0.7143830947511929, "percentage": 71.45, "elapsed_time": "4:53:59", "remaining_time": "1:57:26"}
|
94 |
-
{"current_steps": 394, "total_steps": 550, "loss": 1.7448, "lr": 1e-05, "epoch": 0.7162008634401272, "percentage": 71.64, "elapsed_time": "4:57:08", "remaining_time": "1:57:38"}
|
95 |
-
{"current_steps": 395, "total_steps": 550, "loss": 1.7399, "lr": 1e-05, "epoch": 0.7180186321290616, "percentage": 71.82, "elapsed_time": "5:00:18", "remaining_time": "1:57:50"}
|
96 |
-
{"current_steps": 396, "total_steps": 550, "loss": 1.7566, "lr": 1e-05, "epoch": 0.7198364008179959, "percentage": 72.0, "elapsed_time": "5:03:28", "remaining_time": "1:58:01"}
|
97 |
-
{"current_steps": 397, "total_steps": 550, "loss": 1.751, "lr": 1e-05, "epoch": 0.7216541695069303, "percentage": 72.18, "elapsed_time": "5:06:38", "remaining_time": "1:58:10"}
|
98 |
-
{"current_steps": 398, "total_steps": 550, "loss": 1.7474, "lr": 1e-05, "epoch": 0.7234719381958645, "percentage": 72.36, "elapsed_time": "5:09:48", "remaining_time": "1:58:18"}
|
99 |
-
{"current_steps": 399, "total_steps": 550, "loss": 1.7492, "lr": 1e-05, "epoch": 0.7252897068847989, "percentage": 72.55, "elapsed_time": "5:12:58", "remaining_time": "1:58:26"}
|
100 |
-
{"current_steps": 400, "total_steps": 550, "loss": 1.7571, "lr": 1e-05, "epoch": 0.7271074755737332, "percentage": 72.73, "elapsed_time": "5:16:08", "remaining_time": "1:58:33"}
|
101 |
-
{"current_steps": 401, "total_steps": 550, "loss": 1.7426, "lr": 1e-05, "epoch": 0.7289252442626676, "percentage": 72.91, "elapsed_time": "5:22:24", "remaining_time": "1:59:47"}
|
102 |
-
{"current_steps": 402, "total_steps": 550, "loss": 1.7564, "lr": 1e-05, "epoch": 0.7307430129516019, "percentage": 73.09, "elapsed_time": "5:25:34", "remaining_time": "1:59:51"}
|
103 |
-
{"current_steps": 403, "total_steps": 550, "loss": 1.7495, "lr": 1e-05, "epoch": 0.7325607816405363, "percentage": 73.27, "elapsed_time": "5:28:41", "remaining_time": "1:59:53"}
|
104 |
-
{"current_steps": 404, "total_steps": 550, "loss": 1.7479, "lr": 1e-05, "epoch": 0.7343785503294705, "percentage": 73.45, "elapsed_time": "5:31:49", "remaining_time": "1:59:54"}
|
105 |
-
{"current_steps": 405, "total_steps": 550, "loss": 1.7475, "lr": 1e-05, "epoch": 0.7361963190184049, "percentage": 73.64, "elapsed_time": "5:34:55", "remaining_time": "1:59:54"}
|
106 |
-
{"current_steps": 406, "total_steps": 550, "loss": 1.7517, "lr": 1e-05, "epoch": 0.7380140877073392, "percentage": 73.82, "elapsed_time": "5:38:03", "remaining_time": "1:59:54"}
|
107 |
-
{"current_steps": 407, "total_steps": 550, "loss": 1.7556, "lr": 1e-05, "epoch": 0.7398318563962736, "percentage": 74.0, "elapsed_time": "5:41:10", "remaining_time": "1:59:52"}
|
108 |
-
{"current_steps": 408, "total_steps": 550, "loss": 1.7394, "lr": 1e-05, "epoch": 0.7416496250852079, "percentage": 74.18, "elapsed_time": "5:44:17", "remaining_time": "1:59:49"}
|
109 |
-
{"current_steps": 409, "total_steps": 550, "loss": 1.7483, "lr": 1e-05, "epoch": 0.7434673937741423, "percentage": 74.36, "elapsed_time": "5:47:26", "remaining_time": "1:59:46"}
|
110 |
-
{"current_steps": 410, "total_steps": 550, "loss": 1.7483, "lr": 1e-05, "epoch": 0.7452851624630765, "percentage": 74.55, "elapsed_time": "5:50:34", "remaining_time": "1:59:42"}
|
111 |
-
{"current_steps": 411, "total_steps": 550, "loss": 1.7522, "lr": 1e-05, "epoch": 0.7471029311520109, "percentage": 74.73, "elapsed_time": "5:53:41", "remaining_time": "1:59:37"}
|
112 |
-
{"current_steps": 412, "total_steps": 550, "loss": 1.7478, "lr": 1e-05, "epoch": 0.7489206998409452, "percentage": 74.91, "elapsed_time": "5:56:50", "remaining_time": "1:59:31"}
|
113 |
-
{"current_steps": 413, "total_steps": 550, "loss": 1.7475, "lr": 1e-05, "epoch": 0.7507384685298796, "percentage": 75.09, "elapsed_time": "5:59:57", "remaining_time": "1:59:24"}
|
114 |
-
{"current_steps": 414, "total_steps": 550, "loss": 1.7523, "lr": 1e-05, "epoch": 0.7525562372188139, "percentage": 75.27, "elapsed_time": "6:03:06", "remaining_time": "1:59:16"}
|
115 |
-
{"current_steps": 415, "total_steps": 550, "loss": 1.7422, "lr": 1e-05, "epoch": 0.7543740059077483, "percentage": 75.45, "elapsed_time": "6:06:13", "remaining_time": "1:59:08"}
|
116 |
-
{"current_steps": 416, "total_steps": 550, "loss": 1.7484, "lr": 1e-05, "epoch": 0.7561917745966825, "percentage": 75.64, "elapsed_time": "6:09:21", "remaining_time": "1:58:58"}
|
117 |
-
{"current_steps": 417, "total_steps": 550, "loss": 1.7543, "lr": 1e-05, "epoch": 0.7580095432856169, "percentage": 75.82, "elapsed_time": "6:12:29", "remaining_time": "1:58:48"}
|
118 |
-
{"current_steps": 418, "total_steps": 550, "loss": 1.7511, "lr": 1e-05, "epoch": 0.7598273119745512, "percentage": 76.0, "elapsed_time": "6:15:37", "remaining_time": "1:58:37"}
|
119 |
-
{"current_steps": 419, "total_steps": 550, "loss": 1.747, "lr": 1e-05, "epoch": 0.7616450806634856, "percentage": 76.18, "elapsed_time": "6:18:47", "remaining_time": "1:58:25"}
|
120 |
-
{"current_steps": 420, "total_steps": 550, "loss": 1.741, "lr": 1e-05, "epoch": 0.7634628493524199, "percentage": 76.36, "elapsed_time": "6:21:57", "remaining_time": "1:58:13"}
|
121 |
-
{"current_steps": 421, "total_steps": 550, "loss": 1.7427, "lr": 1e-05, "epoch": 0.7652806180413543, "percentage": 76.55, "elapsed_time": "6:25:07", "remaining_time": "1:58:00"}
|
122 |
-
{"current_steps": 422, "total_steps": 550, "loss": 1.7413, "lr": 1e-05, "epoch": 0.7670983867302885, "percentage": 76.73, "elapsed_time": "6:28:16", "remaining_time": "1:57:46"}
|
123 |
-
{"current_steps": 423, "total_steps": 550, "loss": 1.7483, "lr": 1e-05, "epoch": 0.7689161554192229, "percentage": 76.91, "elapsed_time": "6:31:27", "remaining_time": "1:57:31"}
|
124 |
-
{"current_steps": 424, "total_steps": 550, "loss": 1.7463, "lr": 1e-05, "epoch": 0.7707339241081572, "percentage": 77.09, "elapsed_time": "6:34:36", "remaining_time": "1:57:15"}
|
125 |
-
{"current_steps": 425, "total_steps": 550, "loss": 1.7482, "lr": 1e-05, "epoch": 0.7725516927970916, "percentage": 77.27, "elapsed_time": "6:37:45", "remaining_time": "1:56:59"}
|
126 |
-
{"current_steps": 426, "total_steps": 550, "loss": 1.7517, "lr": 1e-05, "epoch": 0.7743694614860259, "percentage": 77.45, "elapsed_time": "6:40:53", "remaining_time": "1:56:41"}
|
127 |
-
{"current_steps": 427, "total_steps": 550, "loss": 1.7437, "lr": 1e-05, "epoch": 0.7761872301749603, "percentage": 77.64, "elapsed_time": "6:44:02", "remaining_time": "1:56:23"}
|
128 |
-
{"current_steps": 428, "total_steps": 550, "loss": 1.7479, "lr": 1e-05, "epoch": 0.7780049988638945, "percentage": 77.82, "elapsed_time": "6:47:12", "remaining_time": "1:56:04"}
|
129 |
-
{"current_steps": 429, "total_steps": 550, "loss": 1.7438, "lr": 1e-05, "epoch": 0.7798227675528289, "percentage": 78.0, "elapsed_time": "6:50:20", "remaining_time": "1:55:44"}
|
130 |
-
{"current_steps": 430, "total_steps": 550, "loss": 1.743, "lr": 1e-05, "epoch": 0.7816405362417632, "percentage": 78.18, "elapsed_time": "6:53:30", "remaining_time": "1:55:23"}
|
131 |
-
{"current_steps": 431, "total_steps": 550, "loss": 1.7521, "lr": 1e-05, "epoch": 0.7834583049306976, "percentage": 78.36, "elapsed_time": "6:56:39", "remaining_time": "1:55:02"}
|
132 |
-
{"current_steps": 432, "total_steps": 550, "loss": 1.7489, "lr": 1e-05, "epoch": 0.7852760736196319, "percentage": 78.55, "elapsed_time": "6:59:50", "remaining_time": "1:54:40"}
|
133 |
-
{"current_steps": 433, "total_steps": 550, "loss": 1.7483, "lr": 1e-05, "epoch": 0.7870938423085663, "percentage": 78.73, "elapsed_time": "7:02:58", "remaining_time": "1:54:17"}
|
134 |
-
{"current_steps": 434, "total_steps": 550, "loss": 1.7454, "lr": 1e-05, "epoch": 0.7889116109975006, "percentage": 78.91, "elapsed_time": "7:06:07", "remaining_time": "1:53:53"}
|
135 |
-
{"current_steps": 435, "total_steps": 550, "loss": 1.7447, "lr": 1e-05, "epoch": 0.7907293796864349, "percentage": 79.09, "elapsed_time": "7:09:16", "remaining_time": "1:53:29"}
|
136 |
-
{"current_steps": 436, "total_steps": 550, "loss": 1.7465, "lr": 1e-05, "epoch": 0.7925471483753692, "percentage": 79.27, "elapsed_time": "7:12:26", "remaining_time": "1:53:04"}
|
137 |
-
{"current_steps": 437, "total_steps": 550, "loss": 1.7437, "lr": 1e-05, "epoch": 0.7943649170643036, "percentage": 79.45, "elapsed_time": "7:15:35", "remaining_time": "1:52:38"}
|
138 |
-
{"current_steps": 438, "total_steps": 550, "loss": 1.7432, "lr": 1e-05, "epoch": 0.7961826857532379, "percentage": 79.64, "elapsed_time": "7:18:44", "remaining_time": "1:52:11"}
|
139 |
-
{"current_steps": 439, "total_steps": 550, "loss": 1.7363, "lr": 1e-05, "epoch": 0.7980004544421723, "percentage": 79.82, "elapsed_time": "7:21:53", "remaining_time": "1:51:43"}
|
140 |
-
{"current_steps": 440, "total_steps": 550, "loss": 1.7509, "lr": 1e-05, "epoch": 0.7998182231311066, "percentage": 80.0, "elapsed_time": "7:25:03", "remaining_time": "1:51:15"}
|
141 |
-
{"current_steps": 441, "total_steps": 550, "loss": 1.7446, "lr": 1e-05, "epoch": 0.8016359918200409, "percentage": 80.18, "elapsed_time": "7:28:13", "remaining_time": "1:50:47"}
|
142 |
-
{"current_steps": 442, "total_steps": 550, "loss": 1.7491, "lr": 1e-05, "epoch": 0.8034537605089752, "percentage": 80.36, "elapsed_time": "7:31:23", "remaining_time": "1:50:17"}
|
143 |
-
{"current_steps": 443, "total_steps": 550, "loss": 1.7408, "lr": 1e-05, "epoch": 0.8052715291979096, "percentage": 80.55, "elapsed_time": "7:34:32", "remaining_time": "1:49:47"}
|
144 |
-
{"current_steps": 444, "total_steps": 550, "loss": 1.7485, "lr": 1e-05, "epoch": 0.8070892978868439, "percentage": 80.73, "elapsed_time": "7:37:41", "remaining_time": "1:49:16"}
|
145 |
-
{"current_steps": 445, "total_steps": 550, "loss": 1.7507, "lr": 1e-05, "epoch": 0.8089070665757783, "percentage": 80.91, "elapsed_time": "7:40:50", "remaining_time": "1:48:44"}
|
146 |
-
{"current_steps": 446, "total_steps": 550, "loss": 1.7508, "lr": 1e-05, "epoch": 0.8107248352647126, "percentage": 81.09, "elapsed_time": "7:43:59", "remaining_time": "1:48:11"}
|
147 |
-
{"current_steps": 447, "total_steps": 550, "loss": 1.745, "lr": 1e-05, "epoch": 0.8125426039536469, "percentage": 81.27, "elapsed_time": "7:47:08", "remaining_time": "1:47:38"}
|
148 |
-
{"current_steps": 448, "total_steps": 550, "loss": 1.7564, "lr": 1e-05, "epoch": 0.8143603726425812, "percentage": 81.45, "elapsed_time": "7:50:18", "remaining_time": "1:47:04"}
|
149 |
-
{"current_steps": 449, "total_steps": 550, "loss": 1.7491, "lr": 1e-05, "epoch": 0.8161781413315156, "percentage": 81.64, "elapsed_time": "7:53:27", "remaining_time": "1:46:30"}
|
150 |
-
{"current_steps": 450, "total_steps": 550, "loss": 1.7534, "lr": 1e-05, "epoch": 0.8179959100204499, "percentage": 81.82, "elapsed_time": "7:56:36", "remaining_time": "1:45:54"}
|
151 |
-
{"current_steps": 451, "total_steps": 550, "loss": 1.734, "lr": 1e-05, "epoch": 0.8198136787093843, "percentage": 82.0, "elapsed_time": "7:59:47", "remaining_time": "1:45:19"}
|
152 |
-
{"current_steps": 452, "total_steps": 550, "loss": 1.748, "lr": 1e-05, "epoch": 0.8216314473983186, "percentage": 82.18, "elapsed_time": "8:02:56", "remaining_time": "1:44:42"}
|
153 |
-
{"current_steps": 453, "total_steps": 550, "loss": 1.7581, "lr": 1e-05, "epoch": 0.8234492160872529, "percentage": 82.36, "elapsed_time": "8:06:05", "remaining_time": "1:44:05"}
|
154 |
-
{"current_steps": 454, "total_steps": 550, "loss": 1.7483, "lr": 1e-05, "epoch": 0.8252669847761872, "percentage": 82.55, "elapsed_time": "8:09:14", "remaining_time": "1:43:27"}
|
155 |
-
{"current_steps": 455, "total_steps": 550, "loss": 1.753, "lr": 1e-05, "epoch": 0.8270847534651216, "percentage": 82.73, "elapsed_time": "8:12:22", "remaining_time": "1:42:48"}
|
156 |
-
{"current_steps": 456, "total_steps": 550, "loss": 1.7509, "lr": 1e-05, "epoch": 0.8289025221540559, "percentage": 82.91, "elapsed_time": "8:15:32", "remaining_time": "1:42:08"}
|
157 |
-
{"current_steps": 457, "total_steps": 550, "loss": 1.7421, "lr": 1e-05, "epoch": 0.8307202908429903, "percentage": 83.09, "elapsed_time": "8:18:43", "remaining_time": "1:41:29"}
|
158 |
-
{"current_steps": 458, "total_steps": 550, "loss": 1.7531, "lr": 1e-05, "epoch": 0.8325380595319246, "percentage": 83.27, "elapsed_time": "8:21:52", "remaining_time": "1:40:48"}
|
159 |
-
{"current_steps": 459, "total_steps": 550, "loss": 1.7453, "lr": 1e-05, "epoch": 0.8343558282208589, "percentage": 83.45, "elapsed_time": "8:25:04", "remaining_time": "1:40:08"}
|
160 |
-
{"current_steps": 460, "total_steps": 550, "loss": 1.7468, "lr": 1e-05, "epoch": 0.8361735969097932, "percentage": 83.64, "elapsed_time": "8:28:16", "remaining_time": "1:39:26"}
|
161 |
-
{"current_steps": 461, "total_steps": 550, "loss": 1.7496, "lr": 1e-05, "epoch": 0.8379913655987276, "percentage": 83.82, "elapsed_time": "8:31:27", "remaining_time": "1:38:44"}
|
162 |
-
{"current_steps": 462, "total_steps": 550, "loss": 1.7485, "lr": 1e-05, "epoch": 0.8398091342876619, "percentage": 84.0, "elapsed_time": "8:34:40", "remaining_time": "1:38:01"}
|
163 |
-
{"current_steps": 463, "total_steps": 550, "loss": 1.7405, "lr": 1e-05, "epoch": 0.8416269029765963, "percentage": 84.18, "elapsed_time": "8:37:50", "remaining_time": "1:37:18"}
|
164 |
-
{"current_steps": 464, "total_steps": 550, "loss": 1.7464, "lr": 1e-05, "epoch": 0.8434446716655306, "percentage": 84.36, "elapsed_time": "8:40:58", "remaining_time": "1:36:33"}
|
165 |
-
{"current_steps": 465, "total_steps": 550, "loss": 1.7564, "lr": 1e-05, "epoch": 0.8452624403544649, "percentage": 84.55, "elapsed_time": "8:44:06", "remaining_time": "1:35:48"}
|
166 |
-
{"current_steps": 466, "total_steps": 550, "loss": 1.745, "lr": 1e-05, "epoch": 0.8470802090433992, "percentage": 84.73, "elapsed_time": "8:47:16", "remaining_time": "1:35:02"}
|
167 |
-
{"current_steps": 467, "total_steps": 550, "loss": 1.741, "lr": 1e-05, "epoch": 0.8488979777323336, "percentage": 84.91, "elapsed_time": "8:50:27", "remaining_time": "1:34:16"}
|
168 |
-
{"current_steps": 468, "total_steps": 550, "loss": 1.7553, "lr": 1e-05, "epoch": 0.8507157464212679, "percentage": 85.09, "elapsed_time": "8:53:36", "remaining_time": "1:33:29"}
|
169 |
-
{"current_steps": 469, "total_steps": 550, "loss": 1.734, "lr": 1e-05, "epoch": 0.8525335151102023, "percentage": 85.27, "elapsed_time": "8:56:45", "remaining_time": "1:32:42"}
|
170 |
-
{"current_steps": 470, "total_steps": 550, "loss": 1.7443, "lr": 1e-05, "epoch": 0.8543512837991366, "percentage": 85.45, "elapsed_time": "8:59:54", "remaining_time": "1:31:53"}
|
171 |
-
{"current_steps": 471, "total_steps": 550, "loss": 1.7496, "lr": 1e-05, "epoch": 0.8561690524880708, "percentage": 85.64, "elapsed_time": "9:03:03", "remaining_time": "1:31:05"}
|
172 |
-
{"current_steps": 472, "total_steps": 550, "loss": 1.7444, "lr": 1e-05, "epoch": 0.8579868211770052, "percentage": 85.82, "elapsed_time": "9:06:13", "remaining_time": "1:30:15"}
|
173 |
-
{"current_steps": 473, "total_steps": 550, "loss": 1.7436, "lr": 1e-05, "epoch": 0.8598045898659396, "percentage": 86.0, "elapsed_time": "9:09:22", "remaining_time": "1:29:26"}
|
174 |
-
{"current_steps": 474, "total_steps": 550, "loss": 1.7488, "lr": 1e-05, "epoch": 0.8616223585548739, "percentage": 86.18, "elapsed_time": "9:12:32", "remaining_time": "1:28:35"}
|
175 |
-
{"current_steps": 475, "total_steps": 550, "loss": 1.7406, "lr": 1e-05, "epoch": 0.8634401272438083, "percentage": 86.36, "elapsed_time": "9:15:40", "remaining_time": "1:27:44"}
|
176 |
-
{"current_steps": 476, "total_steps": 550, "loss": 1.7463, "lr": 1e-05, "epoch": 0.8652578959327426, "percentage": 86.55, "elapsed_time": "9:18:49", "remaining_time": "1:26:52"}
|
177 |
-
{"current_steps": 477, "total_steps": 550, "loss": 1.751, "lr": 1e-05, "epoch": 0.8670756646216768, "percentage": 86.73, "elapsed_time": "9:21:58", "remaining_time": "1:26:00"}
|
178 |
-
{"current_steps": 478, "total_steps": 550, "loss": 1.7402, "lr": 1e-05, "epoch": 0.8688934333106112, "percentage": 86.91, "elapsed_time": "9:25:08", "remaining_time": "1:25:07"}
|
179 |
-
{"current_steps": 479, "total_steps": 550, "loss": 1.7457, "lr": 1e-05, "epoch": 0.8707112019995455, "percentage": 87.09, "elapsed_time": "9:28:18", "remaining_time": "1:24:14"}
|
180 |
-
{"current_steps": 480, "total_steps": 550, "loss": 1.7453, "lr": 1e-05, "epoch": 0.8725289706884799, "percentage": 87.27, "elapsed_time": "9:31:27", "remaining_time": "1:23:20"}
|
181 |
-
{"current_steps": 481, "total_steps": 550, "loss": 1.7386, "lr": 1e-05, "epoch": 0.8743467393774143, "percentage": 87.45, "elapsed_time": "9:34:36", "remaining_time": "1:22:25"}
|
182 |
-
{"current_steps": 482, "total_steps": 550, "loss": 1.7412, "lr": 1e-05, "epoch": 0.8761645080663486, "percentage": 87.64, "elapsed_time": "9:37:45", "remaining_time": "1:21:30"}
|
183 |
-
{"current_steps": 483, "total_steps": 550, "loss": 1.7462, "lr": 1e-05, "epoch": 0.8779822767552828, "percentage": 87.82, "elapsed_time": "9:40:55", "remaining_time": "1:20:35"}
|
184 |
-
{"current_steps": 484, "total_steps": 550, "loss": 1.7443, "lr": 1e-05, "epoch": 0.8798000454442172, "percentage": 88.0, "elapsed_time": "9:44:04", "remaining_time": "1:19:38"}
|
185 |
-
{"current_steps": 485, "total_steps": 550, "loss": 1.7345, "lr": 1e-05, "epoch": 0.8816178141331515, "percentage": 88.18, "elapsed_time": "9:47:14", "remaining_time": "1:18:42"}
|
186 |
-
{"current_steps": 486, "total_steps": 550, "loss": 1.7425, "lr": 1e-05, "epoch": 0.8834355828220859, "percentage": 88.36, "elapsed_time": "9:50:23", "remaining_time": "1:17:44"}
|
187 |
-
{"current_steps": 487, "total_steps": 550, "loss": 1.746, "lr": 1e-05, "epoch": 0.8852533515110202, "percentage": 88.55, "elapsed_time": "9:53:32", "remaining_time": "1:16:46"}
|
188 |
-
{"current_steps": 488, "total_steps": 550, "loss": 1.7327, "lr": 1e-05, "epoch": 0.8870711201999546, "percentage": 88.73, "elapsed_time": "9:56:41", "remaining_time": "1:15:48"}
|
189 |
-
{"current_steps": 489, "total_steps": 550, "loss": 1.7385, "lr": 1e-05, "epoch": 0.8888888888888888, "percentage": 88.91, "elapsed_time": "9:59:50", "remaining_time": "1:14:49"}
|
190 |
-
{"current_steps": 490, "total_steps": 550, "loss": 1.7405, "lr": 1e-05, "epoch": 0.8907066575778232, "percentage": 89.09, "elapsed_time": "10:03:00", "remaining_time": "1:13:50"}
|
191 |
-
{"current_steps": 491, "total_steps": 550, "loss": 1.748, "lr": 1e-05, "epoch": 0.8925244262667575, "percentage": 89.27, "elapsed_time": "10:06:09", "remaining_time": "1:12:50"}
|
192 |
-
{"current_steps": 492, "total_steps": 550, "loss": 1.7465, "lr": 1e-05, "epoch": 0.8943421949556919, "percentage": 89.45, "elapsed_time": "10:09:18", "remaining_time": "1:11:49"}
|
193 |
-
{"current_steps": 493, "total_steps": 550, "loss": 1.7331, "lr": 1e-05, "epoch": 0.8961599636446262, "percentage": 89.64, "elapsed_time": "10:12:28", "remaining_time": "1:10:48"}
|
194 |
-
{"current_steps": 494, "total_steps": 550, "loss": 1.7383, "lr": 1e-05, "epoch": 0.8979777323335606, "percentage": 89.82, "elapsed_time": "10:15:37", "remaining_time": "1:09:47"}
|
195 |
-
{"current_steps": 495, "total_steps": 550, "loss": 1.7416, "lr": 1e-05, "epoch": 0.8997955010224948, "percentage": 90.0, "elapsed_time": "10:18:46", "remaining_time": "1:08:45"}
|
196 |
-
{"current_steps": 496, "total_steps": 550, "loss": 1.742, "lr": 1e-05, "epoch": 0.9016132697114292, "percentage": 90.18, "elapsed_time": "10:21:55", "remaining_time": "1:07:42"}
|
197 |
-
{"current_steps": 497, "total_steps": 550, "loss": 1.7397, "lr": 1e-05, "epoch": 0.9034310384003635, "percentage": 90.36, "elapsed_time": "10:25:05", "remaining_time": "1:06:39"}
|
198 |
-
{"current_steps": 498, "total_steps": 550, "loss": 1.7511, "lr": 1e-05, "epoch": 0.9052488070892979, "percentage": 90.55, "elapsed_time": "10:28:14", "remaining_time": "1:05:35"}
|
199 |
-
{"current_steps": 499, "total_steps": 550, "loss": 1.7468, "lr": 1e-05, "epoch": 0.9070665757782322, "percentage": 90.73, "elapsed_time": "10:31:23", "remaining_time": "1:04:31"}
|
200 |
-
{"current_steps": 500, "total_steps": 550, "loss": 1.7327, "lr": 1e-05, "epoch": 0.9088843444671666, "percentage": 90.91, "elapsed_time": "10:34:32", "remaining_time": "1:03:27"}
|
201 |
-
{"current_steps": 501, "total_steps": 550, "loss": 1.7454, "lr": 1e-05, "epoch": 0.9107021131561008, "percentage": 91.09, "elapsed_time": "10:40:46", "remaining_time": "1:02:40"}
|
202 |
-
{"current_steps": 502, "total_steps": 550, "loss": 1.7476, "lr": 1e-05, "epoch": 0.9125198818450352, "percentage": 91.27, "elapsed_time": "10:43:57", "remaining_time": "1:01:34"}
|
203 |
-
{"current_steps": 503, "total_steps": 550, "loss": 1.7461, "lr": 1e-05, "epoch": 0.9143376505339695, "percentage": 91.45, "elapsed_time": "10:47:05", "remaining_time": "1:00:27"}
|
204 |
-
{"current_steps": 504, "total_steps": 550, "loss": 1.7361, "lr": 1e-05, "epoch": 0.9161554192229039, "percentage": 91.64, "elapsed_time": "10:50:12", "remaining_time": "0:59:20"}
|
205 |
-
{"current_steps": 505, "total_steps": 550, "loss": 1.7441, "lr": 1e-05, "epoch": 0.9179731879118382, "percentage": 91.82, "elapsed_time": "10:53:22", "remaining_time": "0:58:13"}
|
206 |
-
{"current_steps": 506, "total_steps": 550, "loss": 1.742, "lr": 1e-05, "epoch": 0.9197909566007726, "percentage": 92.0, "elapsed_time": "10:56:30", "remaining_time": "0:57:05"}
|
207 |
-
{"current_steps": 507, "total_steps": 550, "loss": 1.7391, "lr": 1e-05, "epoch": 0.9216087252897068, "percentage": 92.18, "elapsed_time": "10:59:38", "remaining_time": "0:55:56"}
|
208 |
-
{"current_steps": 508, "total_steps": 550, "loss": 1.7405, "lr": 1e-05, "epoch": 0.9234264939786412, "percentage": 92.36, "elapsed_time": "11:02:46", "remaining_time": "0:54:47"}
|
209 |
-
{"current_steps": 509, "total_steps": 550, "loss": 1.7458, "lr": 1e-05, "epoch": 0.9252442626675755, "percentage": 92.55, "elapsed_time": "11:05:55", "remaining_time": "0:53:38"}
|
210 |
-
{"current_steps": 510, "total_steps": 550, "loss": 1.7351, "lr": 1e-05, "epoch": 0.9270620313565099, "percentage": 92.73, "elapsed_time": "11:09:04", "remaining_time": "0:52:28"}
|
211 |
-
{"current_steps": 511, "total_steps": 550, "loss": 1.7397, "lr": 1e-05, "epoch": 0.9288798000454442, "percentage": 92.91, "elapsed_time": "11:12:12", "remaining_time": "0:51:18"}
|
212 |
-
{"current_steps": 512, "total_steps": 550, "loss": 1.7471, "lr": 1e-05, "epoch": 0.9306975687343786, "percentage": 93.09, "elapsed_time": "11:15:21", "remaining_time": "0:50:07"}
|
213 |
-
{"current_steps": 513, "total_steps": 550, "loss": 1.7454, "lr": 1e-05, "epoch": 0.9325153374233128, "percentage": 93.27, "elapsed_time": "11:18:34", "remaining_time": "0:48:56"}
|
214 |
-
{"current_steps": 514, "total_steps": 550, "loss": 1.7375, "lr": 1e-05, "epoch": 0.9343331061122472, "percentage": 93.45, "elapsed_time": "11:21:43", "remaining_time": "0:47:44"}
|
215 |
-
{"current_steps": 515, "total_steps": 550, "loss": 1.7394, "lr": 1e-05, "epoch": 0.9361508748011815, "percentage": 93.64, "elapsed_time": "11:24:53", "remaining_time": "0:46:32"}
|
216 |
-
{"current_steps": 516, "total_steps": 550, "loss": 1.7452, "lr": 1e-05, "epoch": 0.9379686434901159, "percentage": 93.82, "elapsed_time": "11:28:03", "remaining_time": "0:45:20"}
|
217 |
-
{"current_steps": 517, "total_steps": 550, "loss": 1.7441, "lr": 1e-05, "epoch": 0.9397864121790502, "percentage": 94.0, "elapsed_time": "11:31:12", "remaining_time": "0:44:07"}
|
218 |
-
{"current_steps": 518, "total_steps": 550, "loss": 1.7417, "lr": 1e-05, "epoch": 0.9416041808679846, "percentage": 94.18, "elapsed_time": "11:34:21", "remaining_time": "0:42:53"}
|
219 |
-
{"current_steps": 519, "total_steps": 550, "loss": 1.7428, "lr": 1e-05, "epoch": 0.9434219495569189, "percentage": 94.36, "elapsed_time": "11:37:32", "remaining_time": "0:41:39"}
|
220 |
-
{"current_steps": 520, "total_steps": 550, "loss": 1.7345, "lr": 1e-05, "epoch": 0.9452397182458532, "percentage": 94.55, "elapsed_time": "11:40:42", "remaining_time": "0:40:25"}
|
221 |
-
{"current_steps": 521, "total_steps": 550, "loss": 1.7362, "lr": 1e-05, "epoch": 0.9470574869347875, "percentage": 94.73, "elapsed_time": "11:43:51", "remaining_time": "0:39:10"}
|
222 |
-
{"current_steps": 522, "total_steps": 550, "loss": 1.7355, "lr": 1e-05, "epoch": 0.9488752556237219, "percentage": 94.91, "elapsed_time": "11:47:03", "remaining_time": "0:37:55"}
|
223 |
-
{"current_steps": 523, "total_steps": 550, "loss": 1.7468, "lr": 1e-05, "epoch": 0.9506930243126562, "percentage": 95.09, "elapsed_time": "11:50:13", "remaining_time": "0:36:39"}
|
224 |
-
{"current_steps": 524, "total_steps": 550, "loss": 1.7422, "lr": 1e-05, "epoch": 0.9525107930015906, "percentage": 95.27, "elapsed_time": "11:53:21", "remaining_time": "0:35:23"}
|
225 |
-
{"current_steps": 525, "total_steps": 550, "loss": 1.7393, "lr": 1e-05, "epoch": 0.9543285616905249, "percentage": 95.45, "elapsed_time": "11:56:31", "remaining_time": "0:34:07"}
|
226 |
-
{"current_steps": 526, "total_steps": 550, "loss": 1.7341, "lr": 1e-05, "epoch": 0.9561463303794592, "percentage": 95.64, "elapsed_time": "11:59:39", "remaining_time": "0:32:50"}
|
227 |
-
{"current_steps": 527, "total_steps": 550, "loss": 1.7428, "lr": 1e-05, "epoch": 0.9579640990683935, "percentage": 95.82, "elapsed_time": "12:02:49", "remaining_time": "0:31:32"}
|
228 |
-
{"current_steps": 528, "total_steps": 550, "loss": 1.7496, "lr": 1e-05, "epoch": 0.9597818677573279, "percentage": 96.0, "elapsed_time": "12:05:59", "remaining_time": "0:30:14"}
|
229 |
-
{"current_steps": 529, "total_steps": 550, "loss": 1.7413, "lr": 1e-05, "epoch": 0.9615996364462622, "percentage": 96.18, "elapsed_time": "12:09:09", "remaining_time": "0:28:56"}
|
230 |
-
{"current_steps": 530, "total_steps": 550, "loss": 1.7395, "lr": 1e-05, "epoch": 0.9634174051351966, "percentage": 96.36, "elapsed_time": "12:12:19", "remaining_time": "0:27:38"}
|
231 |
-
{"current_steps": 531, "total_steps": 550, "loss": 1.7342, "lr": 1e-05, "epoch": 0.9652351738241309, "percentage": 96.55, "elapsed_time": "12:15:28", "remaining_time": "0:26:18"}
|
232 |
-
{"current_steps": 532, "total_steps": 550, "loss": 1.7384, "lr": 1e-05, "epoch": 0.9670529425130652, "percentage": 96.73, "elapsed_time": "12:18:37", "remaining_time": "0:24:59"}
|
233 |
-
{"current_steps": 533, "total_steps": 550, "loss": 1.7425, "lr": 1e-05, "epoch": 0.9688707112019995, "percentage": 96.91, "elapsed_time": "12:21:45", "remaining_time": "0:23:39"}
|
234 |
-
{"current_steps": 534, "total_steps": 550, "loss": 1.7521, "lr": 1e-05, "epoch": 0.9706884798909339, "percentage": 97.09, "elapsed_time": "12:24:54", "remaining_time": "0:22:19"}
|
235 |
-
{"current_steps": 535, "total_steps": 550, "loss": 1.7455, "lr": 1e-05, "epoch": 0.9725062485798682, "percentage": 97.27, "elapsed_time": "12:28:04", "remaining_time": "0:20:58"}
|
236 |
-
{"current_steps": 536, "total_steps": 550, "loss": 1.7509, "lr": 1e-05, "epoch": 0.9743240172688026, "percentage": 97.45, "elapsed_time": "12:31:14", "remaining_time": "0:19:37"}
|
237 |
-
{"current_steps": 537, "total_steps": 550, "loss": 1.7392, "lr": 1e-05, "epoch": 0.9761417859577369, "percentage": 97.64, "elapsed_time": "12:34:23", "remaining_time": "0:18:15"}
|
238 |
-
{"current_steps": 538, "total_steps": 550, "loss": 1.7341, "lr": 1e-05, "epoch": 0.9779595546466712, "percentage": 97.82, "elapsed_time": "12:37:32", "remaining_time": "0:16:53"}
|
239 |
-
{"current_steps": 539, "total_steps": 550, "loss": 1.7367, "lr": 1e-05, "epoch": 0.9797773233356055, "percentage": 98.0, "elapsed_time": "12:40:42", "remaining_time": "0:15:31"}
|
240 |
-
{"current_steps": 540, "total_steps": 550, "loss": 1.7423, "lr": 1e-05, "epoch": 0.9815950920245399, "percentage": 98.18, "elapsed_time": "12:43:52", "remaining_time": "0:14:08"}
|
241 |
-
{"current_steps": 541, "total_steps": 550, "loss": 1.7429, "lr": 1e-05, "epoch": 0.9834128607134742, "percentage": 98.36, "elapsed_time": "12:47:01", "remaining_time": "0:12:45"}
|
242 |
-
{"current_steps": 542, "total_steps": 550, "loss": 1.7348, "lr": 1e-05, "epoch": 0.9852306294024086, "percentage": 98.55, "elapsed_time": "12:50:10", "remaining_time": "0:11:22"}
|
243 |
-
{"current_steps": 543, "total_steps": 550, "loss": 1.7382, "lr": 1e-05, "epoch": 0.9870483980913429, "percentage": 98.73, "elapsed_time": "12:53:20", "remaining_time": "0:09:58"}
|
244 |
-
{"current_steps": 544, "total_steps": 550, "loss": 1.7412, "lr": 1e-05, "epoch": 0.9888661667802772, "percentage": 98.91, "elapsed_time": "12:56:28", "remaining_time": "0:08:33"}
|
245 |
-
{"current_steps": 545, "total_steps": 550, "loss": 1.7287, "lr": 1e-05, "epoch": 0.9906839354692115, "percentage": 99.09, "elapsed_time": "12:59:38", "remaining_time": "0:07:09"}
|
246 |
-
{"current_steps": 546, "total_steps": 550, "loss": 1.7345, "lr": 1e-05, "epoch": 0.9925017041581459, "percentage": 99.27, "elapsed_time": "13:02:48", "remaining_time": "0:05:44"}
|
247 |
-
{"current_steps": 547, "total_steps": 550, "loss": 1.7282, "lr": 1e-05, "epoch": 0.9943194728470802, "percentage": 99.45, "elapsed_time": "13:05:58", "remaining_time": "0:04:18"}
|
248 |
-
{"current_steps": 548, "total_steps": 550, "loss": 1.7358, "lr": 1e-05, "epoch": 0.9961372415360146, "percentage": 99.64, "elapsed_time": "13:09:08", "remaining_time": "0:02:52"}
|
249 |
-
{"current_steps": 549, "total_steps": 550, "loss": 1.7371, "lr": 1e-05, "epoch": 0.9979550102249489, "percentage": 99.82, "elapsed_time": "13:12:18", "remaining_time": "0:01:26"}
|
250 |
-
{"current_steps": 550, "total_steps": 550, "loss": 1.7397, "lr": 1e-05, "epoch": 0.9997727789138832, "percentage": 100.0, "elapsed_time": "13:15:28", "remaining_time": "0:00:00"}
|
251 |
-
{"current_steps": 550, "total_steps": 550, "epoch": 0.9997727789138832, "percentage": 100.0, "elapsed_time": "13:18:32", "remaining_time": "0:00:00"}
|
|
|
1 |
+
{"current_steps": 551, "total_steps": 2200, "loss": 1.7215, "lr": 1e-05, "epoch": 1.0018177686889342, "percentage": 25.05, "elapsed_time": "0:03:22", "remaining_time": "0:10:07"}
|
2 |
+
{"current_steps": 552, "total_steps": 2200, "loss": 1.7231, "lr": 1e-05, "epoch": 1.0036355373778687, "percentage": 25.09, "elapsed_time": "0:06:37", "remaining_time": "0:19:46"}
|
3 |
+
{"current_steps": 553, "total_steps": 2200, "loss": 1.72, "lr": 1e-05, "epoch": 1.005453306066803, "percentage": 25.14, "elapsed_time": "0:09:47", "remaining_time": "0:29:08"}
|
4 |
+
{"current_steps": 554, "total_steps": 2200, "loss": 1.7254, "lr": 1e-05, "epoch": 1.0072710747557374, "percentage": 25.18, "elapsed_time": "0:12:55", "remaining_time": "0:38:23"}
|
5 |
+
{"current_steps": 555, "total_steps": 2200, "loss": 1.7207, "lr": 1e-05, "epoch": 1.0090888434446716, "percentage": 25.23, "elapsed_time": "0:16:03", "remaining_time": "0:47:34"}
|
6 |
+
{"current_steps": 556, "total_steps": 2200, "loss": 1.7205, "lr": 1e-05, "epoch": 1.010906612133606, "percentage": 25.27, "elapsed_time": "0:19:12", "remaining_time": "0:56:46"}
|
7 |
+
{"current_steps": 557, "total_steps": 2200, "loss": 1.7136, "lr": 1e-05, "epoch": 1.0127243808225403, "percentage": 25.32, "elapsed_time": "0:22:20", "remaining_time": "1:05:53"}
|
8 |
+
{"current_steps": 558, "total_steps": 2200, "loss": 1.7201, "lr": 1e-05, "epoch": 1.0145421495114746, "percentage": 25.36, "elapsed_time": "0:25:28", "remaining_time": "1:14:58"}
|
9 |
+
{"current_steps": 559, "total_steps": 2200, "loss": 1.7165, "lr": 1e-05, "epoch": 1.016359918200409, "percentage": 25.41, "elapsed_time": "0:28:37", "remaining_time": "1:24:00"}
|
10 |
+
{"current_steps": 560, "total_steps": 2200, "loss": 1.7138, "lr": 1e-05, "epoch": 1.0181776868893433, "percentage": 25.45, "elapsed_time": "0:31:46", "remaining_time": "1:33:03"}
|
11 |
+
{"current_steps": 561, "total_steps": 2200, "loss": 1.7087, "lr": 1e-05, "epoch": 1.0199954555782778, "percentage": 25.5, "elapsed_time": "0:34:57", "remaining_time": "1:42:06"}
|
12 |
+
{"current_steps": 562, "total_steps": 2200, "loss": 1.7211, "lr": 1e-05, "epoch": 1.021813224267212, "percentage": 25.55, "elapsed_time": "0:38:05", "remaining_time": "1:51:01"}
|
13 |
+
{"current_steps": 563, "total_steps": 2200, "loss": 1.7132, "lr": 1e-05, "epoch": 1.0236309929561462, "percentage": 25.59, "elapsed_time": "0:41:14", "remaining_time": "1:59:54"}
|
14 |
+
{"current_steps": 564, "total_steps": 2200, "loss": 1.7169, "lr": 1e-05, "epoch": 1.0254487616450807, "percentage": 25.64, "elapsed_time": "0:44:22", "remaining_time": "2:08:43"}
|
15 |
+
{"current_steps": 565, "total_steps": 2200, "loss": 1.7255, "lr": 1e-05, "epoch": 1.027266530334015, "percentage": 25.68, "elapsed_time": "0:47:30", "remaining_time": "2:17:29"}
|
16 |
+
{"current_steps": 566, "total_steps": 2200, "loss": 1.7211, "lr": 1e-05, "epoch": 1.0290842990229494, "percentage": 25.73, "elapsed_time": "0:50:40", "remaining_time": "2:26:17"}
|
17 |
+
{"current_steps": 567, "total_steps": 2200, "loss": 1.7143, "lr": 1e-05, "epoch": 1.0309020677118836, "percentage": 25.77, "elapsed_time": "0:53:50", "remaining_time": "2:35:03"}
|
18 |
+
{"current_steps": 568, "total_steps": 2200, "loss": 1.7185, "lr": 1e-05, "epoch": 1.032719836400818, "percentage": 25.82, "elapsed_time": "0:57:00", "remaining_time": "2:43:46"}
|
19 |
+
{"current_steps": 569, "total_steps": 2200, "loss": 1.722, "lr": 1e-05, "epoch": 1.0345376050897523, "percentage": 25.86, "elapsed_time": "1:00:08", "remaining_time": "2:52:24"}
|
20 |
+
{"current_steps": 570, "total_steps": 2200, "loss": 1.7247, "lr": 1e-05, "epoch": 1.0363553737786866, "percentage": 25.91, "elapsed_time": "1:03:17", "remaining_time": "3:01:00"}
|
21 |
+
{"current_steps": 571, "total_steps": 2200, "loss": 1.7196, "lr": 1e-05, "epoch": 1.038173142467621, "percentage": 25.95, "elapsed_time": "1:06:28", "remaining_time": "3:09:37"}
|
22 |
+
{"current_steps": 572, "total_steps": 2200, "loss": 1.7133, "lr": 1e-05, "epoch": 1.0399909111565553, "percentage": 26.0, "elapsed_time": "1:09:37", "remaining_time": "3:18:10"}
|
23 |
+
{"current_steps": 573, "total_steps": 2200, "loss": 1.7169, "lr": 1e-05, "epoch": 1.0418086798454897, "percentage": 26.05, "elapsed_time": "1:12:47", "remaining_time": "3:26:41"}
|
24 |
+
{"current_steps": 574, "total_steps": 2200, "loss": 1.7152, "lr": 1e-05, "epoch": 1.043626448534424, "percentage": 26.09, "elapsed_time": "1:15:57", "remaining_time": "3:35:11"}
|
25 |
+
{"current_steps": 575, "total_steps": 2200, "loss": 1.7206, "lr": 1e-05, "epoch": 1.0454442172233582, "percentage": 26.14, "elapsed_time": "1:19:06", "remaining_time": "3:43:32"}
|
26 |
+
{"current_steps": 576, "total_steps": 2200, "loss": 1.706, "lr": 1e-05, "epoch": 1.0472619859122927, "percentage": 26.18, "elapsed_time": "1:22:15", "remaining_time": "3:51:55"}
|
27 |
+
{"current_steps": 577, "total_steps": 2200, "loss": 1.7131, "lr": 1e-05, "epoch": 1.049079754601227, "percentage": 26.23, "elapsed_time": "1:25:23", "remaining_time": "4:00:10"}
|
28 |
+
{"current_steps": 578, "total_steps": 2200, "loss": 1.7191, "lr": 1e-05, "epoch": 1.0508975232901614, "percentage": 26.27, "elapsed_time": "1:28:31", "remaining_time": "4:08:25"}
|
29 |
+
{"current_steps": 579, "total_steps": 2200, "loss": 1.7066, "lr": 1e-05, "epoch": 1.0527152919790956, "percentage": 26.32, "elapsed_time": "1:31:40", "remaining_time": "4:16:39"}
|
30 |
+
{"current_steps": 580, "total_steps": 2200, "loss": 1.7223, "lr": 1e-05, "epoch": 1.05453306066803, "percentage": 26.36, "elapsed_time": "1:34:49", "remaining_time": "4:24:51"}
|
31 |
+
{"current_steps": 581, "total_steps": 2200, "loss": 1.7164, "lr": 1e-05, "epoch": 1.0563508293569643, "percentage": 26.41, "elapsed_time": "1:37:58", "remaining_time": "4:33:00"}
|
32 |
+
{"current_steps": 582, "total_steps": 2200, "loss": 1.7082, "lr": 1e-05, "epoch": 1.0581685980458986, "percentage": 26.45, "elapsed_time": "1:41:06", "remaining_time": "4:41:06"}
|
33 |
+
{"current_steps": 583, "total_steps": 2200, "loss": 1.7155, "lr": 1e-05, "epoch": 1.059986366734833, "percentage": 26.5, "elapsed_time": "1:44:16", "remaining_time": "4:49:14"}
|
34 |
+
{"current_steps": 584, "total_steps": 2200, "loss": 1.7195, "lr": 1e-05, "epoch": 1.0618041354237673, "percentage": 26.55, "elapsed_time": "1:47:26", "remaining_time": "4:57:19"}
|
35 |
+
{"current_steps": 585, "total_steps": 2200, "loss": 1.7139, "lr": 1e-05, "epoch": 1.0636219041127017, "percentage": 26.59, "elapsed_time": "1:50:35", "remaining_time": "5:05:19"}
|
36 |
+
{"current_steps": 586, "total_steps": 2200, "loss": 1.7076, "lr": 1e-05, "epoch": 1.065439672801636, "percentage": 26.64, "elapsed_time": "1:53:44", "remaining_time": "5:13:15"}
|
37 |
+
{"current_steps": 587, "total_steps": 2200, "loss": 1.716, "lr": 1e-05, "epoch": 1.0672574414905702, "percentage": 26.68, "elapsed_time": "1:56:53", "remaining_time": "5:21:12"}
|
38 |
+
{"current_steps": 588, "total_steps": 2200, "loss": 1.715, "lr": 1e-05, "epoch": 1.0690752101795047, "percentage": 26.73, "elapsed_time": "2:00:02", "remaining_time": "5:29:05"}
|
39 |
+
{"current_steps": 589, "total_steps": 2200, "loss": 1.7197, "lr": 1e-05, "epoch": 1.070892978868439, "percentage": 26.77, "elapsed_time": "2:03:10", "remaining_time": "5:36:53"}
|
40 |
+
{"current_steps": 590, "total_steps": 2200, "loss": 1.7139, "lr": 1e-05, "epoch": 1.0727107475573734, "percentage": 26.82, "elapsed_time": "2:06:18", "remaining_time": "5:44:41"}
|
41 |
+
{"current_steps": 591, "total_steps": 2200, "loss": 1.7211, "lr": 1e-05, "epoch": 1.0745285162463076, "percentage": 26.86, "elapsed_time": "2:09:27", "remaining_time": "5:52:27"}
|
42 |
+
{"current_steps": 592, "total_steps": 2200, "loss": 1.7077, "lr": 1e-05, "epoch": 1.076346284935242, "percentage": 26.91, "elapsed_time": "2:12:37", "remaining_time": "6:00:13"}
|
43 |
+
{"current_steps": 593, "total_steps": 2200, "loss": 1.7122, "lr": 1e-05, "epoch": 1.0781640536241763, "percentage": 26.95, "elapsed_time": "2:15:48", "remaining_time": "6:08:01"}
|
44 |
+
{"current_steps": 594, "total_steps": 2200, "loss": 1.7185, "lr": 1e-05, "epoch": 1.0799818223131106, "percentage": 27.0, "elapsed_time": "2:18:59", "remaining_time": "6:15:47"}
|
45 |
+
{"current_steps": 595, "total_steps": 2200, "loss": 1.7139, "lr": 1e-05, "epoch": 1.081799591002045, "percentage": 27.05, "elapsed_time": "2:22:08", "remaining_time": "6:23:26"}
|
46 |
+
{"current_steps": 596, "total_steps": 2200, "loss": 1.7136, "lr": 1e-05, "epoch": 1.0836173596909793, "percentage": 27.09, "elapsed_time": "2:25:18", "remaining_time": "6:31:04"}
|
47 |
+
{"current_steps": 597, "total_steps": 2200, "loss": 1.7165, "lr": 1e-05, "epoch": 1.0854351283799137, "percentage": 27.14, "elapsed_time": "2:28:27", "remaining_time": "6:38:38"}
|
48 |
+
{"current_steps": 598, "total_steps": 2200, "loss": 1.7177, "lr": 1e-05, "epoch": 1.087252897068848, "percentage": 27.18, "elapsed_time": "2:31:37", "remaining_time": "6:46:12"}
|
49 |
+
{"current_steps": 599, "total_steps": 2200, "loss": 1.7129, "lr": 1e-05, "epoch": 1.0890706657577822, "percentage": 27.23, "elapsed_time": "2:34:46", "remaining_time": "6:53:39"}
|
50 |
+
{"current_steps": 600, "total_steps": 2200, "loss": 1.7267, "lr": 1e-05, "epoch": 1.0908884344467167, "percentage": 27.27, "elapsed_time": "2:37:55", "remaining_time": "7:01:08"}
|
51 |
+
{"current_steps": 601, "total_steps": 2200, "loss": 1.7212, "lr": 1e-05, "epoch": 1.092706203135651, "percentage": 27.32, "elapsed_time": "2:44:27", "remaining_time": "7:17:33"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 7672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6ca41750297033af1f4e715f9a53c1574c6b50c268cfbdd3aeb59e901d1e27f
|
3 |
size 7672
|