furmaniak commited on
Commit
5b8d2e1
·
verified ·
1 Parent(s): b95e3e6

Training in progress, step 600

Browse files
model-00001-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bf0ee0a475d1ebfa972693fef768d594bff3cc3d71e824a175b6f2fe3e8c9caf
3
  size 4933656472
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f2777087bbcd133c6e507c2669ceaffd7a3cb3bb12c12286fe93cb1765f029f
3
  size 4933656472
model-00002-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:17c8eec037873090704a9142967bb748609c6928ebf15f984139cc6cd1ebcb18
3
  size 4954690712
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03b17d3bb165127e2c8a824b11b2fcf9495696900e53cd809421ba0aaa3a7443
3
  size 4954690712
model-00003-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4c7dae149c1fa9ee6329e67e7dcdf5cb3ae85250fb95fa4e2cc59d210dbade69
3
  size 4902241352
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:298c26ed2b3898ab3416ca53c67b73f198b06074b5861c7215a071159c703218
3
  size 4902241352
model-00004-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d9cdd47b2f31cf295b01f82831d5b6cb59879405214db51e5d9100fddf9b9c79
3
  size 4771169120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6adf1ad69c7689be879be78b514105e062f4bc01b78199b462692190a1a3cbc
3
  size 4771169120
model-00005-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:765ee5a84a70187412f93cf35573415c16ad0b5db2adaee0822d4964e3617a13
3
  size 4771169120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a77a448273a4f1ae0309e1a0cf13ef22e13a5219068768bbac7c54026d94c0a3
3
  size 4771169120
model-00006-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c244d5e95e5d827079f9d2d72ee8f62121386db81921f82eb6540bbc21467cdd
3
  size 4986116216
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e772c73805283d90e378e998fef03495c960a32c2e787f029936fbf998e0a25
3
  size 4986116216
trainer_log.jsonl CHANGED
@@ -1,251 +1,51 @@
1
- {"current_steps": 301, "total_steps": 550, "loss": 1.7592, "lr": 1e-05, "epoch": 0.5471483753692342, "percentage": 54.73, "elapsed_time": "0:03:25", "remaining_time": "0:02:50"}
2
- {"current_steps": 302, "total_steps": 550, "loss": 1.7495, "lr": 1e-05, "epoch": 0.5489661440581686, "percentage": 54.91, "elapsed_time": "0:06:41", "remaining_time": "0:05:29"}
3
- {"current_steps": 303, "total_steps": 550, "loss": 1.7564, "lr": 1e-05, "epoch": 0.5507839127471029, "percentage": 55.09, "elapsed_time": "0:09:54", "remaining_time": "0:08:04"}
4
- {"current_steps": 304, "total_steps": 550, "loss": 1.7635, "lr": 1e-05, "epoch": 0.5526016814360373, "percentage": 55.27, "elapsed_time": "0:13:08", "remaining_time": "0:10:38"}
5
- {"current_steps": 305, "total_steps": 550, "loss": 1.748, "lr": 1e-05, "epoch": 0.5544194501249716, "percentage": 55.45, "elapsed_time": "0:16:23", "remaining_time": "0:13:10"}
6
- {"current_steps": 306, "total_steps": 550, "loss": 1.7467, "lr": 1e-05, "epoch": 0.556237218813906, "percentage": 55.64, "elapsed_time": "0:19:34", "remaining_time": "0:15:36"}
7
- {"current_steps": 307, "total_steps": 550, "loss": 1.751, "lr": 1e-05, "epoch": 0.5580549875028402, "percentage": 55.82, "elapsed_time": "0:22:44", "remaining_time": "0:17:59"}
8
- {"current_steps": 308, "total_steps": 550, "loss": 1.7605, "lr": 1e-05, "epoch": 0.5598727561917746, "percentage": 56.0, "elapsed_time": "0:25:52", "remaining_time": "0:20:20"}
9
- {"current_steps": 309, "total_steps": 550, "loss": 1.7516, "lr": 1e-05, "epoch": 0.5616905248807089, "percentage": 56.18, "elapsed_time": "0:29:01", "remaining_time": "0:22:38"}
10
- {"current_steps": 310, "total_steps": 550, "loss": 1.7557, "lr": 1e-05, "epoch": 0.5635082935696433, "percentage": 56.36, "elapsed_time": "0:32:09", "remaining_time": "0:24:53"}
11
- {"current_steps": 311, "total_steps": 550, "loss": 1.7548, "lr": 1e-05, "epoch": 0.5653260622585776, "percentage": 56.55, "elapsed_time": "0:35:17", "remaining_time": "0:27:07"}
12
- {"current_steps": 312, "total_steps": 550, "loss": 1.7569, "lr": 1e-05, "epoch": 0.567143830947512, "percentage": 56.73, "elapsed_time": "0:38:24", "remaining_time": "0:29:18"}
13
- {"current_steps": 313, "total_steps": 550, "loss": 1.7499, "lr": 1e-05, "epoch": 0.5689615996364462, "percentage": 56.91, "elapsed_time": "0:41:32", "remaining_time": "0:31:26"}
14
- {"current_steps": 314, "total_steps": 550, "loss": 1.7628, "lr": 1e-05, "epoch": 0.5707793683253806, "percentage": 57.09, "elapsed_time": "0:44:42", "remaining_time": "0:33:36"}
15
- {"current_steps": 315, "total_steps": 550, "loss": 1.7695, "lr": 1e-05, "epoch": 0.5725971370143149, "percentage": 57.27, "elapsed_time": "0:47:53", "remaining_time": "0:35:43"}
16
- {"current_steps": 316, "total_steps": 550, "loss": 1.7573, "lr": 1e-05, "epoch": 0.5744149057032493, "percentage": 57.45, "elapsed_time": "0:51:03", "remaining_time": "0:37:48"}
17
- {"current_steps": 317, "total_steps": 550, "loss": 1.7672, "lr": 1e-05, "epoch": 0.5762326743921836, "percentage": 57.64, "elapsed_time": "0:54:13", "remaining_time": "0:39:51"}
18
- {"current_steps": 318, "total_steps": 550, "loss": 1.7481, "lr": 1e-05, "epoch": 0.578050443081118, "percentage": 57.82, "elapsed_time": "0:57:23", "remaining_time": "0:41:52"}
19
- {"current_steps": 319, "total_steps": 550, "loss": 1.7543, "lr": 1e-05, "epoch": 0.5798682117700522, "percentage": 58.0, "elapsed_time": "1:00:31", "remaining_time": "0:43:50"}
20
- {"current_steps": 320, "total_steps": 550, "loss": 1.7595, "lr": 1e-05, "epoch": 0.5816859804589866, "percentage": 58.18, "elapsed_time": "1:03:40", "remaining_time": "0:45:45"}
21
- {"current_steps": 321, "total_steps": 550, "loss": 1.7624, "lr": 1e-05, "epoch": 0.5835037491479209, "percentage": 58.36, "elapsed_time": "1:06:47", "remaining_time": "0:47:38"}
22
- {"current_steps": 322, "total_steps": 550, "loss": 1.7633, "lr": 1e-05, "epoch": 0.5853215178368553, "percentage": 58.55, "elapsed_time": "1:09:57", "remaining_time": "0:49:32"}
23
- {"current_steps": 323, "total_steps": 550, "loss": 1.753, "lr": 1e-05, "epoch": 0.5871392865257896, "percentage": 58.73, "elapsed_time": "1:13:07", "remaining_time": "0:51:23"}
24
- {"current_steps": 324, "total_steps": 550, "loss": 1.7553, "lr": 1e-05, "epoch": 0.588957055214724, "percentage": 58.91, "elapsed_time": "1:16:16", "remaining_time": "0:53:12"}
25
- {"current_steps": 325, "total_steps": 550, "loss": 1.759, "lr": 1e-05, "epoch": 0.5907748239036582, "percentage": 59.09, "elapsed_time": "1:19:26", "remaining_time": "0:54:59"}
26
- {"current_steps": 326, "total_steps": 550, "loss": 1.7545, "lr": 1e-05, "epoch": 0.5925925925925926, "percentage": 59.27, "elapsed_time": "1:22:34", "remaining_time": "0:56:44"}
27
- {"current_steps": 327, "total_steps": 550, "loss": 1.7569, "lr": 1e-05, "epoch": 0.5944103612815269, "percentage": 59.45, "elapsed_time": "1:25:42", "remaining_time": "0:58:27"}
28
- {"current_steps": 328, "total_steps": 550, "loss": 1.7551, "lr": 1e-05, "epoch": 0.5962281299704613, "percentage": 59.64, "elapsed_time": "1:28:52", "remaining_time": "1:00:09"}
29
- {"current_steps": 329, "total_steps": 550, "loss": 1.7489, "lr": 1e-05, "epoch": 0.5980458986593956, "percentage": 59.82, "elapsed_time": "1:32:02", "remaining_time": "1:01:49"}
30
- {"current_steps": 330, "total_steps": 550, "loss": 1.7584, "lr": 1e-05, "epoch": 0.59986366734833, "percentage": 60.0, "elapsed_time": "1:35:10", "remaining_time": "1:03:26"}
31
- {"current_steps": 331, "total_steps": 550, "loss": 1.7484, "lr": 1e-05, "epoch": 0.6016814360372642, "percentage": 60.18, "elapsed_time": "1:38:18", "remaining_time": "1:05:02"}
32
- {"current_steps": 332, "total_steps": 550, "loss": 1.7549, "lr": 1e-05, "epoch": 0.6034992047261986, "percentage": 60.36, "elapsed_time": "1:41:27", "remaining_time": "1:06:37"}
33
- {"current_steps": 333, "total_steps": 550, "loss": 1.7503, "lr": 1e-05, "epoch": 0.6053169734151329, "percentage": 60.55, "elapsed_time": "1:44:37", "remaining_time": "1:08:10"}
34
- {"current_steps": 334, "total_steps": 550, "loss": 1.7613, "lr": 1e-05, "epoch": 0.6071347421040673, "percentage": 60.73, "elapsed_time": "1:47:46", "remaining_time": "1:09:41"}
35
- {"current_steps": 335, "total_steps": 550, "loss": 1.7539, "lr": 1e-05, "epoch": 0.6089525107930016, "percentage": 60.91, "elapsed_time": "1:50:54", "remaining_time": "1:11:10"}
36
- {"current_steps": 336, "total_steps": 550, "loss": 1.752, "lr": 1e-05, "epoch": 0.610770279481936, "percentage": 61.09, "elapsed_time": "1:54:07", "remaining_time": "1:12:41"}
37
- {"current_steps": 337, "total_steps": 550, "loss": 1.753, "lr": 1e-05, "epoch": 0.6125880481708702, "percentage": 61.27, "elapsed_time": "1:57:19", "remaining_time": "1:14:09"}
38
- {"current_steps": 338, "total_steps": 550, "loss": 1.7574, "lr": 1e-05, "epoch": 0.6144058168598046, "percentage": 61.45, "elapsed_time": "2:00:28", "remaining_time": "1:15:34"}
39
- {"current_steps": 339, "total_steps": 550, "loss": 1.7552, "lr": 1e-05, "epoch": 0.6162235855487389, "percentage": 61.64, "elapsed_time": "2:03:38", "remaining_time": "1:16:57"}
40
- {"current_steps": 340, "total_steps": 550, "loss": 1.7538, "lr": 1e-05, "epoch": 0.6180413542376733, "percentage": 61.82, "elapsed_time": "2:06:48", "remaining_time": "1:18:19"}
41
- {"current_steps": 341, "total_steps": 550, "loss": 1.7589, "lr": 1e-05, "epoch": 0.6198591229266076, "percentage": 62.0, "elapsed_time": "2:09:57", "remaining_time": "1:19:38"}
42
- {"current_steps": 342, "total_steps": 550, "loss": 1.7514, "lr": 1e-05, "epoch": 0.621676891615542, "percentage": 62.18, "elapsed_time": "2:13:05", "remaining_time": "1:20:56"}
43
- {"current_steps": 343, "total_steps": 550, "loss": 1.7578, "lr": 1e-05, "epoch": 0.6234946603044762, "percentage": 62.36, "elapsed_time": "2:16:13", "remaining_time": "1:22:12"}
44
- {"current_steps": 344, "total_steps": 550, "loss": 1.7528, "lr": 1e-05, "epoch": 0.6253124289934106, "percentage": 62.55, "elapsed_time": "2:19:23", "remaining_time": "1:23:28"}
45
- {"current_steps": 345, "total_steps": 550, "loss": 1.7511, "lr": 1e-05, "epoch": 0.6271301976823449, "percentage": 62.73, "elapsed_time": "2:22:31", "remaining_time": "1:24:41"}
46
- {"current_steps": 346, "total_steps": 550, "loss": 1.7504, "lr": 1e-05, "epoch": 0.6289479663712793, "percentage": 62.91, "elapsed_time": "2:25:39", "remaining_time": "1:25:52"}
47
- {"current_steps": 347, "total_steps": 550, "loss": 1.7545, "lr": 1e-05, "epoch": 0.6307657350602136, "percentage": 63.09, "elapsed_time": "2:28:48", "remaining_time": "1:27:03"}
48
- {"current_steps": 348, "total_steps": 550, "loss": 1.7481, "lr": 1e-05, "epoch": 0.632583503749148, "percentage": 63.27, "elapsed_time": "2:31:57", "remaining_time": "1:28:12"}
49
- {"current_steps": 349, "total_steps": 550, "loss": 1.7614, "lr": 1e-05, "epoch": 0.6344012724380823, "percentage": 63.45, "elapsed_time": "2:35:05", "remaining_time": "1:29:19"}
50
- {"current_steps": 350, "total_steps": 550, "loss": 1.7497, "lr": 1e-05, "epoch": 0.6362190411270165, "percentage": 63.64, "elapsed_time": "2:38:14", "remaining_time": "1:30:25"}
51
- {"current_steps": 351, "total_steps": 550, "loss": 1.7537, "lr": 1e-05, "epoch": 0.6380368098159509, "percentage": 63.82, "elapsed_time": "2:41:23", "remaining_time": "1:31:29"}
52
- {"current_steps": 352, "total_steps": 550, "loss": 1.7456, "lr": 1e-05, "epoch": 0.6398545785048853, "percentage": 64.0, "elapsed_time": "2:44:32", "remaining_time": "1:32:33"}
53
- {"current_steps": 353, "total_steps": 550, "loss": 1.7494, "lr": 1e-05, "epoch": 0.6416723471938196, "percentage": 64.18, "elapsed_time": "2:47:41", "remaining_time": "1:33:34"}
54
- {"current_steps": 354, "total_steps": 550, "loss": 1.743, "lr": 1e-05, "epoch": 0.643490115882754, "percentage": 64.36, "elapsed_time": "2:50:50", "remaining_time": "1:34:35"}
55
- {"current_steps": 355, "total_steps": 550, "loss": 1.7478, "lr": 1e-05, "epoch": 0.6453078845716883, "percentage": 64.55, "elapsed_time": "2:53:58", "remaining_time": "1:35:34"}
56
- {"current_steps": 356, "total_steps": 550, "loss": 1.7535, "lr": 1e-05, "epoch": 0.6471256532606225, "percentage": 64.73, "elapsed_time": "2:57:08", "remaining_time": "1:36:31"}
57
- {"current_steps": 357, "total_steps": 550, "loss": 1.759, "lr": 1e-05, "epoch": 0.6489434219495569, "percentage": 64.91, "elapsed_time": "3:00:17", "remaining_time": "1:37:28"}
58
- {"current_steps": 358, "total_steps": 550, "loss": 1.755, "lr": 1e-05, "epoch": 0.6507611906384912, "percentage": 65.09, "elapsed_time": "3:03:27", "remaining_time": "1:38:23"}
59
- {"current_steps": 359, "total_steps": 550, "loss": 1.7597, "lr": 1e-05, "epoch": 0.6525789593274256, "percentage": 65.27, "elapsed_time": "3:06:36", "remaining_time": "1:39:16"}
60
- {"current_steps": 360, "total_steps": 550, "loss": 1.7468, "lr": 1e-05, "epoch": 0.65439672801636, "percentage": 65.45, "elapsed_time": "3:09:47", "remaining_time": "1:40:10"}
61
- {"current_steps": 361, "total_steps": 550, "loss": 1.7468, "lr": 1e-05, "epoch": 0.6562144967052943, "percentage": 65.64, "elapsed_time": "3:12:57", "remaining_time": "1:41:01"}
62
- {"current_steps": 362, "total_steps": 550, "loss": 1.7477, "lr": 1e-05, "epoch": 0.6580322653942285, "percentage": 65.82, "elapsed_time": "3:16:07", "remaining_time": "1:41:51"}
63
- {"current_steps": 363, "total_steps": 550, "loss": 1.7643, "lr": 1e-05, "epoch": 0.6598500340831629, "percentage": 66.0, "elapsed_time": "3:19:17", "remaining_time": "1:42:40"}
64
- {"current_steps": 364, "total_steps": 550, "loss": 1.7514, "lr": 1e-05, "epoch": 0.6616678027720972, "percentage": 66.18, "elapsed_time": "3:22:28", "remaining_time": "1:43:27"}
65
- {"current_steps": 365, "total_steps": 550, "loss": 1.7581, "lr": 1e-05, "epoch": 0.6634855714610316, "percentage": 66.36, "elapsed_time": "3:25:38", "remaining_time": "1:44:13"}
66
- {"current_steps": 366, "total_steps": 550, "loss": 1.7455, "lr": 1e-05, "epoch": 0.665303340149966, "percentage": 66.55, "elapsed_time": "3:28:47", "remaining_time": "1:44:57"}
67
- {"current_steps": 367, "total_steps": 550, "loss": 1.7483, "lr": 1e-05, "epoch": 0.6671211088389003, "percentage": 66.73, "elapsed_time": "3:31:55", "remaining_time": "1:45:40"}
68
- {"current_steps": 368, "total_steps": 550, "loss": 1.7512, "lr": 1e-05, "epoch": 0.6689388775278345, "percentage": 66.91, "elapsed_time": "3:35:04", "remaining_time": "1:46:22"}
69
- {"current_steps": 369, "total_steps": 550, "loss": 1.7528, "lr": 1e-05, "epoch": 0.6707566462167689, "percentage": 67.09, "elapsed_time": "3:38:14", "remaining_time": "1:47:03"}
70
- {"current_steps": 370, "total_steps": 550, "loss": 1.7446, "lr": 1e-05, "epoch": 0.6725744149057032, "percentage": 67.27, "elapsed_time": "3:41:24", "remaining_time": "1:47:42"}
71
- {"current_steps": 371, "total_steps": 550, "loss": 1.7533, "lr": 1e-05, "epoch": 0.6743921835946376, "percentage": 67.45, "elapsed_time": "3:44:33", "remaining_time": "1:48:20"}
72
- {"current_steps": 372, "total_steps": 550, "loss": 1.7512, "lr": 1e-05, "epoch": 0.676209952283572, "percentage": 67.64, "elapsed_time": "3:47:44", "remaining_time": "1:48:58"}
73
- {"current_steps": 373, "total_steps": 550, "loss": 1.7533, "lr": 1e-05, "epoch": 0.6780277209725063, "percentage": 67.82, "elapsed_time": "3:50:53", "remaining_time": "1:49:33"}
74
- {"current_steps": 374, "total_steps": 550, "loss": 1.7468, "lr": 1e-05, "epoch": 0.6798454896614405, "percentage": 68.0, "elapsed_time": "3:54:01", "remaining_time": "1:50:07"}
75
- {"current_steps": 375, "total_steps": 550, "loss": 1.7514, "lr": 1e-05, "epoch": 0.6816632583503749, "percentage": 68.18, "elapsed_time": "3:57:10", "remaining_time": "1:50:40"}
76
- {"current_steps": 376, "total_steps": 550, "loss": 1.746, "lr": 1e-05, "epoch": 0.6834810270393092, "percentage": 68.36, "elapsed_time": "4:00:19", "remaining_time": "1:51:12"}
77
- {"current_steps": 377, "total_steps": 550, "loss": 1.7472, "lr": 1e-05, "epoch": 0.6852987957282436, "percentage": 68.55, "elapsed_time": "4:03:27", "remaining_time": "1:51:43"}
78
- {"current_steps": 378, "total_steps": 550, "loss": 1.7445, "lr": 1e-05, "epoch": 0.6871165644171779, "percentage": 68.73, "elapsed_time": "4:06:37", "remaining_time": "1:52:13"}
79
- {"current_steps": 379, "total_steps": 550, "loss": 1.7575, "lr": 1e-05, "epoch": 0.6889343331061123, "percentage": 68.91, "elapsed_time": "4:09:47", "remaining_time": "1:52:42"}
80
- {"current_steps": 380, "total_steps": 550, "loss": 1.7478, "lr": 1e-05, "epoch": 0.6907521017950465, "percentage": 69.09, "elapsed_time": "4:12:56", "remaining_time": "1:53:09"}
81
- {"current_steps": 381, "total_steps": 550, "loss": 1.7577, "lr": 1e-05, "epoch": 0.6925698704839809, "percentage": 69.27, "elapsed_time": "4:16:06", "remaining_time": "1:53:36"}
82
- {"current_steps": 382, "total_steps": 550, "loss": 1.7516, "lr": 1e-05, "epoch": 0.6943876391729152, "percentage": 69.45, "elapsed_time": "4:19:16", "remaining_time": "1:54:01"}
83
- {"current_steps": 383, "total_steps": 550, "loss": 1.7488, "lr": 1e-05, "epoch": 0.6962054078618496, "percentage": 69.64, "elapsed_time": "4:22:25", "remaining_time": "1:54:25"}
84
- {"current_steps": 384, "total_steps": 550, "loss": 1.7545, "lr": 1e-05, "epoch": 0.6980231765507839, "percentage": 69.82, "elapsed_time": "4:25:35", "remaining_time": "1:54:48"}
85
- {"current_steps": 385, "total_steps": 550, "loss": 1.7533, "lr": 1e-05, "epoch": 0.6998409452397183, "percentage": 70.0, "elapsed_time": "4:28:45", "remaining_time": "1:55:11"}
86
- {"current_steps": 386, "total_steps": 550, "loss": 1.7521, "lr": 1e-05, "epoch": 0.7016587139286525, "percentage": 70.18, "elapsed_time": "4:31:55", "remaining_time": "1:55:31"}
87
- {"current_steps": 387, "total_steps": 550, "loss": 1.7548, "lr": 1e-05, "epoch": 0.7034764826175869, "percentage": 70.36, "elapsed_time": "4:35:03", "remaining_time": "1:55:51"}
88
- {"current_steps": 388, "total_steps": 550, "loss": 1.7443, "lr": 1e-05, "epoch": 0.7052942513065212, "percentage": 70.55, "elapsed_time": "4:38:13", "remaining_time": "1:56:09"}
89
- {"current_steps": 389, "total_steps": 550, "loss": 1.7515, "lr": 1e-05, "epoch": 0.7071120199954556, "percentage": 70.73, "elapsed_time": "4:41:22", "remaining_time": "1:56:27"}
90
- {"current_steps": 390, "total_steps": 550, "loss": 1.7478, "lr": 1e-05, "epoch": 0.7089297886843899, "percentage": 70.91, "elapsed_time": "4:44:32", "remaining_time": "1:56:44"}
91
- {"current_steps": 391, "total_steps": 550, "loss": 1.7487, "lr": 1e-05, "epoch": 0.7107475573733243, "percentage": 71.09, "elapsed_time": "4:47:41", "remaining_time": "1:56:59"}
92
- {"current_steps": 392, "total_steps": 550, "loss": 1.7539, "lr": 1e-05, "epoch": 0.7125653260622585, "percentage": 71.27, "elapsed_time": "4:50:50", "remaining_time": "1:57:13"}
93
- {"current_steps": 393, "total_steps": 550, "loss": 1.7488, "lr": 1e-05, "epoch": 0.7143830947511929, "percentage": 71.45, "elapsed_time": "4:53:59", "remaining_time": "1:57:26"}
94
- {"current_steps": 394, "total_steps": 550, "loss": 1.7448, "lr": 1e-05, "epoch": 0.7162008634401272, "percentage": 71.64, "elapsed_time": "4:57:08", "remaining_time": "1:57:38"}
95
- {"current_steps": 395, "total_steps": 550, "loss": 1.7399, "lr": 1e-05, "epoch": 0.7180186321290616, "percentage": 71.82, "elapsed_time": "5:00:18", "remaining_time": "1:57:50"}
96
- {"current_steps": 396, "total_steps": 550, "loss": 1.7566, "lr": 1e-05, "epoch": 0.7198364008179959, "percentage": 72.0, "elapsed_time": "5:03:28", "remaining_time": "1:58:01"}
97
- {"current_steps": 397, "total_steps": 550, "loss": 1.751, "lr": 1e-05, "epoch": 0.7216541695069303, "percentage": 72.18, "elapsed_time": "5:06:38", "remaining_time": "1:58:10"}
98
- {"current_steps": 398, "total_steps": 550, "loss": 1.7474, "lr": 1e-05, "epoch": 0.7234719381958645, "percentage": 72.36, "elapsed_time": "5:09:48", "remaining_time": "1:58:18"}
99
- {"current_steps": 399, "total_steps": 550, "loss": 1.7492, "lr": 1e-05, "epoch": 0.7252897068847989, "percentage": 72.55, "elapsed_time": "5:12:58", "remaining_time": "1:58:26"}
100
- {"current_steps": 400, "total_steps": 550, "loss": 1.7571, "lr": 1e-05, "epoch": 0.7271074755737332, "percentage": 72.73, "elapsed_time": "5:16:08", "remaining_time": "1:58:33"}
101
- {"current_steps": 401, "total_steps": 550, "loss": 1.7426, "lr": 1e-05, "epoch": 0.7289252442626676, "percentage": 72.91, "elapsed_time": "5:22:24", "remaining_time": "1:59:47"}
102
- {"current_steps": 402, "total_steps": 550, "loss": 1.7564, "lr": 1e-05, "epoch": 0.7307430129516019, "percentage": 73.09, "elapsed_time": "5:25:34", "remaining_time": "1:59:51"}
103
- {"current_steps": 403, "total_steps": 550, "loss": 1.7495, "lr": 1e-05, "epoch": 0.7325607816405363, "percentage": 73.27, "elapsed_time": "5:28:41", "remaining_time": "1:59:53"}
104
- {"current_steps": 404, "total_steps": 550, "loss": 1.7479, "lr": 1e-05, "epoch": 0.7343785503294705, "percentage": 73.45, "elapsed_time": "5:31:49", "remaining_time": "1:59:54"}
105
- {"current_steps": 405, "total_steps": 550, "loss": 1.7475, "lr": 1e-05, "epoch": 0.7361963190184049, "percentage": 73.64, "elapsed_time": "5:34:55", "remaining_time": "1:59:54"}
106
- {"current_steps": 406, "total_steps": 550, "loss": 1.7517, "lr": 1e-05, "epoch": 0.7380140877073392, "percentage": 73.82, "elapsed_time": "5:38:03", "remaining_time": "1:59:54"}
107
- {"current_steps": 407, "total_steps": 550, "loss": 1.7556, "lr": 1e-05, "epoch": 0.7398318563962736, "percentage": 74.0, "elapsed_time": "5:41:10", "remaining_time": "1:59:52"}
108
- {"current_steps": 408, "total_steps": 550, "loss": 1.7394, "lr": 1e-05, "epoch": 0.7416496250852079, "percentage": 74.18, "elapsed_time": "5:44:17", "remaining_time": "1:59:49"}
109
- {"current_steps": 409, "total_steps": 550, "loss": 1.7483, "lr": 1e-05, "epoch": 0.7434673937741423, "percentage": 74.36, "elapsed_time": "5:47:26", "remaining_time": "1:59:46"}
110
- {"current_steps": 410, "total_steps": 550, "loss": 1.7483, "lr": 1e-05, "epoch": 0.7452851624630765, "percentage": 74.55, "elapsed_time": "5:50:34", "remaining_time": "1:59:42"}
111
- {"current_steps": 411, "total_steps": 550, "loss": 1.7522, "lr": 1e-05, "epoch": 0.7471029311520109, "percentage": 74.73, "elapsed_time": "5:53:41", "remaining_time": "1:59:37"}
112
- {"current_steps": 412, "total_steps": 550, "loss": 1.7478, "lr": 1e-05, "epoch": 0.7489206998409452, "percentage": 74.91, "elapsed_time": "5:56:50", "remaining_time": "1:59:31"}
113
- {"current_steps": 413, "total_steps": 550, "loss": 1.7475, "lr": 1e-05, "epoch": 0.7507384685298796, "percentage": 75.09, "elapsed_time": "5:59:57", "remaining_time": "1:59:24"}
114
- {"current_steps": 414, "total_steps": 550, "loss": 1.7523, "lr": 1e-05, "epoch": 0.7525562372188139, "percentage": 75.27, "elapsed_time": "6:03:06", "remaining_time": "1:59:16"}
115
- {"current_steps": 415, "total_steps": 550, "loss": 1.7422, "lr": 1e-05, "epoch": 0.7543740059077483, "percentage": 75.45, "elapsed_time": "6:06:13", "remaining_time": "1:59:08"}
116
- {"current_steps": 416, "total_steps": 550, "loss": 1.7484, "lr": 1e-05, "epoch": 0.7561917745966825, "percentage": 75.64, "elapsed_time": "6:09:21", "remaining_time": "1:58:58"}
117
- {"current_steps": 417, "total_steps": 550, "loss": 1.7543, "lr": 1e-05, "epoch": 0.7580095432856169, "percentage": 75.82, "elapsed_time": "6:12:29", "remaining_time": "1:58:48"}
118
- {"current_steps": 418, "total_steps": 550, "loss": 1.7511, "lr": 1e-05, "epoch": 0.7598273119745512, "percentage": 76.0, "elapsed_time": "6:15:37", "remaining_time": "1:58:37"}
119
- {"current_steps": 419, "total_steps": 550, "loss": 1.747, "lr": 1e-05, "epoch": 0.7616450806634856, "percentage": 76.18, "elapsed_time": "6:18:47", "remaining_time": "1:58:25"}
120
- {"current_steps": 420, "total_steps": 550, "loss": 1.741, "lr": 1e-05, "epoch": 0.7634628493524199, "percentage": 76.36, "elapsed_time": "6:21:57", "remaining_time": "1:58:13"}
121
- {"current_steps": 421, "total_steps": 550, "loss": 1.7427, "lr": 1e-05, "epoch": 0.7652806180413543, "percentage": 76.55, "elapsed_time": "6:25:07", "remaining_time": "1:58:00"}
122
- {"current_steps": 422, "total_steps": 550, "loss": 1.7413, "lr": 1e-05, "epoch": 0.7670983867302885, "percentage": 76.73, "elapsed_time": "6:28:16", "remaining_time": "1:57:46"}
123
- {"current_steps": 423, "total_steps": 550, "loss": 1.7483, "lr": 1e-05, "epoch": 0.7689161554192229, "percentage": 76.91, "elapsed_time": "6:31:27", "remaining_time": "1:57:31"}
124
- {"current_steps": 424, "total_steps": 550, "loss": 1.7463, "lr": 1e-05, "epoch": 0.7707339241081572, "percentage": 77.09, "elapsed_time": "6:34:36", "remaining_time": "1:57:15"}
125
- {"current_steps": 425, "total_steps": 550, "loss": 1.7482, "lr": 1e-05, "epoch": 0.7725516927970916, "percentage": 77.27, "elapsed_time": "6:37:45", "remaining_time": "1:56:59"}
126
- {"current_steps": 426, "total_steps": 550, "loss": 1.7517, "lr": 1e-05, "epoch": 0.7743694614860259, "percentage": 77.45, "elapsed_time": "6:40:53", "remaining_time": "1:56:41"}
127
- {"current_steps": 427, "total_steps": 550, "loss": 1.7437, "lr": 1e-05, "epoch": 0.7761872301749603, "percentage": 77.64, "elapsed_time": "6:44:02", "remaining_time": "1:56:23"}
128
- {"current_steps": 428, "total_steps": 550, "loss": 1.7479, "lr": 1e-05, "epoch": 0.7780049988638945, "percentage": 77.82, "elapsed_time": "6:47:12", "remaining_time": "1:56:04"}
129
- {"current_steps": 429, "total_steps": 550, "loss": 1.7438, "lr": 1e-05, "epoch": 0.7798227675528289, "percentage": 78.0, "elapsed_time": "6:50:20", "remaining_time": "1:55:44"}
130
- {"current_steps": 430, "total_steps": 550, "loss": 1.743, "lr": 1e-05, "epoch": 0.7816405362417632, "percentage": 78.18, "elapsed_time": "6:53:30", "remaining_time": "1:55:23"}
131
- {"current_steps": 431, "total_steps": 550, "loss": 1.7521, "lr": 1e-05, "epoch": 0.7834583049306976, "percentage": 78.36, "elapsed_time": "6:56:39", "remaining_time": "1:55:02"}
132
- {"current_steps": 432, "total_steps": 550, "loss": 1.7489, "lr": 1e-05, "epoch": 0.7852760736196319, "percentage": 78.55, "elapsed_time": "6:59:50", "remaining_time": "1:54:40"}
133
- {"current_steps": 433, "total_steps": 550, "loss": 1.7483, "lr": 1e-05, "epoch": 0.7870938423085663, "percentage": 78.73, "elapsed_time": "7:02:58", "remaining_time": "1:54:17"}
134
- {"current_steps": 434, "total_steps": 550, "loss": 1.7454, "lr": 1e-05, "epoch": 0.7889116109975006, "percentage": 78.91, "elapsed_time": "7:06:07", "remaining_time": "1:53:53"}
135
- {"current_steps": 435, "total_steps": 550, "loss": 1.7447, "lr": 1e-05, "epoch": 0.7907293796864349, "percentage": 79.09, "elapsed_time": "7:09:16", "remaining_time": "1:53:29"}
136
- {"current_steps": 436, "total_steps": 550, "loss": 1.7465, "lr": 1e-05, "epoch": 0.7925471483753692, "percentage": 79.27, "elapsed_time": "7:12:26", "remaining_time": "1:53:04"}
137
- {"current_steps": 437, "total_steps": 550, "loss": 1.7437, "lr": 1e-05, "epoch": 0.7943649170643036, "percentage": 79.45, "elapsed_time": "7:15:35", "remaining_time": "1:52:38"}
138
- {"current_steps": 438, "total_steps": 550, "loss": 1.7432, "lr": 1e-05, "epoch": 0.7961826857532379, "percentage": 79.64, "elapsed_time": "7:18:44", "remaining_time": "1:52:11"}
139
- {"current_steps": 439, "total_steps": 550, "loss": 1.7363, "lr": 1e-05, "epoch": 0.7980004544421723, "percentage": 79.82, "elapsed_time": "7:21:53", "remaining_time": "1:51:43"}
140
- {"current_steps": 440, "total_steps": 550, "loss": 1.7509, "lr": 1e-05, "epoch": 0.7998182231311066, "percentage": 80.0, "elapsed_time": "7:25:03", "remaining_time": "1:51:15"}
141
- {"current_steps": 441, "total_steps": 550, "loss": 1.7446, "lr": 1e-05, "epoch": 0.8016359918200409, "percentage": 80.18, "elapsed_time": "7:28:13", "remaining_time": "1:50:47"}
142
- {"current_steps": 442, "total_steps": 550, "loss": 1.7491, "lr": 1e-05, "epoch": 0.8034537605089752, "percentage": 80.36, "elapsed_time": "7:31:23", "remaining_time": "1:50:17"}
143
- {"current_steps": 443, "total_steps": 550, "loss": 1.7408, "lr": 1e-05, "epoch": 0.8052715291979096, "percentage": 80.55, "elapsed_time": "7:34:32", "remaining_time": "1:49:47"}
144
- {"current_steps": 444, "total_steps": 550, "loss": 1.7485, "lr": 1e-05, "epoch": 0.8070892978868439, "percentage": 80.73, "elapsed_time": "7:37:41", "remaining_time": "1:49:16"}
145
- {"current_steps": 445, "total_steps": 550, "loss": 1.7507, "lr": 1e-05, "epoch": 0.8089070665757783, "percentage": 80.91, "elapsed_time": "7:40:50", "remaining_time": "1:48:44"}
146
- {"current_steps": 446, "total_steps": 550, "loss": 1.7508, "lr": 1e-05, "epoch": 0.8107248352647126, "percentage": 81.09, "elapsed_time": "7:43:59", "remaining_time": "1:48:11"}
147
- {"current_steps": 447, "total_steps": 550, "loss": 1.745, "lr": 1e-05, "epoch": 0.8125426039536469, "percentage": 81.27, "elapsed_time": "7:47:08", "remaining_time": "1:47:38"}
148
- {"current_steps": 448, "total_steps": 550, "loss": 1.7564, "lr": 1e-05, "epoch": 0.8143603726425812, "percentage": 81.45, "elapsed_time": "7:50:18", "remaining_time": "1:47:04"}
149
- {"current_steps": 449, "total_steps": 550, "loss": 1.7491, "lr": 1e-05, "epoch": 0.8161781413315156, "percentage": 81.64, "elapsed_time": "7:53:27", "remaining_time": "1:46:30"}
150
- {"current_steps": 450, "total_steps": 550, "loss": 1.7534, "lr": 1e-05, "epoch": 0.8179959100204499, "percentage": 81.82, "elapsed_time": "7:56:36", "remaining_time": "1:45:54"}
151
- {"current_steps": 451, "total_steps": 550, "loss": 1.734, "lr": 1e-05, "epoch": 0.8198136787093843, "percentage": 82.0, "elapsed_time": "7:59:47", "remaining_time": "1:45:19"}
152
- {"current_steps": 452, "total_steps": 550, "loss": 1.748, "lr": 1e-05, "epoch": 0.8216314473983186, "percentage": 82.18, "elapsed_time": "8:02:56", "remaining_time": "1:44:42"}
153
- {"current_steps": 453, "total_steps": 550, "loss": 1.7581, "lr": 1e-05, "epoch": 0.8234492160872529, "percentage": 82.36, "elapsed_time": "8:06:05", "remaining_time": "1:44:05"}
154
- {"current_steps": 454, "total_steps": 550, "loss": 1.7483, "lr": 1e-05, "epoch": 0.8252669847761872, "percentage": 82.55, "elapsed_time": "8:09:14", "remaining_time": "1:43:27"}
155
- {"current_steps": 455, "total_steps": 550, "loss": 1.753, "lr": 1e-05, "epoch": 0.8270847534651216, "percentage": 82.73, "elapsed_time": "8:12:22", "remaining_time": "1:42:48"}
156
- {"current_steps": 456, "total_steps": 550, "loss": 1.7509, "lr": 1e-05, "epoch": 0.8289025221540559, "percentage": 82.91, "elapsed_time": "8:15:32", "remaining_time": "1:42:08"}
157
- {"current_steps": 457, "total_steps": 550, "loss": 1.7421, "lr": 1e-05, "epoch": 0.8307202908429903, "percentage": 83.09, "elapsed_time": "8:18:43", "remaining_time": "1:41:29"}
158
- {"current_steps": 458, "total_steps": 550, "loss": 1.7531, "lr": 1e-05, "epoch": 0.8325380595319246, "percentage": 83.27, "elapsed_time": "8:21:52", "remaining_time": "1:40:48"}
159
- {"current_steps": 459, "total_steps": 550, "loss": 1.7453, "lr": 1e-05, "epoch": 0.8343558282208589, "percentage": 83.45, "elapsed_time": "8:25:04", "remaining_time": "1:40:08"}
160
- {"current_steps": 460, "total_steps": 550, "loss": 1.7468, "lr": 1e-05, "epoch": 0.8361735969097932, "percentage": 83.64, "elapsed_time": "8:28:16", "remaining_time": "1:39:26"}
161
- {"current_steps": 461, "total_steps": 550, "loss": 1.7496, "lr": 1e-05, "epoch": 0.8379913655987276, "percentage": 83.82, "elapsed_time": "8:31:27", "remaining_time": "1:38:44"}
162
- {"current_steps": 462, "total_steps": 550, "loss": 1.7485, "lr": 1e-05, "epoch": 0.8398091342876619, "percentage": 84.0, "elapsed_time": "8:34:40", "remaining_time": "1:38:01"}
163
- {"current_steps": 463, "total_steps": 550, "loss": 1.7405, "lr": 1e-05, "epoch": 0.8416269029765963, "percentage": 84.18, "elapsed_time": "8:37:50", "remaining_time": "1:37:18"}
164
- {"current_steps": 464, "total_steps": 550, "loss": 1.7464, "lr": 1e-05, "epoch": 0.8434446716655306, "percentage": 84.36, "elapsed_time": "8:40:58", "remaining_time": "1:36:33"}
165
- {"current_steps": 465, "total_steps": 550, "loss": 1.7564, "lr": 1e-05, "epoch": 0.8452624403544649, "percentage": 84.55, "elapsed_time": "8:44:06", "remaining_time": "1:35:48"}
166
- {"current_steps": 466, "total_steps": 550, "loss": 1.745, "lr": 1e-05, "epoch": 0.8470802090433992, "percentage": 84.73, "elapsed_time": "8:47:16", "remaining_time": "1:35:02"}
167
- {"current_steps": 467, "total_steps": 550, "loss": 1.741, "lr": 1e-05, "epoch": 0.8488979777323336, "percentage": 84.91, "elapsed_time": "8:50:27", "remaining_time": "1:34:16"}
168
- {"current_steps": 468, "total_steps": 550, "loss": 1.7553, "lr": 1e-05, "epoch": 0.8507157464212679, "percentage": 85.09, "elapsed_time": "8:53:36", "remaining_time": "1:33:29"}
169
- {"current_steps": 469, "total_steps": 550, "loss": 1.734, "lr": 1e-05, "epoch": 0.8525335151102023, "percentage": 85.27, "elapsed_time": "8:56:45", "remaining_time": "1:32:42"}
170
- {"current_steps": 470, "total_steps": 550, "loss": 1.7443, "lr": 1e-05, "epoch": 0.8543512837991366, "percentage": 85.45, "elapsed_time": "8:59:54", "remaining_time": "1:31:53"}
171
- {"current_steps": 471, "total_steps": 550, "loss": 1.7496, "lr": 1e-05, "epoch": 0.8561690524880708, "percentage": 85.64, "elapsed_time": "9:03:03", "remaining_time": "1:31:05"}
172
- {"current_steps": 472, "total_steps": 550, "loss": 1.7444, "lr": 1e-05, "epoch": 0.8579868211770052, "percentage": 85.82, "elapsed_time": "9:06:13", "remaining_time": "1:30:15"}
173
- {"current_steps": 473, "total_steps": 550, "loss": 1.7436, "lr": 1e-05, "epoch": 0.8598045898659396, "percentage": 86.0, "elapsed_time": "9:09:22", "remaining_time": "1:29:26"}
174
- {"current_steps": 474, "total_steps": 550, "loss": 1.7488, "lr": 1e-05, "epoch": 0.8616223585548739, "percentage": 86.18, "elapsed_time": "9:12:32", "remaining_time": "1:28:35"}
175
- {"current_steps": 475, "total_steps": 550, "loss": 1.7406, "lr": 1e-05, "epoch": 0.8634401272438083, "percentage": 86.36, "elapsed_time": "9:15:40", "remaining_time": "1:27:44"}
176
- {"current_steps": 476, "total_steps": 550, "loss": 1.7463, "lr": 1e-05, "epoch": 0.8652578959327426, "percentage": 86.55, "elapsed_time": "9:18:49", "remaining_time": "1:26:52"}
177
- {"current_steps": 477, "total_steps": 550, "loss": 1.751, "lr": 1e-05, "epoch": 0.8670756646216768, "percentage": 86.73, "elapsed_time": "9:21:58", "remaining_time": "1:26:00"}
178
- {"current_steps": 478, "total_steps": 550, "loss": 1.7402, "lr": 1e-05, "epoch": 0.8688934333106112, "percentage": 86.91, "elapsed_time": "9:25:08", "remaining_time": "1:25:07"}
179
- {"current_steps": 479, "total_steps": 550, "loss": 1.7457, "lr": 1e-05, "epoch": 0.8707112019995455, "percentage": 87.09, "elapsed_time": "9:28:18", "remaining_time": "1:24:14"}
180
- {"current_steps": 480, "total_steps": 550, "loss": 1.7453, "lr": 1e-05, "epoch": 0.8725289706884799, "percentage": 87.27, "elapsed_time": "9:31:27", "remaining_time": "1:23:20"}
181
- {"current_steps": 481, "total_steps": 550, "loss": 1.7386, "lr": 1e-05, "epoch": 0.8743467393774143, "percentage": 87.45, "elapsed_time": "9:34:36", "remaining_time": "1:22:25"}
182
- {"current_steps": 482, "total_steps": 550, "loss": 1.7412, "lr": 1e-05, "epoch": 0.8761645080663486, "percentage": 87.64, "elapsed_time": "9:37:45", "remaining_time": "1:21:30"}
183
- {"current_steps": 483, "total_steps": 550, "loss": 1.7462, "lr": 1e-05, "epoch": 0.8779822767552828, "percentage": 87.82, "elapsed_time": "9:40:55", "remaining_time": "1:20:35"}
184
- {"current_steps": 484, "total_steps": 550, "loss": 1.7443, "lr": 1e-05, "epoch": 0.8798000454442172, "percentage": 88.0, "elapsed_time": "9:44:04", "remaining_time": "1:19:38"}
185
- {"current_steps": 485, "total_steps": 550, "loss": 1.7345, "lr": 1e-05, "epoch": 0.8816178141331515, "percentage": 88.18, "elapsed_time": "9:47:14", "remaining_time": "1:18:42"}
186
- {"current_steps": 486, "total_steps": 550, "loss": 1.7425, "lr": 1e-05, "epoch": 0.8834355828220859, "percentage": 88.36, "elapsed_time": "9:50:23", "remaining_time": "1:17:44"}
187
- {"current_steps": 487, "total_steps": 550, "loss": 1.746, "lr": 1e-05, "epoch": 0.8852533515110202, "percentage": 88.55, "elapsed_time": "9:53:32", "remaining_time": "1:16:46"}
188
- {"current_steps": 488, "total_steps": 550, "loss": 1.7327, "lr": 1e-05, "epoch": 0.8870711201999546, "percentage": 88.73, "elapsed_time": "9:56:41", "remaining_time": "1:15:48"}
189
- {"current_steps": 489, "total_steps": 550, "loss": 1.7385, "lr": 1e-05, "epoch": 0.8888888888888888, "percentage": 88.91, "elapsed_time": "9:59:50", "remaining_time": "1:14:49"}
190
- {"current_steps": 490, "total_steps": 550, "loss": 1.7405, "lr": 1e-05, "epoch": 0.8907066575778232, "percentage": 89.09, "elapsed_time": "10:03:00", "remaining_time": "1:13:50"}
191
- {"current_steps": 491, "total_steps": 550, "loss": 1.748, "lr": 1e-05, "epoch": 0.8925244262667575, "percentage": 89.27, "elapsed_time": "10:06:09", "remaining_time": "1:12:50"}
192
- {"current_steps": 492, "total_steps": 550, "loss": 1.7465, "lr": 1e-05, "epoch": 0.8943421949556919, "percentage": 89.45, "elapsed_time": "10:09:18", "remaining_time": "1:11:49"}
193
- {"current_steps": 493, "total_steps": 550, "loss": 1.7331, "lr": 1e-05, "epoch": 0.8961599636446262, "percentage": 89.64, "elapsed_time": "10:12:28", "remaining_time": "1:10:48"}
194
- {"current_steps": 494, "total_steps": 550, "loss": 1.7383, "lr": 1e-05, "epoch": 0.8979777323335606, "percentage": 89.82, "elapsed_time": "10:15:37", "remaining_time": "1:09:47"}
195
- {"current_steps": 495, "total_steps": 550, "loss": 1.7416, "lr": 1e-05, "epoch": 0.8997955010224948, "percentage": 90.0, "elapsed_time": "10:18:46", "remaining_time": "1:08:45"}
196
- {"current_steps": 496, "total_steps": 550, "loss": 1.742, "lr": 1e-05, "epoch": 0.9016132697114292, "percentage": 90.18, "elapsed_time": "10:21:55", "remaining_time": "1:07:42"}
197
- {"current_steps": 497, "total_steps": 550, "loss": 1.7397, "lr": 1e-05, "epoch": 0.9034310384003635, "percentage": 90.36, "elapsed_time": "10:25:05", "remaining_time": "1:06:39"}
198
- {"current_steps": 498, "total_steps": 550, "loss": 1.7511, "lr": 1e-05, "epoch": 0.9052488070892979, "percentage": 90.55, "elapsed_time": "10:28:14", "remaining_time": "1:05:35"}
199
- {"current_steps": 499, "total_steps": 550, "loss": 1.7468, "lr": 1e-05, "epoch": 0.9070665757782322, "percentage": 90.73, "elapsed_time": "10:31:23", "remaining_time": "1:04:31"}
200
- {"current_steps": 500, "total_steps": 550, "loss": 1.7327, "lr": 1e-05, "epoch": 0.9088843444671666, "percentage": 90.91, "elapsed_time": "10:34:32", "remaining_time": "1:03:27"}
201
- {"current_steps": 501, "total_steps": 550, "loss": 1.7454, "lr": 1e-05, "epoch": 0.9107021131561008, "percentage": 91.09, "elapsed_time": "10:40:46", "remaining_time": "1:02:40"}
202
- {"current_steps": 502, "total_steps": 550, "loss": 1.7476, "lr": 1e-05, "epoch": 0.9125198818450352, "percentage": 91.27, "elapsed_time": "10:43:57", "remaining_time": "1:01:34"}
203
- {"current_steps": 503, "total_steps": 550, "loss": 1.7461, "lr": 1e-05, "epoch": 0.9143376505339695, "percentage": 91.45, "elapsed_time": "10:47:05", "remaining_time": "1:00:27"}
204
- {"current_steps": 504, "total_steps": 550, "loss": 1.7361, "lr": 1e-05, "epoch": 0.9161554192229039, "percentage": 91.64, "elapsed_time": "10:50:12", "remaining_time": "0:59:20"}
205
- {"current_steps": 505, "total_steps": 550, "loss": 1.7441, "lr": 1e-05, "epoch": 0.9179731879118382, "percentage": 91.82, "elapsed_time": "10:53:22", "remaining_time": "0:58:13"}
206
- {"current_steps": 506, "total_steps": 550, "loss": 1.742, "lr": 1e-05, "epoch": 0.9197909566007726, "percentage": 92.0, "elapsed_time": "10:56:30", "remaining_time": "0:57:05"}
207
- {"current_steps": 507, "total_steps": 550, "loss": 1.7391, "lr": 1e-05, "epoch": 0.9216087252897068, "percentage": 92.18, "elapsed_time": "10:59:38", "remaining_time": "0:55:56"}
208
- {"current_steps": 508, "total_steps": 550, "loss": 1.7405, "lr": 1e-05, "epoch": 0.9234264939786412, "percentage": 92.36, "elapsed_time": "11:02:46", "remaining_time": "0:54:47"}
209
- {"current_steps": 509, "total_steps": 550, "loss": 1.7458, "lr": 1e-05, "epoch": 0.9252442626675755, "percentage": 92.55, "elapsed_time": "11:05:55", "remaining_time": "0:53:38"}
210
- {"current_steps": 510, "total_steps": 550, "loss": 1.7351, "lr": 1e-05, "epoch": 0.9270620313565099, "percentage": 92.73, "elapsed_time": "11:09:04", "remaining_time": "0:52:28"}
211
- {"current_steps": 511, "total_steps": 550, "loss": 1.7397, "lr": 1e-05, "epoch": 0.9288798000454442, "percentage": 92.91, "elapsed_time": "11:12:12", "remaining_time": "0:51:18"}
212
- {"current_steps": 512, "total_steps": 550, "loss": 1.7471, "lr": 1e-05, "epoch": 0.9306975687343786, "percentage": 93.09, "elapsed_time": "11:15:21", "remaining_time": "0:50:07"}
213
- {"current_steps": 513, "total_steps": 550, "loss": 1.7454, "lr": 1e-05, "epoch": 0.9325153374233128, "percentage": 93.27, "elapsed_time": "11:18:34", "remaining_time": "0:48:56"}
214
- {"current_steps": 514, "total_steps": 550, "loss": 1.7375, "lr": 1e-05, "epoch": 0.9343331061122472, "percentage": 93.45, "elapsed_time": "11:21:43", "remaining_time": "0:47:44"}
215
- {"current_steps": 515, "total_steps": 550, "loss": 1.7394, "lr": 1e-05, "epoch": 0.9361508748011815, "percentage": 93.64, "elapsed_time": "11:24:53", "remaining_time": "0:46:32"}
216
- {"current_steps": 516, "total_steps": 550, "loss": 1.7452, "lr": 1e-05, "epoch": 0.9379686434901159, "percentage": 93.82, "elapsed_time": "11:28:03", "remaining_time": "0:45:20"}
217
- {"current_steps": 517, "total_steps": 550, "loss": 1.7441, "lr": 1e-05, "epoch": 0.9397864121790502, "percentage": 94.0, "elapsed_time": "11:31:12", "remaining_time": "0:44:07"}
218
- {"current_steps": 518, "total_steps": 550, "loss": 1.7417, "lr": 1e-05, "epoch": 0.9416041808679846, "percentage": 94.18, "elapsed_time": "11:34:21", "remaining_time": "0:42:53"}
219
- {"current_steps": 519, "total_steps": 550, "loss": 1.7428, "lr": 1e-05, "epoch": 0.9434219495569189, "percentage": 94.36, "elapsed_time": "11:37:32", "remaining_time": "0:41:39"}
220
- {"current_steps": 520, "total_steps": 550, "loss": 1.7345, "lr": 1e-05, "epoch": 0.9452397182458532, "percentage": 94.55, "elapsed_time": "11:40:42", "remaining_time": "0:40:25"}
221
- {"current_steps": 521, "total_steps": 550, "loss": 1.7362, "lr": 1e-05, "epoch": 0.9470574869347875, "percentage": 94.73, "elapsed_time": "11:43:51", "remaining_time": "0:39:10"}
222
- {"current_steps": 522, "total_steps": 550, "loss": 1.7355, "lr": 1e-05, "epoch": 0.9488752556237219, "percentage": 94.91, "elapsed_time": "11:47:03", "remaining_time": "0:37:55"}
223
- {"current_steps": 523, "total_steps": 550, "loss": 1.7468, "lr": 1e-05, "epoch": 0.9506930243126562, "percentage": 95.09, "elapsed_time": "11:50:13", "remaining_time": "0:36:39"}
224
- {"current_steps": 524, "total_steps": 550, "loss": 1.7422, "lr": 1e-05, "epoch": 0.9525107930015906, "percentage": 95.27, "elapsed_time": "11:53:21", "remaining_time": "0:35:23"}
225
- {"current_steps": 525, "total_steps": 550, "loss": 1.7393, "lr": 1e-05, "epoch": 0.9543285616905249, "percentage": 95.45, "elapsed_time": "11:56:31", "remaining_time": "0:34:07"}
226
- {"current_steps": 526, "total_steps": 550, "loss": 1.7341, "lr": 1e-05, "epoch": 0.9561463303794592, "percentage": 95.64, "elapsed_time": "11:59:39", "remaining_time": "0:32:50"}
227
- {"current_steps": 527, "total_steps": 550, "loss": 1.7428, "lr": 1e-05, "epoch": 0.9579640990683935, "percentage": 95.82, "elapsed_time": "12:02:49", "remaining_time": "0:31:32"}
228
- {"current_steps": 528, "total_steps": 550, "loss": 1.7496, "lr": 1e-05, "epoch": 0.9597818677573279, "percentage": 96.0, "elapsed_time": "12:05:59", "remaining_time": "0:30:14"}
229
- {"current_steps": 529, "total_steps": 550, "loss": 1.7413, "lr": 1e-05, "epoch": 0.9615996364462622, "percentage": 96.18, "elapsed_time": "12:09:09", "remaining_time": "0:28:56"}
230
- {"current_steps": 530, "total_steps": 550, "loss": 1.7395, "lr": 1e-05, "epoch": 0.9634174051351966, "percentage": 96.36, "elapsed_time": "12:12:19", "remaining_time": "0:27:38"}
231
- {"current_steps": 531, "total_steps": 550, "loss": 1.7342, "lr": 1e-05, "epoch": 0.9652351738241309, "percentage": 96.55, "elapsed_time": "12:15:28", "remaining_time": "0:26:18"}
232
- {"current_steps": 532, "total_steps": 550, "loss": 1.7384, "lr": 1e-05, "epoch": 0.9670529425130652, "percentage": 96.73, "elapsed_time": "12:18:37", "remaining_time": "0:24:59"}
233
- {"current_steps": 533, "total_steps": 550, "loss": 1.7425, "lr": 1e-05, "epoch": 0.9688707112019995, "percentage": 96.91, "elapsed_time": "12:21:45", "remaining_time": "0:23:39"}
234
- {"current_steps": 534, "total_steps": 550, "loss": 1.7521, "lr": 1e-05, "epoch": 0.9706884798909339, "percentage": 97.09, "elapsed_time": "12:24:54", "remaining_time": "0:22:19"}
235
- {"current_steps": 535, "total_steps": 550, "loss": 1.7455, "lr": 1e-05, "epoch": 0.9725062485798682, "percentage": 97.27, "elapsed_time": "12:28:04", "remaining_time": "0:20:58"}
236
- {"current_steps": 536, "total_steps": 550, "loss": 1.7509, "lr": 1e-05, "epoch": 0.9743240172688026, "percentage": 97.45, "elapsed_time": "12:31:14", "remaining_time": "0:19:37"}
237
- {"current_steps": 537, "total_steps": 550, "loss": 1.7392, "lr": 1e-05, "epoch": 0.9761417859577369, "percentage": 97.64, "elapsed_time": "12:34:23", "remaining_time": "0:18:15"}
238
- {"current_steps": 538, "total_steps": 550, "loss": 1.7341, "lr": 1e-05, "epoch": 0.9779595546466712, "percentage": 97.82, "elapsed_time": "12:37:32", "remaining_time": "0:16:53"}
239
- {"current_steps": 539, "total_steps": 550, "loss": 1.7367, "lr": 1e-05, "epoch": 0.9797773233356055, "percentage": 98.0, "elapsed_time": "12:40:42", "remaining_time": "0:15:31"}
240
- {"current_steps": 540, "total_steps": 550, "loss": 1.7423, "lr": 1e-05, "epoch": 0.9815950920245399, "percentage": 98.18, "elapsed_time": "12:43:52", "remaining_time": "0:14:08"}
241
- {"current_steps": 541, "total_steps": 550, "loss": 1.7429, "lr": 1e-05, "epoch": 0.9834128607134742, "percentage": 98.36, "elapsed_time": "12:47:01", "remaining_time": "0:12:45"}
242
- {"current_steps": 542, "total_steps": 550, "loss": 1.7348, "lr": 1e-05, "epoch": 0.9852306294024086, "percentage": 98.55, "elapsed_time": "12:50:10", "remaining_time": "0:11:22"}
243
- {"current_steps": 543, "total_steps": 550, "loss": 1.7382, "lr": 1e-05, "epoch": 0.9870483980913429, "percentage": 98.73, "elapsed_time": "12:53:20", "remaining_time": "0:09:58"}
244
- {"current_steps": 544, "total_steps": 550, "loss": 1.7412, "lr": 1e-05, "epoch": 0.9888661667802772, "percentage": 98.91, "elapsed_time": "12:56:28", "remaining_time": "0:08:33"}
245
- {"current_steps": 545, "total_steps": 550, "loss": 1.7287, "lr": 1e-05, "epoch": 0.9906839354692115, "percentage": 99.09, "elapsed_time": "12:59:38", "remaining_time": "0:07:09"}
246
- {"current_steps": 546, "total_steps": 550, "loss": 1.7345, "lr": 1e-05, "epoch": 0.9925017041581459, "percentage": 99.27, "elapsed_time": "13:02:48", "remaining_time": "0:05:44"}
247
- {"current_steps": 547, "total_steps": 550, "loss": 1.7282, "lr": 1e-05, "epoch": 0.9943194728470802, "percentage": 99.45, "elapsed_time": "13:05:58", "remaining_time": "0:04:18"}
248
- {"current_steps": 548, "total_steps": 550, "loss": 1.7358, "lr": 1e-05, "epoch": 0.9961372415360146, "percentage": 99.64, "elapsed_time": "13:09:08", "remaining_time": "0:02:52"}
249
- {"current_steps": 549, "total_steps": 550, "loss": 1.7371, "lr": 1e-05, "epoch": 0.9979550102249489, "percentage": 99.82, "elapsed_time": "13:12:18", "remaining_time": "0:01:26"}
250
- {"current_steps": 550, "total_steps": 550, "loss": 1.7397, "lr": 1e-05, "epoch": 0.9997727789138832, "percentage": 100.0, "elapsed_time": "13:15:28", "remaining_time": "0:00:00"}
251
- {"current_steps": 550, "total_steps": 550, "epoch": 0.9997727789138832, "percentage": 100.0, "elapsed_time": "13:18:32", "remaining_time": "0:00:00"}
 
1
+ {"current_steps": 551, "total_steps": 2200, "loss": 1.7215, "lr": 1e-05, "epoch": 1.0018177686889342, "percentage": 25.05, "elapsed_time": "0:03:22", "remaining_time": "0:10:07"}
2
+ {"current_steps": 552, "total_steps": 2200, "loss": 1.7231, "lr": 1e-05, "epoch": 1.0036355373778687, "percentage": 25.09, "elapsed_time": "0:06:37", "remaining_time": "0:19:46"}
3
+ {"current_steps": 553, "total_steps": 2200, "loss": 1.72, "lr": 1e-05, "epoch": 1.005453306066803, "percentage": 25.14, "elapsed_time": "0:09:47", "remaining_time": "0:29:08"}
4
+ {"current_steps": 554, "total_steps": 2200, "loss": 1.7254, "lr": 1e-05, "epoch": 1.0072710747557374, "percentage": 25.18, "elapsed_time": "0:12:55", "remaining_time": "0:38:23"}
5
+ {"current_steps": 555, "total_steps": 2200, "loss": 1.7207, "lr": 1e-05, "epoch": 1.0090888434446716, "percentage": 25.23, "elapsed_time": "0:16:03", "remaining_time": "0:47:34"}
6
+ {"current_steps": 556, "total_steps": 2200, "loss": 1.7205, "lr": 1e-05, "epoch": 1.010906612133606, "percentage": 25.27, "elapsed_time": "0:19:12", "remaining_time": "0:56:46"}
7
+ {"current_steps": 557, "total_steps": 2200, "loss": 1.7136, "lr": 1e-05, "epoch": 1.0127243808225403, "percentage": 25.32, "elapsed_time": "0:22:20", "remaining_time": "1:05:53"}
8
+ {"current_steps": 558, "total_steps": 2200, "loss": 1.7201, "lr": 1e-05, "epoch": 1.0145421495114746, "percentage": 25.36, "elapsed_time": "0:25:28", "remaining_time": "1:14:58"}
9
+ {"current_steps": 559, "total_steps": 2200, "loss": 1.7165, "lr": 1e-05, "epoch": 1.016359918200409, "percentage": 25.41, "elapsed_time": "0:28:37", "remaining_time": "1:24:00"}
10
+ {"current_steps": 560, "total_steps": 2200, "loss": 1.7138, "lr": 1e-05, "epoch": 1.0181776868893433, "percentage": 25.45, "elapsed_time": "0:31:46", "remaining_time": "1:33:03"}
11
+ {"current_steps": 561, "total_steps": 2200, "loss": 1.7087, "lr": 1e-05, "epoch": 1.0199954555782778, "percentage": 25.5, "elapsed_time": "0:34:57", "remaining_time": "1:42:06"}
12
+ {"current_steps": 562, "total_steps": 2200, "loss": 1.7211, "lr": 1e-05, "epoch": 1.021813224267212, "percentage": 25.55, "elapsed_time": "0:38:05", "remaining_time": "1:51:01"}
13
+ {"current_steps": 563, "total_steps": 2200, "loss": 1.7132, "lr": 1e-05, "epoch": 1.0236309929561462, "percentage": 25.59, "elapsed_time": "0:41:14", "remaining_time": "1:59:54"}
14
+ {"current_steps": 564, "total_steps": 2200, "loss": 1.7169, "lr": 1e-05, "epoch": 1.0254487616450807, "percentage": 25.64, "elapsed_time": "0:44:22", "remaining_time": "2:08:43"}
15
+ {"current_steps": 565, "total_steps": 2200, "loss": 1.7255, "lr": 1e-05, "epoch": 1.027266530334015, "percentage": 25.68, "elapsed_time": "0:47:30", "remaining_time": "2:17:29"}
16
+ {"current_steps": 566, "total_steps": 2200, "loss": 1.7211, "lr": 1e-05, "epoch": 1.0290842990229494, "percentage": 25.73, "elapsed_time": "0:50:40", "remaining_time": "2:26:17"}
17
+ {"current_steps": 567, "total_steps": 2200, "loss": 1.7143, "lr": 1e-05, "epoch": 1.0309020677118836, "percentage": 25.77, "elapsed_time": "0:53:50", "remaining_time": "2:35:03"}
18
+ {"current_steps": 568, "total_steps": 2200, "loss": 1.7185, "lr": 1e-05, "epoch": 1.032719836400818, "percentage": 25.82, "elapsed_time": "0:57:00", "remaining_time": "2:43:46"}
19
+ {"current_steps": 569, "total_steps": 2200, "loss": 1.722, "lr": 1e-05, "epoch": 1.0345376050897523, "percentage": 25.86, "elapsed_time": "1:00:08", "remaining_time": "2:52:24"}
20
+ {"current_steps": 570, "total_steps": 2200, "loss": 1.7247, "lr": 1e-05, "epoch": 1.0363553737786866, "percentage": 25.91, "elapsed_time": "1:03:17", "remaining_time": "3:01:00"}
21
+ {"current_steps": 571, "total_steps": 2200, "loss": 1.7196, "lr": 1e-05, "epoch": 1.038173142467621, "percentage": 25.95, "elapsed_time": "1:06:28", "remaining_time": "3:09:37"}
22
+ {"current_steps": 572, "total_steps": 2200, "loss": 1.7133, "lr": 1e-05, "epoch": 1.0399909111565553, "percentage": 26.0, "elapsed_time": "1:09:37", "remaining_time": "3:18:10"}
23
+ {"current_steps": 573, "total_steps": 2200, "loss": 1.7169, "lr": 1e-05, "epoch": 1.0418086798454897, "percentage": 26.05, "elapsed_time": "1:12:47", "remaining_time": "3:26:41"}
24
+ {"current_steps": 574, "total_steps": 2200, "loss": 1.7152, "lr": 1e-05, "epoch": 1.043626448534424, "percentage": 26.09, "elapsed_time": "1:15:57", "remaining_time": "3:35:11"}
25
+ {"current_steps": 575, "total_steps": 2200, "loss": 1.7206, "lr": 1e-05, "epoch": 1.0454442172233582, "percentage": 26.14, "elapsed_time": "1:19:06", "remaining_time": "3:43:32"}
26
+ {"current_steps": 576, "total_steps": 2200, "loss": 1.706, "lr": 1e-05, "epoch": 1.0472619859122927, "percentage": 26.18, "elapsed_time": "1:22:15", "remaining_time": "3:51:55"}
27
+ {"current_steps": 577, "total_steps": 2200, "loss": 1.7131, "lr": 1e-05, "epoch": 1.049079754601227, "percentage": 26.23, "elapsed_time": "1:25:23", "remaining_time": "4:00:10"}
28
+ {"current_steps": 578, "total_steps": 2200, "loss": 1.7191, "lr": 1e-05, "epoch": 1.0508975232901614, "percentage": 26.27, "elapsed_time": "1:28:31", "remaining_time": "4:08:25"}
29
+ {"current_steps": 579, "total_steps": 2200, "loss": 1.7066, "lr": 1e-05, "epoch": 1.0527152919790956, "percentage": 26.32, "elapsed_time": "1:31:40", "remaining_time": "4:16:39"}
30
+ {"current_steps": 580, "total_steps": 2200, "loss": 1.7223, "lr": 1e-05, "epoch": 1.05453306066803, "percentage": 26.36, "elapsed_time": "1:34:49", "remaining_time": "4:24:51"}
31
+ {"current_steps": 581, "total_steps": 2200, "loss": 1.7164, "lr": 1e-05, "epoch": 1.0563508293569643, "percentage": 26.41, "elapsed_time": "1:37:58", "remaining_time": "4:33:00"}
32
+ {"current_steps": 582, "total_steps": 2200, "loss": 1.7082, "lr": 1e-05, "epoch": 1.0581685980458986, "percentage": 26.45, "elapsed_time": "1:41:06", "remaining_time": "4:41:06"}
33
+ {"current_steps": 583, "total_steps": 2200, "loss": 1.7155, "lr": 1e-05, "epoch": 1.059986366734833, "percentage": 26.5, "elapsed_time": "1:44:16", "remaining_time": "4:49:14"}
34
+ {"current_steps": 584, "total_steps": 2200, "loss": 1.7195, "lr": 1e-05, "epoch": 1.0618041354237673, "percentage": 26.55, "elapsed_time": "1:47:26", "remaining_time": "4:57:19"}
35
+ {"current_steps": 585, "total_steps": 2200, "loss": 1.7139, "lr": 1e-05, "epoch": 1.0636219041127017, "percentage": 26.59, "elapsed_time": "1:50:35", "remaining_time": "5:05:19"}
36
+ {"current_steps": 586, "total_steps": 2200, "loss": 1.7076, "lr": 1e-05, "epoch": 1.065439672801636, "percentage": 26.64, "elapsed_time": "1:53:44", "remaining_time": "5:13:15"}
37
+ {"current_steps": 587, "total_steps": 2200, "loss": 1.716, "lr": 1e-05, "epoch": 1.0672574414905702, "percentage": 26.68, "elapsed_time": "1:56:53", "remaining_time": "5:21:12"}
38
+ {"current_steps": 588, "total_steps": 2200, "loss": 1.715, "lr": 1e-05, "epoch": 1.0690752101795047, "percentage": 26.73, "elapsed_time": "2:00:02", "remaining_time": "5:29:05"}
39
+ {"current_steps": 589, "total_steps": 2200, "loss": 1.7197, "lr": 1e-05, "epoch": 1.070892978868439, "percentage": 26.77, "elapsed_time": "2:03:10", "remaining_time": "5:36:53"}
40
+ {"current_steps": 590, "total_steps": 2200, "loss": 1.7139, "lr": 1e-05, "epoch": 1.0727107475573734, "percentage": 26.82, "elapsed_time": "2:06:18", "remaining_time": "5:44:41"}
41
+ {"current_steps": 591, "total_steps": 2200, "loss": 1.7211, "lr": 1e-05, "epoch": 1.0745285162463076, "percentage": 26.86, "elapsed_time": "2:09:27", "remaining_time": "5:52:27"}
42
+ {"current_steps": 592, "total_steps": 2200, "loss": 1.7077, "lr": 1e-05, "epoch": 1.076346284935242, "percentage": 26.91, "elapsed_time": "2:12:37", "remaining_time": "6:00:13"}
43
+ {"current_steps": 593, "total_steps": 2200, "loss": 1.7122, "lr": 1e-05, "epoch": 1.0781640536241763, "percentage": 26.95, "elapsed_time": "2:15:48", "remaining_time": "6:08:01"}
44
+ {"current_steps": 594, "total_steps": 2200, "loss": 1.7185, "lr": 1e-05, "epoch": 1.0799818223131106, "percentage": 27.0, "elapsed_time": "2:18:59", "remaining_time": "6:15:47"}
45
+ {"current_steps": 595, "total_steps": 2200, "loss": 1.7139, "lr": 1e-05, "epoch": 1.081799591002045, "percentage": 27.05, "elapsed_time": "2:22:08", "remaining_time": "6:23:26"}
46
+ {"current_steps": 596, "total_steps": 2200, "loss": 1.7136, "lr": 1e-05, "epoch": 1.0836173596909793, "percentage": 27.09, "elapsed_time": "2:25:18", "remaining_time": "6:31:04"}
47
+ {"current_steps": 597, "total_steps": 2200, "loss": 1.7165, "lr": 1e-05, "epoch": 1.0854351283799137, "percentage": 27.14, "elapsed_time": "2:28:27", "remaining_time": "6:38:38"}
48
+ {"current_steps": 598, "total_steps": 2200, "loss": 1.7177, "lr": 1e-05, "epoch": 1.087252897068848, "percentage": 27.18, "elapsed_time": "2:31:37", "remaining_time": "6:46:12"}
49
+ {"current_steps": 599, "total_steps": 2200, "loss": 1.7129, "lr": 1e-05, "epoch": 1.0890706657577822, "percentage": 27.23, "elapsed_time": "2:34:46", "remaining_time": "6:53:39"}
50
+ {"current_steps": 600, "total_steps": 2200, "loss": 1.7267, "lr": 1e-05, "epoch": 1.0908884344467167, "percentage": 27.27, "elapsed_time": "2:37:55", "remaining_time": "7:01:08"}
51
+ {"current_steps": 601, "total_steps": 2200, "loss": 1.7212, "lr": 1e-05, "epoch": 1.092706203135651, "percentage": 27.32, "elapsed_time": "2:44:27", "remaining_time": "7:17:33"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:66b5fe5da312e27d110644377582e9652cbbff1fc886c823afdc1e606d4b4e85
3
  size 7672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6ca41750297033af1f4e715f9a53c1574c6b50c268cfbdd3aeb59e901d1e27f
3
  size 7672