sedrickkeh commited on
Commit
136c528
·
verified ·
1 Parent(s): e7123b3

Training in progress, epoch 4

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3f5ba80a558c58723fdeedbf78e873e26c4134693ef193510c457c426fd9aae2
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82ccbb889498fbadeade9904cf90b36a3f0b9830e3cb496e7c366184cfbd4c35
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:879d122d9414f741ef71c29e2e71d96196226313c71ea08486a05fc82b78d143
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97a706afd8a0d543eb58b12fc142478580234ed5162234edce0bb41731458870
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9e9e793625087b96ef3183be39d27afcd8b930d03e8c93af75dc98f509d9558
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aeab4e86b44e756bf20a4d77919192758de4b5fb12e1319e24047d543d666816
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:49c6afb095fda3259f6d147f34b6819390483d3e399033bbbc97543fa2663608
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:499bc64fc6e797b1d45271ea76f96e38766e6f49c8e59822767e0a1160a9e7b2
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -1565,3 +1565,387 @@
1565
  {"current_steps": 1565, "total_steps": 1950, "loss": 0.2002, "lr": 4.5646621393177e-06, "epoch": 4.00511836212412, "percentage": 80.26, "elapsed_time": "16:28:17", "remaining_time": "4:03:07"}
1566
  {"current_steps": 1566, "total_steps": 1950, "loss": 0.1689, "lr": 4.541920429589168e-06, "epoch": 4.007677543186181, "percentage": 80.31, "elapsed_time": "16:28:52", "remaining_time": "4:02:29"}
1567
  {"current_steps": 1567, "total_steps": 1950, "loss": 0.162, "lr": 4.519228253578514e-06, "epoch": 4.010236724248241, "percentage": 80.36, "elapsed_time": "16:29:28", "remaining_time": "4:01:50"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1565
  {"current_steps": 1565, "total_steps": 1950, "loss": 0.2002, "lr": 4.5646621393177e-06, "epoch": 4.00511836212412, "percentage": 80.26, "elapsed_time": "16:28:17", "remaining_time": "4:03:07"}
1566
  {"current_steps": 1566, "total_steps": 1950, "loss": 0.1689, "lr": 4.541920429589168e-06, "epoch": 4.007677543186181, "percentage": 80.31, "elapsed_time": "16:28:52", "remaining_time": "4:02:29"}
1567
  {"current_steps": 1567, "total_steps": 1950, "loss": 0.162, "lr": 4.519228253578514e-06, "epoch": 4.010236724248241, "percentage": 80.36, "elapsed_time": "16:29:28", "remaining_time": "4:01:50"}
1568
+ {"current_steps": 1568, "total_steps": 1950, "loss": 0.1905, "lr": 4.496585684000332e-06, "epoch": 4.012795905310301, "percentage": 80.41, "elapsed_time": "16:30:02", "remaining_time": "4:01:11"}
1569
+ {"current_steps": 1569, "total_steps": 1950, "loss": 0.1883, "lr": 4.47399279341024e-06, "epoch": 4.015355086372361, "percentage": 80.46, "elapsed_time": "16:30:39", "remaining_time": "4:00:33"}
1570
+ {"current_steps": 1570, "total_steps": 1950, "loss": 0.1792, "lr": 4.451449654204685e-06, "epoch": 4.017914267434421, "percentage": 80.51, "elapsed_time": "16:31:23", "remaining_time": "3:59:57"}
1571
+ {"current_steps": 1571, "total_steps": 1950, "loss": 0.1549, "lr": 4.428956338620671e-06, "epoch": 4.020473448496481, "percentage": 80.56, "elapsed_time": "16:31:51", "remaining_time": "3:59:17"}
1572
+ {"current_steps": 1572, "total_steps": 1950, "loss": 0.168, "lr": 4.406512918735555e-06, "epoch": 4.023032629558541, "percentage": 80.62, "elapsed_time": "16:32:31", "remaining_time": "3:58:39"}
1573
+ {"current_steps": 1573, "total_steps": 1950, "loss": 0.1546, "lr": 4.384119466466816e-06, "epoch": 4.025591810620601, "percentage": 80.67, "elapsed_time": "16:33:02", "remaining_time": "3:58:00"}
1574
+ {"current_steps": 1574, "total_steps": 1950, "loss": 0.1553, "lr": 4.361776053571816e-06, "epoch": 4.028150991682661, "percentage": 80.72, "elapsed_time": "16:33:41", "remaining_time": "3:57:22"}
1575
+ {"current_steps": 1575, "total_steps": 1950, "loss": 0.1672, "lr": 4.339482751647557e-06, "epoch": 4.030710172744722, "percentage": 80.77, "elapsed_time": "16:34:15", "remaining_time": "3:56:43"}
1576
+ {"current_steps": 1576, "total_steps": 1950, "loss": 0.1694, "lr": 4.317239632130485e-06, "epoch": 4.033269353806782, "percentage": 80.82, "elapsed_time": "16:34:43", "remaining_time": "3:56:03"}
1577
+ {"current_steps": 1577, "total_steps": 1950, "loss": 0.1652, "lr": 4.295046766296224e-06, "epoch": 4.035828534868842, "percentage": 80.87, "elapsed_time": "16:35:24", "remaining_time": "3:55:26"}
1578
+ {"current_steps": 1578, "total_steps": 1950, "loss": 0.1643, "lr": 4.272904225259387e-06, "epoch": 4.038387715930902, "percentage": 80.92, "elapsed_time": "16:35:57", "remaining_time": "3:54:47"}
1579
+ {"current_steps": 1579, "total_steps": 1950, "loss": 0.1693, "lr": 4.250812079973301e-06, "epoch": 4.0409468969929625, "percentage": 80.97, "elapsed_time": "16:36:30", "remaining_time": "3:54:08"}
1580
+ {"current_steps": 1580, "total_steps": 1950, "loss": 0.1676, "lr": 4.228770401229824e-06, "epoch": 4.043506078055023, "percentage": 81.03, "elapsed_time": "16:37:13", "remaining_time": "3:53:31"}
1581
+ {"current_steps": 1581, "total_steps": 1950, "loss": 0.1837, "lr": 4.206779259659102e-06, "epoch": 4.046065259117083, "percentage": 81.08, "elapsed_time": "16:37:54", "remaining_time": "3:52:54"}
1582
+ {"current_steps": 1582, "total_steps": 1950, "loss": 0.1606, "lr": 4.184838725729326e-06, "epoch": 4.048624440179142, "percentage": 81.13, "elapsed_time": "16:38:27", "remaining_time": "3:52:15"}
1583
+ {"current_steps": 1583, "total_steps": 1950, "loss": 0.1701, "lr": 4.1629488697465195e-06, "epoch": 4.0511836212412025, "percentage": 81.18, "elapsed_time": "16:39:12", "remaining_time": "3:51:39"}
1584
+ {"current_steps": 1584, "total_steps": 1950, "loss": 0.1586, "lr": 4.141109761854332e-06, "epoch": 4.053742802303263, "percentage": 81.23, "elapsed_time": "16:39:50", "remaining_time": "3:51:01"}
1585
+ {"current_steps": 1585, "total_steps": 1950, "loss": 0.1787, "lr": 4.119321472033779e-06, "epoch": 4.056301983365323, "percentage": 81.28, "elapsed_time": "16:40:31", "remaining_time": "3:50:24"}
1586
+ {"current_steps": 1586, "total_steps": 1950, "loss": 0.153, "lr": 4.097584070103042e-06, "epoch": 4.058861164427383, "percentage": 81.33, "elapsed_time": "16:41:06", "remaining_time": "3:49:45"}
1587
+ {"current_steps": 1587, "total_steps": 1950, "loss": 0.1593, "lr": 4.075897625717249e-06, "epoch": 4.061420345489443, "percentage": 81.38, "elapsed_time": "16:41:50", "remaining_time": "3:49:09"}
1588
+ {"current_steps": 1588, "total_steps": 1950, "loss": 0.1805, "lr": 4.054262208368216e-06, "epoch": 4.0639795265515035, "percentage": 81.44, "elapsed_time": "16:42:29", "remaining_time": "3:48:31"}
1589
+ {"current_steps": 1589, "total_steps": 1950, "loss": 0.1702, "lr": 4.032677887384262e-06, "epoch": 4.066538707613564, "percentage": 81.49, "elapsed_time": "16:43:05", "remaining_time": "3:47:53"}
1590
+ {"current_steps": 1590, "total_steps": 1950, "loss": 0.1913, "lr": 4.011144731929981e-06, "epoch": 4.069097888675624, "percentage": 81.54, "elapsed_time": "16:43:43", "remaining_time": "3:47:15"}
1591
+ {"current_steps": 1591, "total_steps": 1950, "loss": 0.1727, "lr": 3.989662811005992e-06, "epoch": 4.071657069737684, "percentage": 81.59, "elapsed_time": "16:44:22", "remaining_time": "3:46:37"}
1592
+ {"current_steps": 1592, "total_steps": 1950, "loss": 0.2085, "lr": 3.96823219344876e-06, "epoch": 4.074216250799744, "percentage": 81.64, "elapsed_time": "16:45:05", "remaining_time": "3:46:01"}
1593
+ {"current_steps": 1593, "total_steps": 1950, "loss": 0.1746, "lr": 3.9468529479303445e-06, "epoch": 4.076775431861805, "percentage": 81.69, "elapsed_time": "16:45:40", "remaining_time": "3:45:22"}
1594
+ {"current_steps": 1594, "total_steps": 1950, "loss": 0.1949, "lr": 3.925525142958189e-06, "epoch": 4.079334612923865, "percentage": 81.74, "elapsed_time": "16:46:16", "remaining_time": "3:44:44"}
1595
+ {"current_steps": 1595, "total_steps": 1950, "loss": 0.1665, "lr": 3.904248846874894e-06, "epoch": 4.081893793985924, "percentage": 81.79, "elapsed_time": "16:46:55", "remaining_time": "3:44:06"}
1596
+ {"current_steps": 1596, "total_steps": 1950, "loss": 0.1725, "lr": 3.883024127858017e-06, "epoch": 4.084452975047984, "percentage": 81.85, "elapsed_time": "16:47:33", "remaining_time": "3:43:28"}
1597
+ {"current_steps": 1597, "total_steps": 1950, "loss": 0.1873, "lr": 3.861851053919847e-06, "epoch": 4.0870121561100445, "percentage": 81.9, "elapsed_time": "16:48:13", "remaining_time": "3:42:51"}
1598
+ {"current_steps": 1598, "total_steps": 1950, "loss": 0.1789, "lr": 3.840729692907164e-06, "epoch": 4.089571337172105, "percentage": 81.95, "elapsed_time": "16:48:55", "remaining_time": "3:42:14"}
1599
+ {"current_steps": 1599, "total_steps": 1950, "loss": 0.1587, "lr": 3.819660112501053e-06, "epoch": 4.092130518234165, "percentage": 82.0, "elapsed_time": "16:49:28", "remaining_time": "3:41:35"}
1600
+ {"current_steps": 1600, "total_steps": 1950, "loss": 0.1564, "lr": 3.7986423802166705e-06, "epoch": 4.094689699296225, "percentage": 82.05, "elapsed_time": "16:50:08", "remaining_time": "3:40:58"}
1601
+ {"current_steps": 1601, "total_steps": 1950, "loss": 0.1636, "lr": 3.7776765634030234e-06, "epoch": 4.097248880358285, "percentage": 82.1, "elapsed_time": "16:50:36", "remaining_time": "3:40:18"}
1602
+ {"current_steps": 1602, "total_steps": 1950, "loss": 0.1991, "lr": 3.756762729242773e-06, "epoch": 4.099808061420346, "percentage": 82.15, "elapsed_time": "16:51:11", "remaining_time": "3:39:39"}
1603
+ {"current_steps": 1603, "total_steps": 1950, "loss": 0.165, "lr": 3.7359009447520112e-06, "epoch": 4.102367242482406, "percentage": 82.21, "elapsed_time": "16:51:47", "remaining_time": "3:39:01"}
1604
+ {"current_steps": 1604, "total_steps": 1950, "loss": 0.1897, "lr": 3.715091276780023e-06, "epoch": 4.104926423544466, "percentage": 82.26, "elapsed_time": "16:52:28", "remaining_time": "3:38:24"}
1605
+ {"current_steps": 1605, "total_steps": 1950, "loss": 0.1967, "lr": 3.694333792009115e-06, "epoch": 4.107485604606526, "percentage": 82.31, "elapsed_time": "16:53:02", "remaining_time": "3:37:45"}
1606
+ {"current_steps": 1606, "total_steps": 1950, "loss": 0.1705, "lr": 3.6736285569543585e-06, "epoch": 4.110044785668586, "percentage": 82.36, "elapsed_time": "16:53:36", "remaining_time": "3:37:06"}
1607
+ {"current_steps": 1607, "total_steps": 1950, "loss": 0.1865, "lr": 3.652975637963401e-06, "epoch": 4.112603966730646, "percentage": 82.41, "elapsed_time": "16:54:11", "remaining_time": "3:36:28"}
1608
+ {"current_steps": 1608, "total_steps": 1950, "loss": 0.1804, "lr": 3.632375101216259e-06, "epoch": 4.115163147792706, "percentage": 82.46, "elapsed_time": "16:54:53", "remaining_time": "3:35:51"}
1609
+ {"current_steps": 1609, "total_steps": 1950, "loss": 0.139, "lr": 3.6118270127250954e-06, "epoch": 4.117722328854766, "percentage": 82.51, "elapsed_time": "16:55:27", "remaining_time": "3:35:12"}
1610
+ {"current_steps": 1610, "total_steps": 1950, "loss": 0.1533, "lr": 3.5913314383339937e-06, "epoch": 4.120281509916826, "percentage": 82.56, "elapsed_time": "16:56:03", "remaining_time": "3:34:34"}
1611
+ {"current_steps": 1611, "total_steps": 1950, "loss": 0.1614, "lr": 3.5708884437187673e-06, "epoch": 4.122840690978887, "percentage": 82.62, "elapsed_time": "16:56:41", "remaining_time": "3:33:56"}
1612
+ {"current_steps": 1612, "total_steps": 1950, "loss": 0.1868, "lr": 3.5504980943867538e-06, "epoch": 4.125399872040947, "percentage": 82.67, "elapsed_time": "16:57:25", "remaining_time": "3:33:19"}
1613
+ {"current_steps": 1613, "total_steps": 1950, "loss": 0.1634, "lr": 3.53016045567659e-06, "epoch": 4.127959053103007, "percentage": 82.72, "elapsed_time": "16:58:01", "remaining_time": "3:32:41"}
1614
+ {"current_steps": 1614, "total_steps": 1950, "loss": 0.2041, "lr": 3.509875592757999e-06, "epoch": 4.130518234165067, "percentage": 82.77, "elapsed_time": "16:58:44", "remaining_time": "3:32:04"}
1615
+ {"current_steps": 1615, "total_steps": 1950, "loss": 0.1676, "lr": 3.4896435706316e-06, "epoch": 4.1330774152271275, "percentage": 82.82, "elapsed_time": "16:59:22", "remaining_time": "3:31:26"}
1616
+ {"current_steps": 1616, "total_steps": 1950, "loss": 0.1714, "lr": 3.469464454128684e-06, "epoch": 4.135636596289188, "percentage": 82.87, "elapsed_time": "17:00:02", "remaining_time": "3:30:49"}
1617
+ {"current_steps": 1617, "total_steps": 1950, "loss": 0.2032, "lr": 3.4493383079110054e-06, "epoch": 4.138195777351248, "percentage": 82.92, "elapsed_time": "17:00:38", "remaining_time": "3:30:11"}
1618
+ {"current_steps": 1618, "total_steps": 1950, "loss": 0.1654, "lr": 3.429265196470599e-06, "epoch": 4.140754958413308, "percentage": 82.97, "elapsed_time": "17:01:16", "remaining_time": "3:29:33"}
1619
+ {"current_steps": 1619, "total_steps": 1950, "loss": 0.1753, "lr": 3.409245184129546e-06, "epoch": 4.143314139475368, "percentage": 83.03, "elapsed_time": "17:01:53", "remaining_time": "3:28:55"}
1620
+ {"current_steps": 1620, "total_steps": 1950, "loss": 0.1605, "lr": 3.3892783350397675e-06, "epoch": 4.145873320537428, "percentage": 83.08, "elapsed_time": "17:02:29", "remaining_time": "3:28:17"}
1621
+ {"current_steps": 1621, "total_steps": 1950, "loss": 0.1546, "lr": 3.369364713182848e-06, "epoch": 4.148432501599488, "percentage": 83.13, "elapsed_time": "17:03:07", "remaining_time": "3:27:39"}
1622
+ {"current_steps": 1622, "total_steps": 1950, "loss": 0.1606, "lr": 3.349504382369795e-06, "epoch": 4.150991682661548, "percentage": 83.18, "elapsed_time": "17:03:45", "remaining_time": "3:27:01"}
1623
+ {"current_steps": 1623, "total_steps": 1950, "loss": 0.1802, "lr": 3.329697406240855e-06, "epoch": 4.153550863723608, "percentage": 83.23, "elapsed_time": "17:04:22", "remaining_time": "3:26:23"}
1624
+ {"current_steps": 1624, "total_steps": 1950, "loss": 0.1685, "lr": 3.309943848265311e-06, "epoch": 4.1561100447856685, "percentage": 83.28, "elapsed_time": "17:05:00", "remaining_time": "3:25:45"}
1625
+ {"current_steps": 1625, "total_steps": 1950, "loss": 0.1712, "lr": 3.290243771741275e-06, "epoch": 4.158669225847729, "percentage": 83.33, "elapsed_time": "17:05:38", "remaining_time": "3:25:07"}
1626
+ {"current_steps": 1626, "total_steps": 1950, "loss": 0.1888, "lr": 3.2705972397954655e-06, "epoch": 4.161228406909789, "percentage": 83.38, "elapsed_time": "17:06:17", "remaining_time": "3:24:30"}
1627
+ {"current_steps": 1627, "total_steps": 1950, "loss": 0.1877, "lr": 3.2510043153830486e-06, "epoch": 4.163787587971849, "percentage": 83.44, "elapsed_time": "17:06:51", "remaining_time": "3:23:51"}
1628
+ {"current_steps": 1628, "total_steps": 1950, "loss": 0.1844, "lr": 3.231465061287391e-06, "epoch": 4.166346769033909, "percentage": 83.49, "elapsed_time": "17:07:22", "remaining_time": "3:23:12"}
1629
+ {"current_steps": 1629, "total_steps": 1950, "loss": 0.1489, "lr": 3.211979540119883e-06, "epoch": 4.1689059500959695, "percentage": 83.54, "elapsed_time": "17:08:06", "remaining_time": "3:22:35"}
1630
+ {"current_steps": 1630, "total_steps": 1950, "loss": 0.1651, "lr": 3.1925478143197418e-06, "epoch": 4.17146513115803, "percentage": 83.59, "elapsed_time": "17:08:48", "remaining_time": "3:21:58"}
1631
+ {"current_steps": 1631, "total_steps": 1950, "loss": 0.1809, "lr": 3.1731699461537958e-06, "epoch": 4.17402431222009, "percentage": 83.64, "elapsed_time": "17:09:33", "remaining_time": "3:21:21"}
1632
+ {"current_steps": 1632, "total_steps": 1950, "loss": 0.1608, "lr": 3.153845997716303e-06, "epoch": 4.176583493282149, "percentage": 83.69, "elapsed_time": "17:10:08", "remaining_time": "3:20:43"}
1633
+ {"current_steps": 1633, "total_steps": 1950, "loss": 0.1486, "lr": 3.1345760309287264e-06, "epoch": 4.1791426743442095, "percentage": 83.74, "elapsed_time": "17:10:46", "remaining_time": "3:20:05"}
1634
+ {"current_steps": 1634, "total_steps": 1950, "loss": 0.1742, "lr": 3.1153601075395533e-06, "epoch": 4.18170185540627, "percentage": 83.79, "elapsed_time": "17:11:27", "remaining_time": "3:19:28"}
1635
+ {"current_steps": 1635, "total_steps": 1950, "loss": 0.1892, "lr": 3.0961982891241083e-06, "epoch": 4.18426103646833, "percentage": 83.85, "elapsed_time": "17:12:05", "remaining_time": "3:18:50"}
1636
+ {"current_steps": 1636, "total_steps": 1950, "loss": 0.176, "lr": 3.0770906370843234e-06, "epoch": 4.18682021753039, "percentage": 83.9, "elapsed_time": "17:12:50", "remaining_time": "3:18:14"}
1637
+ {"current_steps": 1637, "total_steps": 1950, "loss": 0.1942, "lr": 3.058037212648579e-06, "epoch": 4.18937939859245, "percentage": 83.95, "elapsed_time": "17:13:29", "remaining_time": "3:17:36"}
1638
+ {"current_steps": 1638, "total_steps": 1950, "loss": 0.1722, "lr": 3.039038076871481e-06, "epoch": 4.1919385796545106, "percentage": 84.0, "elapsed_time": "17:14:04", "remaining_time": "3:16:57"}
1639
+ {"current_steps": 1639, "total_steps": 1950, "loss": 0.1819, "lr": 3.02009329063367e-06, "epoch": 4.194497760716571, "percentage": 84.05, "elapsed_time": "17:14:43", "remaining_time": "3:16:20"}
1640
+ {"current_steps": 1640, "total_steps": 1950, "loss": 0.1855, "lr": 3.001202914641628e-06, "epoch": 4.197056941778631, "percentage": 84.1, "elapsed_time": "17:15:19", "remaining_time": "3:15:42"}
1641
+ {"current_steps": 1641, "total_steps": 1950, "loss": 0.1671, "lr": 2.9823670094275e-06, "epoch": 4.199616122840691, "percentage": 84.15, "elapsed_time": "17:15:55", "remaining_time": "3:15:03"}
1642
+ {"current_steps": 1642, "total_steps": 1950, "loss": 0.1731, "lr": 2.9635856353488645e-06, "epoch": 4.202175303902751, "percentage": 84.21, "elapsed_time": "17:16:40", "remaining_time": "3:14:27"}
1643
+ {"current_steps": 1643, "total_steps": 1950, "loss": 0.1845, "lr": 2.9448588525885746e-06, "epoch": 4.204734484964812, "percentage": 84.26, "elapsed_time": "17:17:22", "remaining_time": "3:13:50"}
1644
+ {"current_steps": 1644, "total_steps": 1950, "loss": 0.1748, "lr": 2.9261867211545603e-06, "epoch": 4.207293666026872, "percentage": 84.31, "elapsed_time": "17:18:01", "remaining_time": "3:13:12"}
1645
+ {"current_steps": 1645, "total_steps": 1950, "loss": 0.1994, "lr": 2.907569300879596e-06, "epoch": 4.209852847088931, "percentage": 84.36, "elapsed_time": "17:18:37", "remaining_time": "3:12:34"}
1646
+ {"current_steps": 1646, "total_steps": 1950, "loss": 0.1788, "lr": 2.889006651421169e-06, "epoch": 4.212412028150991, "percentage": 84.41, "elapsed_time": "17:19:09", "remaining_time": "3:11:55"}
1647
+ {"current_steps": 1647, "total_steps": 1950, "loss": 0.1486, "lr": 2.870498832261257e-06, "epoch": 4.214971209213052, "percentage": 84.46, "elapsed_time": "17:19:44", "remaining_time": "3:11:16"}
1648
+ {"current_steps": 1648, "total_steps": 1950, "loss": 0.1832, "lr": 2.85204590270612e-06, "epoch": 4.217530390275112, "percentage": 84.51, "elapsed_time": "17:20:13", "remaining_time": "3:10:37"}
1649
+ {"current_steps": 1649, "total_steps": 1950, "loss": 0.1626, "lr": 2.8336479218861556e-06, "epoch": 4.220089571337172, "percentage": 84.56, "elapsed_time": "17:20:50", "remaining_time": "3:09:59"}
1650
+ {"current_steps": 1650, "total_steps": 1950, "loss": 0.1686, "lr": 2.815304948755664e-06, "epoch": 4.222648752399232, "percentage": 84.62, "elapsed_time": "17:21:34", "remaining_time": "3:09:22"}
1651
+ {"current_steps": 1651, "total_steps": 1950, "loss": 0.1713, "lr": 2.7970170420926957e-06, "epoch": 4.225207933461292, "percentage": 84.67, "elapsed_time": "17:22:15", "remaining_time": "3:08:45"}
1652
+ {"current_steps": 1652, "total_steps": 1950, "loss": 0.1681, "lr": 2.778784260498828e-06, "epoch": 4.227767114523353, "percentage": 84.72, "elapsed_time": "17:22:46", "remaining_time": "3:08:06"}
1653
+ {"current_steps": 1653, "total_steps": 1950, "loss": 0.1869, "lr": 2.7606066623990145e-06, "epoch": 4.230326295585413, "percentage": 84.77, "elapsed_time": "17:23:31", "remaining_time": "3:07:29"}
1654
+ {"current_steps": 1654, "total_steps": 1950, "loss": 0.174, "lr": 2.742484306041373e-06, "epoch": 4.232885476647473, "percentage": 84.82, "elapsed_time": "17:24:07", "remaining_time": "3:06:51"}
1655
+ {"current_steps": 1655, "total_steps": 1950, "loss": 0.1855, "lr": 2.7244172494969978e-06, "epoch": 4.235444657709533, "percentage": 84.87, "elapsed_time": "17:24:45", "remaining_time": "3:06:13"}
1656
+ {"current_steps": 1656, "total_steps": 1950, "loss": 0.1641, "lr": 2.7064055506597875e-06, "epoch": 4.2380038387715935, "percentage": 84.92, "elapsed_time": "17:25:25", "remaining_time": "3:05:36"}
1657
+ {"current_steps": 1657, "total_steps": 1950, "loss": 0.1923, "lr": 2.688449267246258e-06, "epoch": 4.240563019833653, "percentage": 84.97, "elapsed_time": "17:26:08", "remaining_time": "3:04:59"}
1658
+ {"current_steps": 1658, "total_steps": 1950, "loss": 0.2104, "lr": 2.6705484567953386e-06, "epoch": 4.243122200895713, "percentage": 85.03, "elapsed_time": "17:26:50", "remaining_time": "3:04:21"}
1659
+ {"current_steps": 1659, "total_steps": 1950, "loss": 0.1718, "lr": 2.6527031766682142e-06, "epoch": 4.245681381957773, "percentage": 85.08, "elapsed_time": "17:27:30", "remaining_time": "3:03:44"}
1660
+ {"current_steps": 1660, "total_steps": 1950, "loss": 0.1711, "lr": 2.6349134840481294e-06, "epoch": 4.248240563019833, "percentage": 85.13, "elapsed_time": "17:28:15", "remaining_time": "3:03:07"}
1661
+ {"current_steps": 1661, "total_steps": 1950, "loss": 0.1532, "lr": 2.6171794359401957e-06, "epoch": 4.250799744081894, "percentage": 85.18, "elapsed_time": "17:28:47", "remaining_time": "3:02:28"}
1662
+ {"current_steps": 1662, "total_steps": 1950, "loss": 0.1552, "lr": 2.599501089171217e-06, "epoch": 4.253358925143954, "percentage": 85.23, "elapsed_time": "17:29:22", "remaining_time": "3:01:50"}
1663
+ {"current_steps": 1663, "total_steps": 1950, "loss": 0.1755, "lr": 2.581878500389523e-06, "epoch": 4.255918106206014, "percentage": 85.28, "elapsed_time": "17:29:58", "remaining_time": "3:01:12"}
1664
+ {"current_steps": 1664, "total_steps": 1950, "loss": 0.1898, "lr": 2.564311726064754e-06, "epoch": 4.258477287268074, "percentage": 85.33, "elapsed_time": "17:30:39", "remaining_time": "3:00:34"}
1665
+ {"current_steps": 1665, "total_steps": 1950, "loss": 0.1698, "lr": 2.546800822487714e-06, "epoch": 4.2610364683301345, "percentage": 85.38, "elapsed_time": "17:31:16", "remaining_time": "2:59:56"}
1666
+ {"current_steps": 1666, "total_steps": 1950, "loss": 0.2087, "lr": 2.5293458457701726e-06, "epoch": 4.263595649392195, "percentage": 85.44, "elapsed_time": "17:32:00", "remaining_time": "2:59:20"}
1667
+ {"current_steps": 1667, "total_steps": 1950, "loss": 0.18, "lr": 2.5119468518446844e-06, "epoch": 4.266154830454255, "percentage": 85.49, "elapsed_time": "17:32:36", "remaining_time": "2:58:41"}
1668
+ {"current_steps": 1668, "total_steps": 1950, "loss": 0.1818, "lr": 2.494603896464405e-06, "epoch": 4.268714011516315, "percentage": 85.54, "elapsed_time": "17:33:09", "remaining_time": "2:58:03"}
1669
+ {"current_steps": 1669, "total_steps": 1950, "loss": 0.1888, "lr": 2.47731703520294e-06, "epoch": 4.271273192578375, "percentage": 85.59, "elapsed_time": "17:33:47", "remaining_time": "2:57:25"}
1670
+ {"current_steps": 1670, "total_steps": 1950, "loss": 0.186, "lr": 2.4600863234541338e-06, "epoch": 4.273832373640435, "percentage": 85.64, "elapsed_time": "17:34:22", "remaining_time": "2:56:46"}
1671
+ {"current_steps": 1671, "total_steps": 1950, "loss": 0.1554, "lr": 2.4429118164319076e-06, "epoch": 4.276391554702495, "percentage": 85.69, "elapsed_time": "17:35:05", "remaining_time": "2:56:09"}
1672
+ {"current_steps": 1672, "total_steps": 1950, "loss": 0.2089, "lr": 2.4257935691700897e-06, "epoch": 4.278950735764555, "percentage": 85.74, "elapsed_time": "17:35:45", "remaining_time": "2:55:32"}
1673
+ {"current_steps": 1673, "total_steps": 1950, "loss": 0.1579, "lr": 2.408731636522217e-06, "epoch": 4.281509916826615, "percentage": 85.79, "elapsed_time": "17:36:18", "remaining_time": "2:54:53"}
1674
+ {"current_steps": 1674, "total_steps": 1950, "loss": 0.1903, "lr": 2.3917260731613733e-06, "epoch": 4.2840690978886755, "percentage": 85.85, "elapsed_time": "17:37:04", "remaining_time": "2:54:17"}
1675
+ {"current_steps": 1675, "total_steps": 1950, "loss": 0.1725, "lr": 2.374776933580025e-06, "epoch": 4.286628278950736, "percentage": 85.9, "elapsed_time": "17:37:41", "remaining_time": "2:53:38"}
1676
+ {"current_steps": 1676, "total_steps": 1950, "loss": 0.1867, "lr": 2.35788427208983e-06, "epoch": 4.289187460012796, "percentage": 85.95, "elapsed_time": "17:38:22", "remaining_time": "2:53:01"}
1677
+ {"current_steps": 1677, "total_steps": 1950, "loss": 0.1613, "lr": 2.3410481428214602e-06, "epoch": 4.291746641074856, "percentage": 86.0, "elapsed_time": "17:39:00", "remaining_time": "2:52:23"}
1678
+ {"current_steps": 1678, "total_steps": 1950, "loss": 0.1667, "lr": 2.324268599724451e-06, "epoch": 4.294305822136916, "percentage": 86.05, "elapsed_time": "17:39:40", "remaining_time": "2:51:46"}
1679
+ {"current_steps": 1679, "total_steps": 1950, "loss": 0.1657, "lr": 2.307545696566997e-06, "epoch": 4.296865003198977, "percentage": 86.1, "elapsed_time": "17:40:20", "remaining_time": "2:51:08"}
1680
+ {"current_steps": 1680, "total_steps": 1950, "loss": 0.1897, "lr": 2.2908794869358044e-06, "epoch": 4.299424184261037, "percentage": 86.15, "elapsed_time": "17:41:03", "remaining_time": "2:50:31"}
1681
+ {"current_steps": 1681, "total_steps": 1950, "loss": 0.188, "lr": 2.274270024235912e-06, "epoch": 4.301983365323097, "percentage": 86.21, "elapsed_time": "17:41:39", "remaining_time": "2:49:53"}
1682
+ {"current_steps": 1682, "total_steps": 1950, "loss": 0.1595, "lr": 2.2577173616905256e-06, "epoch": 4.304542546385157, "percentage": 86.26, "elapsed_time": "17:42:14", "remaining_time": "2:49:15"}
1683
+ {"current_steps": 1683, "total_steps": 1950, "loss": 0.1737, "lr": 2.2412215523408266e-06, "epoch": 4.3071017274472165, "percentage": 86.31, "elapsed_time": "17:42:49", "remaining_time": "2:48:36"}
1684
+ {"current_steps": 1684, "total_steps": 1950, "loss": 0.1796, "lr": 2.2247826490458223e-06, "epoch": 4.309660908509277, "percentage": 86.36, "elapsed_time": "17:43:30", "remaining_time": "2:47:59"}
1685
+ {"current_steps": 1685, "total_steps": 1950, "loss": 0.1565, "lr": 2.2084007044821764e-06, "epoch": 4.312220089571337, "percentage": 86.41, "elapsed_time": "17:43:59", "remaining_time": "2:47:20"}
1686
+ {"current_steps": 1686, "total_steps": 1950, "loss": 0.1756, "lr": 2.1920757711440354e-06, "epoch": 4.314779270633397, "percentage": 86.46, "elapsed_time": "17:44:38", "remaining_time": "2:46:42"}
1687
+ {"current_steps": 1687, "total_steps": 1950, "loss": 0.1683, "lr": 2.1758079013428435e-06, "epoch": 4.317338451695457, "percentage": 86.51, "elapsed_time": "17:45:08", "remaining_time": "2:46:03"}
1688
+ {"current_steps": 1688, "total_steps": 1950, "loss": 0.1697, "lr": 2.159597147207213e-06, "epoch": 4.319897632757518, "percentage": 86.56, "elapsed_time": "17:45:54", "remaining_time": "2:45:26"}
1689
+ {"current_steps": 1689, "total_steps": 1950, "loss": 0.1788, "lr": 2.143443560682721e-06, "epoch": 4.322456813819578, "percentage": 86.62, "elapsed_time": "17:46:31", "remaining_time": "2:44:48"}
1690
+ {"current_steps": 1690, "total_steps": 1950, "loss": 0.1704, "lr": 2.127347193531757e-06, "epoch": 4.325015994881638, "percentage": 86.67, "elapsed_time": "17:47:12", "remaining_time": "2:44:11"}
1691
+ {"current_steps": 1691, "total_steps": 1950, "loss": 0.1684, "lr": 2.1113080973333643e-06, "epoch": 4.327575175943698, "percentage": 86.72, "elapsed_time": "17:47:47", "remaining_time": "2:43:32"}
1692
+ {"current_steps": 1692, "total_steps": 1950, "loss": 0.1541, "lr": 2.0953263234830667e-06, "epoch": 4.330134357005758, "percentage": 86.77, "elapsed_time": "17:48:20", "remaining_time": "2:42:54"}
1693
+ {"current_steps": 1693, "total_steps": 1950, "loss": 0.1861, "lr": 2.0794019231926986e-06, "epoch": 4.332693538067819, "percentage": 86.82, "elapsed_time": "17:49:02", "remaining_time": "2:42:16"}
1694
+ {"current_steps": 1694, "total_steps": 1950, "loss": 0.1785, "lr": 2.0635349474902598e-06, "epoch": 4.335252719129878, "percentage": 86.87, "elapsed_time": "17:49:39", "remaining_time": "2:41:38"}
1695
+ {"current_steps": 1695, "total_steps": 1950, "loss": 0.1896, "lr": 2.0477254472197237e-06, "epoch": 4.337811900191938, "percentage": 86.92, "elapsed_time": "17:50:19", "remaining_time": "2:41:01"}
1696
+ {"current_steps": 1696, "total_steps": 1950, "loss": 0.1775, "lr": 2.0319734730408935e-06, "epoch": 4.340371081253998, "percentage": 86.97, "elapsed_time": "17:51:02", "remaining_time": "2:40:24"}
1697
+ {"current_steps": 1697, "total_steps": 1950, "loss": 0.1903, "lr": 2.016279075429246e-06, "epoch": 4.342930262316059, "percentage": 87.03, "elapsed_time": "17:51:40", "remaining_time": "2:39:46"}
1698
+ {"current_steps": 1698, "total_steps": 1950, "loss": 0.1754, "lr": 2.0006423046757596e-06, "epoch": 4.345489443378119, "percentage": 87.08, "elapsed_time": "17:52:21", "remaining_time": "2:39:08"}
1699
+ {"current_steps": 1699, "total_steps": 1950, "loss": 0.1549, "lr": 1.985063210886735e-06, "epoch": 4.348048624440179, "percentage": 87.13, "elapsed_time": "17:52:58", "remaining_time": "2:38:30"}
1700
+ {"current_steps": 1700, "total_steps": 1950, "loss": 0.1362, "lr": 1.96954184398368e-06, "epoch": 4.350607805502239, "percentage": 87.18, "elapsed_time": "17:53:33", "remaining_time": "2:37:52"}
1701
+ {"current_steps": 1701, "total_steps": 1950, "loss": 0.1586, "lr": 1.9540782537031045e-06, "epoch": 4.3531669865642995, "percentage": 87.23, "elapsed_time": "17:54:12", "remaining_time": "2:37:14"}
1702
+ {"current_steps": 1702, "total_steps": 1950, "loss": 0.1612, "lr": 1.9386724895963805e-06, "epoch": 4.35572616762636, "percentage": 87.28, "elapsed_time": "17:54:40", "remaining_time": "2:36:35"}
1703
+ {"current_steps": 1703, "total_steps": 1950, "loss": 0.1822, "lr": 1.9233246010295903e-06, "epoch": 4.35828534868842, "percentage": 87.33, "elapsed_time": "17:55:21", "remaining_time": "2:35:58"}
1704
+ {"current_steps": 1704, "total_steps": 1950, "loss": 0.1815, "lr": 1.908034637183356e-06, "epoch": 4.36084452975048, "percentage": 87.38, "elapsed_time": "17:56:01", "remaining_time": "2:35:20"}
1705
+ {"current_steps": 1705, "total_steps": 1950, "loss": 0.1545, "lr": 1.8928026470526917e-06, "epoch": 4.36340371081254, "percentage": 87.44, "elapsed_time": "17:56:33", "remaining_time": "2:34:41"}
1706
+ {"current_steps": 1706, "total_steps": 1950, "loss": 0.1476, "lr": 1.8776286794468346e-06, "epoch": 4.3659628918746005, "percentage": 87.49, "elapsed_time": "17:57:01", "remaining_time": "2:34:02"}
1707
+ {"current_steps": 1707, "total_steps": 1950, "loss": 0.2037, "lr": 1.8625127829890922e-06, "epoch": 4.36852207293666, "percentage": 87.54, "elapsed_time": "17:57:35", "remaining_time": "2:33:24"}
1708
+ {"current_steps": 1708, "total_steps": 1950, "loss": 0.1719, "lr": 1.8474550061166984e-06, "epoch": 4.37108125399872, "percentage": 87.59, "elapsed_time": "17:58:10", "remaining_time": "2:32:45"}
1709
+ {"current_steps": 1709, "total_steps": 1950, "loss": 0.1664, "lr": 1.8324553970806436e-06, "epoch": 4.37364043506078, "percentage": 87.64, "elapsed_time": "17:58:51", "remaining_time": "2:32:08"}
1710
+ {"current_steps": 1710, "total_steps": 1950, "loss": 0.1953, "lr": 1.817514003945524e-06, "epoch": 4.3761996161228405, "percentage": 87.69, "elapsed_time": "17:59:34", "remaining_time": "2:31:31"}
1711
+ {"current_steps": 1711, "total_steps": 1950, "loss": 0.1641, "lr": 1.802630874589404e-06, "epoch": 4.378758797184901, "percentage": 87.74, "elapsed_time": "18:00:12", "remaining_time": "2:30:53"}
1712
+ {"current_steps": 1712, "total_steps": 1950, "loss": 0.1718, "lr": 1.787806056703627e-06, "epoch": 4.381317978246961, "percentage": 87.79, "elapsed_time": "18:00:53", "remaining_time": "2:30:15"}
1713
+ {"current_steps": 1713, "total_steps": 1950, "loss": 0.1653, "lr": 1.7730395977926917e-06, "epoch": 4.383877159309021, "percentage": 87.85, "elapsed_time": "18:01:25", "remaining_time": "2:29:37"}
1714
+ {"current_steps": 1714, "total_steps": 1950, "loss": 0.1842, "lr": 1.758331545174099e-06, "epoch": 4.386436340371081, "percentage": 87.9, "elapsed_time": "18:01:57", "remaining_time": "2:28:58"}
1715
+ {"current_steps": 1715, "total_steps": 1950, "loss": 0.1586, "lr": 1.743681945978184e-06, "epoch": 4.3889955214331415, "percentage": 87.95, "elapsed_time": "18:02:29", "remaining_time": "2:28:19"}
1716
+ {"current_steps": 1716, "total_steps": 1950, "loss": 0.1761, "lr": 1.7290908471479805e-06, "epoch": 4.391554702495202, "percentage": 88.0, "elapsed_time": "18:03:09", "remaining_time": "2:27:42"}
1717
+ {"current_steps": 1717, "total_steps": 1950, "loss": 0.1831, "lr": 1.7145582954390638e-06, "epoch": 4.394113883557262, "percentage": 88.05, "elapsed_time": "18:03:49", "remaining_time": "2:27:04"}
1718
+ {"current_steps": 1718, "total_steps": 1950, "loss": 0.1796, "lr": 1.7000843374193987e-06, "epoch": 4.396673064619322, "percentage": 88.1, "elapsed_time": "18:04:20", "remaining_time": "2:26:25"}
1719
+ {"current_steps": 1719, "total_steps": 1950, "loss": 0.1812, "lr": 1.6856690194691872e-06, "epoch": 4.399232245681382, "percentage": 88.15, "elapsed_time": "18:05:00", "remaining_time": "2:25:48"}
1720
+ {"current_steps": 1720, "total_steps": 1950, "loss": 0.1618, "lr": 1.6713123877807413e-06, "epoch": 4.401791426743442, "percentage": 88.21, "elapsed_time": "18:05:32", "remaining_time": "2:25:09"}
1721
+ {"current_steps": 1721, "total_steps": 1950, "loss": 0.1485, "lr": 1.6570144883582994e-06, "epoch": 4.404350607805502, "percentage": 88.26, "elapsed_time": "18:06:15", "remaining_time": "2:24:32"}
1722
+ {"current_steps": 1722, "total_steps": 1950, "loss": 0.1628, "lr": 1.6427753670179214e-06, "epoch": 4.406909788867562, "percentage": 88.31, "elapsed_time": "18:06:46", "remaining_time": "2:23:53"}
1723
+ {"current_steps": 1723, "total_steps": 1950, "loss": 0.1887, "lr": 1.6285950693872999e-06, "epoch": 4.409468969929622, "percentage": 88.36, "elapsed_time": "18:07:31", "remaining_time": "2:23:16"}
1724
+ {"current_steps": 1724, "total_steps": 1950, "loss": 0.1629, "lr": 1.614473640905645e-06, "epoch": 4.4120281509916826, "percentage": 88.41, "elapsed_time": "18:08:11", "remaining_time": "2:22:39"}
1725
+ {"current_steps": 1725, "total_steps": 1950, "loss": 0.2008, "lr": 1.6004111268235156e-06, "epoch": 4.414587332053743, "percentage": 88.46, "elapsed_time": "18:08:54", "remaining_time": "2:22:01"}
1726
+ {"current_steps": 1726, "total_steps": 1950, "loss": 0.191, "lr": 1.5864075722027017e-06, "epoch": 4.417146513115803, "percentage": 88.51, "elapsed_time": "18:09:37", "remaining_time": "2:21:24"}
1727
+ {"current_steps": 1727, "total_steps": 1950, "loss": 0.2073, "lr": 1.5724630219160553e-06, "epoch": 4.419705694177863, "percentage": 88.56, "elapsed_time": "18:10:15", "remaining_time": "2:20:46"}
1728
+ {"current_steps": 1728, "total_steps": 1950, "loss": 0.1568, "lr": 1.5585775206473508e-06, "epoch": 4.422264875239923, "percentage": 88.62, "elapsed_time": "18:10:48", "remaining_time": "2:20:08"}
1729
+ {"current_steps": 1729, "total_steps": 1950, "loss": 0.1728, "lr": 1.5447511128911542e-06, "epoch": 4.424824056301984, "percentage": 88.67, "elapsed_time": "18:11:25", "remaining_time": "2:19:30"}
1730
+ {"current_steps": 1730, "total_steps": 1950, "loss": 0.1904, "lr": 1.5309838429526714e-06, "epoch": 4.427383237364044, "percentage": 88.72, "elapsed_time": "18:12:01", "remaining_time": "2:18:52"}
1731
+ {"current_steps": 1731, "total_steps": 1950, "loss": 0.166, "lr": 1.5172757549476024e-06, "epoch": 4.429942418426104, "percentage": 88.77, "elapsed_time": "18:12:43", "remaining_time": "2:18:14"}
1732
+ {"current_steps": 1732, "total_steps": 1950, "loss": 0.195, "lr": 1.5036268928020125e-06, "epoch": 4.432501599488164, "percentage": 88.82, "elapsed_time": "18:13:26", "remaining_time": "2:17:37"}
1733
+ {"current_steps": 1733, "total_steps": 1950, "loss": 0.1706, "lr": 1.4900373002521851e-06, "epoch": 4.435060780550224, "percentage": 88.87, "elapsed_time": "18:14:00", "remaining_time": "2:16:59"}
1734
+ {"current_steps": 1734, "total_steps": 1950, "loss": 0.1909, "lr": 1.4765070208444732e-06, "epoch": 4.437619961612284, "percentage": 88.92, "elapsed_time": "18:14:36", "remaining_time": "2:16:21"}
1735
+ {"current_steps": 1735, "total_steps": 1950, "loss": 0.1955, "lr": 1.4630360979351644e-06, "epoch": 4.440179142674344, "percentage": 88.97, "elapsed_time": "18:15:14", "remaining_time": "2:15:43"}
1736
+ {"current_steps": 1736, "total_steps": 1950, "loss": 0.1668, "lr": 1.4496245746903626e-06, "epoch": 4.442738323736404, "percentage": 89.03, "elapsed_time": "18:15:51", "remaining_time": "2:15:05"}
1737
+ {"current_steps": 1737, "total_steps": 1950, "loss": 0.173, "lr": 1.4362724940858109e-06, "epoch": 4.445297504798464, "percentage": 89.08, "elapsed_time": "18:16:30", "remaining_time": "2:14:27"}
1738
+ {"current_steps": 1738, "total_steps": 1950, "loss": 0.1639, "lr": 1.422979898906789e-06, "epoch": 4.447856685860525, "percentage": 89.13, "elapsed_time": "18:17:15", "remaining_time": "2:13:50"}
1739
+ {"current_steps": 1739, "total_steps": 1950, "loss": 0.1633, "lr": 1.4097468317479623e-06, "epoch": 4.450415866922585, "percentage": 89.18, "elapsed_time": "18:17:49", "remaining_time": "2:13:12"}
1740
+ {"current_steps": 1740, "total_steps": 1950, "loss": 0.1808, "lr": 1.396573335013236e-06, "epoch": 4.452975047984645, "percentage": 89.23, "elapsed_time": "18:18:27", "remaining_time": "2:12:34"}
1741
+ {"current_steps": 1741, "total_steps": 1950, "loss": 0.1673, "lr": 1.3834594509156319e-06, "epoch": 4.455534229046705, "percentage": 89.28, "elapsed_time": "18:19:08", "remaining_time": "2:11:56"}
1742
+ {"current_steps": 1742, "total_steps": 1950, "loss": 0.1971, "lr": 1.3704052214771513e-06, "epoch": 4.4580934101087655, "percentage": 89.33, "elapsed_time": "18:19:49", "remaining_time": "2:11:19"}
1743
+ {"current_steps": 1743, "total_steps": 1950, "loss": 0.1737, "lr": 1.3574106885286465e-06, "epoch": 4.460652591170826, "percentage": 89.38, "elapsed_time": "18:20:26", "remaining_time": "2:10:41"}
1744
+ {"current_steps": 1744, "total_steps": 1950, "loss": 0.1904, "lr": 1.344475893709658e-06, "epoch": 4.463211772232885, "percentage": 89.44, "elapsed_time": "18:21:06", "remaining_time": "2:10:03"}
1745
+ {"current_steps": 1745, "total_steps": 1950, "loss": 0.1613, "lr": 1.3316008784683265e-06, "epoch": 4.465770953294945, "percentage": 89.49, "elapsed_time": "18:21:40", "remaining_time": "2:09:25"}
1746
+ {"current_steps": 1746, "total_steps": 1950, "loss": 0.1627, "lr": 1.3187856840612167e-06, "epoch": 4.468330134357005, "percentage": 89.54, "elapsed_time": "18:22:20", "remaining_time": "2:08:47"}
1747
+ {"current_steps": 1747, "total_steps": 1950, "loss": 0.1644, "lr": 1.3060303515532135e-06, "epoch": 4.470889315419066, "percentage": 89.59, "elapsed_time": "18:23:02", "remaining_time": "2:08:10"}
1748
+ {"current_steps": 1748, "total_steps": 1950, "loss": 0.1748, "lr": 1.2933349218173774e-06, "epoch": 4.473448496481126, "percentage": 89.64, "elapsed_time": "18:23:38", "remaining_time": "2:07:32"}
1749
+ {"current_steps": 1749, "total_steps": 1950, "loss": 0.1717, "lr": 1.2806994355348224e-06, "epoch": 4.476007677543186, "percentage": 89.69, "elapsed_time": "18:24:13", "remaining_time": "2:06:54"}
1750
+ {"current_steps": 1750, "total_steps": 1950, "loss": 0.1739, "lr": 1.2681239331945695e-06, "epoch": 4.478566858605246, "percentage": 89.74, "elapsed_time": "18:24:44", "remaining_time": "2:06:15"}
1751
+ {"current_steps": 1751, "total_steps": 1950, "loss": 0.163, "lr": 1.2556084550934423e-06, "epoch": 4.4811260396673065, "percentage": 89.79, "elapsed_time": "18:25:22", "remaining_time": "2:05:37"}
1752
+ {"current_steps": 1752, "total_steps": 1950, "loss": 0.1596, "lr": 1.2431530413359138e-06, "epoch": 4.483685220729367, "percentage": 89.85, "elapsed_time": "18:25:59", "remaining_time": "2:04:59"}
1753
+ {"current_steps": 1753, "total_steps": 1950, "loss": 0.1764, "lr": 1.2307577318339825e-06, "epoch": 4.486244401791427, "percentage": 89.9, "elapsed_time": "18:26:38", "remaining_time": "2:04:21"}
1754
+ {"current_steps": 1754, "total_steps": 1950, "loss": 0.1904, "lr": 1.2184225663070604e-06, "epoch": 4.488803582853487, "percentage": 89.95, "elapsed_time": "18:27:21", "remaining_time": "2:03:44"}
1755
+ {"current_steps": 1755, "total_steps": 1950, "loss": 0.1785, "lr": 1.2061475842818337e-06, "epoch": 4.491362763915547, "percentage": 90.0, "elapsed_time": "18:27:55", "remaining_time": "2:03:06"}
1756
+ {"current_steps": 1756, "total_steps": 1950, "loss": 0.1804, "lr": 1.1939328250921278e-06, "epoch": 4.4939219449776076, "percentage": 90.05, "elapsed_time": "18:28:40", "remaining_time": "2:02:29"}
1757
+ {"current_steps": 1757, "total_steps": 1950, "loss": 0.1534, "lr": 1.1817783278788042e-06, "epoch": 4.496481126039667, "percentage": 90.1, "elapsed_time": "18:29:19", "remaining_time": "2:01:51"}
1758
+ {"current_steps": 1758, "total_steps": 1950, "loss": 0.1791, "lr": 1.169684131589608e-06, "epoch": 4.499040307101727, "percentage": 90.15, "elapsed_time": "18:29:57", "remaining_time": "2:01:13"}
1759
+ {"current_steps": 1759, "total_steps": 1950, "loss": 0.1721, "lr": 1.1576502749790608e-06, "epoch": 4.501599488163787, "percentage": 90.21, "elapsed_time": "18:30:38", "remaining_time": "2:00:35"}
1760
+ {"current_steps": 1760, "total_steps": 1950, "loss": 0.1739, "lr": 1.1456767966083393e-06, "epoch": 4.5041586692258475, "percentage": 90.26, "elapsed_time": "18:31:23", "remaining_time": "1:59:58"}
1761
+ {"current_steps": 1761, "total_steps": 1950, "loss": 0.1836, "lr": 1.1337637348451369e-06, "epoch": 4.506717850287908, "percentage": 90.31, "elapsed_time": "18:32:06", "remaining_time": "1:59:21"}
1762
+ {"current_steps": 1762, "total_steps": 1950, "loss": 0.1746, "lr": 1.1219111278635575e-06, "epoch": 4.509277031349968, "percentage": 90.36, "elapsed_time": "18:32:44", "remaining_time": "1:58:43"}
1763
+ {"current_steps": 1763, "total_steps": 1950, "loss": 0.1664, "lr": 1.1101190136439689e-06, "epoch": 4.511836212412028, "percentage": 90.41, "elapsed_time": "18:33:18", "remaining_time": "1:58:05"}
1764
+ {"current_steps": 1764, "total_steps": 1950, "loss": 0.1552, "lr": 1.0983874299729092e-06, "epoch": 4.514395393474088, "percentage": 90.46, "elapsed_time": "18:33:49", "remaining_time": "1:57:26"}
1765
+ {"current_steps": 1765, "total_steps": 1950, "loss": 0.155, "lr": 1.086716414442952e-06, "epoch": 4.516954574536149, "percentage": 90.51, "elapsed_time": "18:34:29", "remaining_time": "1:56:48"}
1766
+ {"current_steps": 1766, "total_steps": 1950, "loss": 0.1947, "lr": 1.0751060044525797e-06, "epoch": 4.519513755598209, "percentage": 90.56, "elapsed_time": "18:35:04", "remaining_time": "1:56:10"}
1767
+ {"current_steps": 1767, "total_steps": 1950, "loss": 0.179, "lr": 1.0635562372060825e-06, "epoch": 4.522072936660269, "percentage": 90.62, "elapsed_time": "18:35:44", "remaining_time": "1:55:33"}
1768
+ {"current_steps": 1768, "total_steps": 1950, "loss": 0.1595, "lr": 1.052067149713416e-06, "epoch": 4.524632117722329, "percentage": 90.67, "elapsed_time": "18:36:22", "remaining_time": "1:54:55"}
1769
+ {"current_steps": 1769, "total_steps": 1950, "loss": 0.2022, "lr": 1.0406387787900974e-06, "epoch": 4.527191298784389, "percentage": 90.72, "elapsed_time": "18:37:05", "remaining_time": "1:54:17"}
1770
+ {"current_steps": 1770, "total_steps": 1950, "loss": 0.1965, "lr": 1.0292711610570904e-06, "epoch": 4.529750479846449, "percentage": 90.77, "elapsed_time": "18:37:41", "remaining_time": "1:53:39"}
1771
+ {"current_steps": 1771, "total_steps": 1950, "loss": 0.1796, "lr": 1.0179643329406752e-06, "epoch": 4.532309660908509, "percentage": 90.82, "elapsed_time": "18:38:15", "remaining_time": "1:53:01"}
1772
+ {"current_steps": 1772, "total_steps": 1950, "loss": 0.1872, "lr": 1.0067183306723384e-06, "epoch": 4.534868841970569, "percentage": 90.87, "elapsed_time": "18:38:48", "remaining_time": "1:52:23"}
1773
+ {"current_steps": 1773, "total_steps": 1950, "loss": 0.1645, "lr": 9.955331902886645e-07, "epoch": 4.537428023032629, "percentage": 90.92, "elapsed_time": "18:39:17", "remaining_time": "1:51:44"}
1774
+ {"current_steps": 1774, "total_steps": 1950, "loss": 0.1736, "lr": 9.844089476312035e-07, "epoch": 4.53998720409469, "percentage": 90.97, "elapsed_time": "18:40:01", "remaining_time": "1:51:07"}
1775
+ {"current_steps": 1775, "total_steps": 1950, "loss": 0.156, "lr": 9.733456383463658e-07, "epoch": 4.54254638515675, "percentage": 91.03, "elapsed_time": "18:40:32", "remaining_time": "1:50:28"}
1776
+ {"current_steps": 1776, "total_steps": 1950, "loss": 0.1709, "lr": 9.62343297885313e-07, "epoch": 4.54510556621881, "percentage": 91.08, "elapsed_time": "18:41:10", "remaining_time": "1:49:50"}
1777
+ {"current_steps": 1777, "total_steps": 1950, "loss": 0.1609, "lr": 9.514019615038395e-07, "epoch": 4.54766474728087, "percentage": 91.13, "elapsed_time": "18:41:48", "remaining_time": "1:49:12"}
1778
+ {"current_steps": 1778, "total_steps": 1950, "loss": 0.1823, "lr": 9.40521664262255e-07, "epoch": 4.55022392834293, "percentage": 91.18, "elapsed_time": "18:42:28", "remaining_time": "1:48:35"}
1779
+ {"current_steps": 1779, "total_steps": 1950, "loss": 0.1719, "lr": 9.297024410252753e-07, "epoch": 4.552783109404991, "percentage": 91.23, "elapsed_time": "18:43:08", "remaining_time": "1:47:57"}
1780
+ {"current_steps": 1780, "total_steps": 1950, "loss": 0.2187, "lr": 9.189443264619102e-07, "epoch": 4.555342290467051, "percentage": 91.28, "elapsed_time": "18:43:50", "remaining_time": "1:47:20"}
1781
+ {"current_steps": 1781, "total_steps": 1950, "loss": 0.1581, "lr": 9.082473550453619e-07, "epoch": 4.557901471529111, "percentage": 91.33, "elapsed_time": "18:44:24", "remaining_time": "1:46:41"}
1782
+ {"current_steps": 1782, "total_steps": 1950, "loss": 0.1813, "lr": 8.976115610528957e-07, "epoch": 4.560460652591171, "percentage": 91.38, "elapsed_time": "18:45:06", "remaining_time": "1:46:04"}
1783
+ {"current_steps": 1783, "total_steps": 1950, "loss": 0.1637, "lr": 8.870369785657451e-07, "epoch": 4.563019833653231, "percentage": 91.44, "elapsed_time": "18:45:41", "remaining_time": "1:45:26"}
1784
+ {"current_steps": 1784, "total_steps": 1950, "loss": 0.1867, "lr": 8.765236414690026e-07, "epoch": 4.565579014715291, "percentage": 91.49, "elapsed_time": "18:46:25", "remaining_time": "1:44:48"}
1785
+ {"current_steps": 1785, "total_steps": 1950, "loss": 0.1812, "lr": 8.660715834514977e-07, "epoch": 4.568138195777351, "percentage": 91.54, "elapsed_time": "18:46:58", "remaining_time": "1:44:10"}
1786
+ {"current_steps": 1786, "total_steps": 1950, "loss": 0.1551, "lr": 8.556808380057013e-07, "epoch": 4.570697376839411, "percentage": 91.59, "elapsed_time": "18:47:32", "remaining_time": "1:43:32"}
1787
+ {"current_steps": 1787, "total_steps": 1950, "loss": 0.1665, "lr": 8.453514384276196e-07, "epoch": 4.5732565579014715, "percentage": 91.64, "elapsed_time": "18:48:14", "remaining_time": "1:42:54"}
1788
+ {"current_steps": 1788, "total_steps": 1950, "loss": 0.2019, "lr": 8.350834178166755e-07, "epoch": 4.575815738963532, "percentage": 91.69, "elapsed_time": "18:48:55", "remaining_time": "1:42:17"}
1789
+ {"current_steps": 1789, "total_steps": 1950, "loss": 0.1623, "lr": 8.248768090756143e-07, "epoch": 4.578374920025592, "percentage": 91.74, "elapsed_time": "18:49:37", "remaining_time": "1:41:39"}
1790
+ {"current_steps": 1790, "total_steps": 1950, "loss": 0.193, "lr": 8.147316449103959e-07, "epoch": 4.580934101087652, "percentage": 91.79, "elapsed_time": "18:50:15", "remaining_time": "1:41:01"}
1791
+ {"current_steps": 1791, "total_steps": 1950, "loss": 0.1573, "lr": 8.046479578300803e-07, "epoch": 4.583493282149712, "percentage": 91.85, "elapsed_time": "18:50:44", "remaining_time": "1:40:23"}
1792
+ {"current_steps": 1792, "total_steps": 1950, "loss": 0.1534, "lr": 7.946257801467339e-07, "epoch": 4.5860524632117725, "percentage": 91.9, "elapsed_time": "18:51:18", "remaining_time": "1:39:44"}
1793
+ {"current_steps": 1793, "total_steps": 1950, "loss": 0.1785, "lr": 7.846651439753273e-07, "epoch": 4.588611644273833, "percentage": 91.95, "elapsed_time": "18:51:54", "remaining_time": "1:39:06"}
1794
+ {"current_steps": 1794, "total_steps": 1950, "loss": 0.1632, "lr": 7.747660812336221e-07, "epoch": 4.591170825335892, "percentage": 92.0, "elapsed_time": "18:52:27", "remaining_time": "1:38:28"}
1795
+ {"current_steps": 1795, "total_steps": 1950, "loss": 0.1664, "lr": 7.649286236420806e-07, "epoch": 4.593730006397953, "percentage": 92.05, "elapsed_time": "18:53:09", "remaining_time": "1:37:50"}
1796
+ {"current_steps": 1796, "total_steps": 1950, "loss": 0.1649, "lr": 7.551528027237553e-07, "epoch": 4.5962891874600125, "percentage": 92.1, "elapsed_time": "18:53:41", "remaining_time": "1:37:12"}
1797
+ {"current_steps": 1797, "total_steps": 1950, "loss": 0.1897, "lr": 7.454386498041865e-07, "epoch": 4.598848368522073, "percentage": 92.15, "elapsed_time": "18:54:20", "remaining_time": "1:36:34"}
1798
+ {"current_steps": 1798, "total_steps": 1950, "loss": 0.1806, "lr": 7.357861960113121e-07, "epoch": 4.601407549584133, "percentage": 92.21, "elapsed_time": "18:54:59", "remaining_time": "1:35:56"}
1799
+ {"current_steps": 1799, "total_steps": 1950, "loss": 0.1454, "lr": 7.261954722753595e-07, "epoch": 4.603966730646193, "percentage": 92.26, "elapsed_time": "18:55:28", "remaining_time": "1:35:18"}
1800
+ {"current_steps": 1800, "total_steps": 1950, "loss": 0.1956, "lr": 7.166665093287539e-07, "epoch": 4.606525911708253, "percentage": 92.31, "elapsed_time": "18:56:11", "remaining_time": "1:34:40"}
1801
+ {"current_steps": 1801, "total_steps": 1950, "loss": 0.1813, "lr": 7.071993377060038e-07, "epoch": 4.6090850927703135, "percentage": 92.36, "elapsed_time": "18:56:47", "remaining_time": "1:34:02"}
1802
+ {"current_steps": 1802, "total_steps": 1950, "loss": 0.1937, "lr": 6.977939877436224e-07, "epoch": 4.611644273832374, "percentage": 92.41, "elapsed_time": "18:57:27", "remaining_time": "1:33:25"}
1803
+ {"current_steps": 1803, "total_steps": 1950, "loss": 0.159, "lr": 6.884504895800237e-07, "epoch": 4.614203454894434, "percentage": 92.46, "elapsed_time": "18:58:05", "remaining_time": "1:32:47"}
1804
+ {"current_steps": 1804, "total_steps": 1950, "loss": 0.1608, "lr": 6.791688731554158e-07, "epoch": 4.616762635956494, "percentage": 92.51, "elapsed_time": "18:58:43", "remaining_time": "1:32:09"}
1805
+ {"current_steps": 1805, "total_steps": 1950, "loss": 0.1857, "lr": 6.69949168211721e-07, "epoch": 4.619321817018554, "percentage": 92.56, "elapsed_time": "18:59:25", "remaining_time": "1:31:31"}
1806
+ {"current_steps": 1806, "total_steps": 1950, "loss": 0.1918, "lr": 6.607914042924756e-07, "epoch": 4.621880998080615, "percentage": 92.62, "elapsed_time": "19:00:02", "remaining_time": "1:30:53"}
1807
+ {"current_steps": 1807, "total_steps": 1950, "loss": 0.1569, "lr": 6.516956107427241e-07, "epoch": 4.624440179142674, "percentage": 92.67, "elapsed_time": "19:00:46", "remaining_time": "1:30:16"}
1808
+ {"current_steps": 1808, "total_steps": 1950, "loss": 0.1557, "lr": 6.426618167089338e-07, "epoch": 4.626999360204734, "percentage": 92.72, "elapsed_time": "19:01:30", "remaining_time": "1:29:39"}
1809
+ {"current_steps": 1809, "total_steps": 1950, "loss": 0.1733, "lr": 6.336900511389133e-07, "epoch": 4.629558541266794, "percentage": 92.77, "elapsed_time": "19:02:06", "remaining_time": "1:29:01"}
1810
+ {"current_steps": 1810, "total_steps": 1950, "loss": 0.1635, "lr": 6.247803427816945e-07, "epoch": 4.6321177223288545, "percentage": 92.82, "elapsed_time": "19:02:46", "remaining_time": "1:28:23"}
1811
+ {"current_steps": 1811, "total_steps": 1950, "loss": 0.1709, "lr": 6.159327201874598e-07, "epoch": 4.634676903390915, "percentage": 92.87, "elapsed_time": "19:03:22", "remaining_time": "1:27:45"}
1812
+ {"current_steps": 1812, "total_steps": 1950, "loss": 0.1815, "lr": 6.071472117074462e-07, "epoch": 4.637236084452975, "percentage": 92.92, "elapsed_time": "19:03:59", "remaining_time": "1:27:07"}
1813
+ {"current_steps": 1813, "total_steps": 1950, "loss": 0.1527, "lr": 5.984238454938496e-07, "epoch": 4.639795265515035, "percentage": 92.97, "elapsed_time": "19:04:32", "remaining_time": "1:26:29"}
1814
+ {"current_steps": 1814, "total_steps": 1950, "loss": 0.1785, "lr": 5.897626494997366e-07, "epoch": 4.642354446577095, "percentage": 93.03, "elapsed_time": "19:05:14", "remaining_time": "1:25:51"}
1815
+ {"current_steps": 1815, "total_steps": 1950, "loss": 0.1853, "lr": 5.811636514789598e-07, "epoch": 4.644913627639156, "percentage": 93.08, "elapsed_time": "19:05:52", "remaining_time": "1:25:13"}
1816
+ {"current_steps": 1816, "total_steps": 1950, "loss": 0.1646, "lr": 5.726268789860645e-07, "epoch": 4.647472808701216, "percentage": 93.13, "elapsed_time": "19:06:30", "remaining_time": "1:24:35"}
1817
+ {"current_steps": 1817, "total_steps": 1950, "loss": 0.1723, "lr": 5.641523593761977e-07, "epoch": 4.650031989763276, "percentage": 93.18, "elapsed_time": "19:07:12", "remaining_time": "1:23:58"}
1818
+ {"current_steps": 1818, "total_steps": 1950, "loss": 0.184, "lr": 5.557401198050327e-07, "epoch": 4.652591170825336, "percentage": 93.23, "elapsed_time": "19:07:50", "remaining_time": "1:23:20"}
1819
+ {"current_steps": 1819, "total_steps": 1950, "loss": 0.1712, "lr": 5.473901872286602e-07, "epoch": 4.6551503518873965, "percentage": 93.28, "elapsed_time": "19:08:29", "remaining_time": "1:22:42"}
1820
+ {"current_steps": 1820, "total_steps": 1950, "loss": 0.1817, "lr": 5.391025884035239e-07, "epoch": 4.657709532949456, "percentage": 93.33, "elapsed_time": "19:09:07", "remaining_time": "1:22:04"}
1821
+ {"current_steps": 1821, "total_steps": 1950, "loss": 0.1576, "lr": 5.308773498863251e-07, "epoch": 4.660268714011516, "percentage": 93.38, "elapsed_time": "19:09:48", "remaining_time": "1:21:27"}
1822
+ {"current_steps": 1822, "total_steps": 1950, "loss": 0.1929, "lr": 5.22714498033936e-07, "epoch": 4.662827895073576, "percentage": 93.44, "elapsed_time": "19:10:20", "remaining_time": "1:20:48"}
1823
+ {"current_steps": 1823, "total_steps": 1950, "loss": 0.1869, "lr": 5.146140590033199e-07, "epoch": 4.665387076135636, "percentage": 93.49, "elapsed_time": "19:10:55", "remaining_time": "1:20:10"}
1824
+ {"current_steps": 1824, "total_steps": 1950, "loss": 0.1902, "lr": 5.065760587514446e-07, "epoch": 4.667946257197697, "percentage": 93.54, "elapsed_time": "19:11:30", "remaining_time": "1:19:32"}
1825
+ {"current_steps": 1825, "total_steps": 1950, "loss": 0.188, "lr": 4.986005230351954e-07, "epoch": 4.670505438259757, "percentage": 93.59, "elapsed_time": "19:12:11", "remaining_time": "1:18:55"}
1826
+ {"current_steps": 1826, "total_steps": 1950, "loss": 0.184, "lr": 4.906874774113024e-07, "epoch": 4.673064619321817, "percentage": 93.64, "elapsed_time": "19:12:53", "remaining_time": "1:18:17"}
1827
+ {"current_steps": 1827, "total_steps": 1950, "loss": 0.1469, "lr": 4.828369472362493e-07, "epoch": 4.675623800383877, "percentage": 93.69, "elapsed_time": "19:13:29", "remaining_time": "1:17:39"}
1828
+ {"current_steps": 1828, "total_steps": 1950, "loss": 0.162, "lr": 4.750489576662021e-07, "epoch": 4.6781829814459375, "percentage": 93.74, "elapsed_time": "19:14:13", "remaining_time": "1:17:01"}
1829
+ {"current_steps": 1829, "total_steps": 1950, "loss": 0.1543, "lr": 4.6732353365691374e-07, "epoch": 4.680742162507998, "percentage": 93.79, "elapsed_time": "19:14:42", "remaining_time": "1:16:23"}
1830
+ {"current_steps": 1830, "total_steps": 1950, "loss": 0.1561, "lr": 4.5966069996365993e-07, "epoch": 4.683301343570058, "percentage": 93.85, "elapsed_time": "19:15:19", "remaining_time": "1:15:45"}
1831
+ {"current_steps": 1831, "total_steps": 1950, "loss": 0.1673, "lr": 4.5206048114114775e-07, "epoch": 4.685860524632118, "percentage": 93.9, "elapsed_time": "19:15:55", "remaining_time": "1:15:07"}
1832
+ {"current_steps": 1832, "total_steps": 1950, "loss": 0.1807, "lr": 4.4452290154344046e-07, "epoch": 4.688419705694178, "percentage": 93.95, "elapsed_time": "19:16:34", "remaining_time": "1:14:29"}
1833
+ {"current_steps": 1833, "total_steps": 1950, "loss": 0.2129, "lr": 4.3704798532388624e-07, "epoch": 4.690978886756238, "percentage": 94.0, "elapsed_time": "19:17:12", "remaining_time": "1:13:51"}
1834
+ {"current_steps": 1834, "total_steps": 1950, "loss": 0.1604, "lr": 4.296357564350362e-07, "epoch": 4.693538067818298, "percentage": 94.05, "elapsed_time": "19:17:49", "remaining_time": "1:13:13"}
1835
+ {"current_steps": 1835, "total_steps": 1950, "loss": 0.1763, "lr": 4.22286238628562e-07, "epoch": 4.696097248880358, "percentage": 94.1, "elapsed_time": "19:18:23", "remaining_time": "1:12:35"}
1836
+ {"current_steps": 1836, "total_steps": 1950, "loss": 0.154, "lr": 4.1499945545518283e-07, "epoch": 4.698656429942418, "percentage": 94.15, "elapsed_time": "19:19:08", "remaining_time": "1:11:58"}
1837
+ {"current_steps": 1837, "total_steps": 1950, "loss": 0.1616, "lr": 4.077754302645964e-07, "epoch": 4.7012156110044785, "percentage": 94.21, "elapsed_time": "19:19:49", "remaining_time": "1:11:20"}
1838
+ {"current_steps": 1838, "total_steps": 1950, "loss": 0.1809, "lr": 4.006141862054014e-07, "epoch": 4.703774792066539, "percentage": 94.26, "elapsed_time": "19:20:30", "remaining_time": "1:10:42"}
1839
+ {"current_steps": 1839, "total_steps": 1950, "loss": 0.1799, "lr": 3.935157462250128e-07, "epoch": 4.706333973128599, "percentage": 94.31, "elapsed_time": "19:21:12", "remaining_time": "1:10:05"}
1840
+ {"current_steps": 1840, "total_steps": 1950, "loss": 0.1697, "lr": 3.8648013306960664e-07, "epoch": 4.708893154190659, "percentage": 94.36, "elapsed_time": "19:21:40", "remaining_time": "1:09:26"}
1841
+ {"current_steps": 1841, "total_steps": 1950, "loss": 0.1354, "lr": 3.7950736928402674e-07, "epoch": 4.711452335252719, "percentage": 94.41, "elapsed_time": "19:22:12", "remaining_time": "1:08:48"}
1842
+ {"current_steps": 1842, "total_steps": 1950, "loss": 0.1568, "lr": 3.7259747721173134e-07, "epoch": 4.7140115163147795, "percentage": 94.46, "elapsed_time": "19:22:46", "remaining_time": "1:08:10"}
1843
+ {"current_steps": 1843, "total_steps": 1950, "loss": 0.1539, "lr": 3.6575047899471085e-07, "epoch": 4.71657069737684, "percentage": 94.51, "elapsed_time": "19:23:28", "remaining_time": "1:07:32"}
1844
+ {"current_steps": 1844, "total_steps": 1950, "loss": 0.1566, "lr": 3.5896639657342134e-07, "epoch": 4.719129878438899, "percentage": 94.56, "elapsed_time": "19:24:02", "remaining_time": "1:06:54"}
1845
+ {"current_steps": 1845, "total_steps": 1950, "loss": 0.1751, "lr": 3.522452516867048e-07, "epoch": 4.72168905950096, "percentage": 94.62, "elapsed_time": "19:24:46", "remaining_time": "1:06:17"}
1846
+ {"current_steps": 1846, "total_steps": 1950, "loss": 0.1788, "lr": 3.455870658717353e-07, "epoch": 4.7242482405630195, "percentage": 94.67, "elapsed_time": "19:25:22", "remaining_time": "1:05:39"}
1847
+ {"current_steps": 1847, "total_steps": 1950, "loss": 0.1856, "lr": 3.3899186046393526e-07, "epoch": 4.72680742162508, "percentage": 94.72, "elapsed_time": "19:26:02", "remaining_time": "1:05:01"}
1848
+ {"current_steps": 1848, "total_steps": 1950, "loss": 0.1903, "lr": 3.324596565969174e-07, "epoch": 4.72936660268714, "percentage": 94.77, "elapsed_time": "19:26:37", "remaining_time": "1:04:23"}
1849
+ {"current_steps": 1849, "total_steps": 1950, "loss": 0.1625, "lr": 3.2599047520241123e-07, "epoch": 4.7319257837492, "percentage": 94.82, "elapsed_time": "19:27:16", "remaining_time": "1:03:45"}
1850
+ {"current_steps": 1850, "total_steps": 1950, "loss": 0.2058, "lr": 3.1958433701019697e-07, "epoch": 4.73448496481126, "percentage": 94.87, "elapsed_time": "19:27:57", "remaining_time": "1:03:07"}
1851
+ {"current_steps": 1851, "total_steps": 1950, "loss": 0.1868, "lr": 3.1324126254804524e-07, "epoch": 4.737044145873321, "percentage": 94.92, "elapsed_time": "19:28:39", "remaining_time": "1:02:30"}
1852
+ {"current_steps": 1852, "total_steps": 1950, "loss": 0.1794, "lr": 3.069612721416371e-07, "epoch": 4.739603326935381, "percentage": 94.97, "elapsed_time": "19:29:15", "remaining_time": "1:01:52"}
1853
+ {"current_steps": 1853, "total_steps": 1950, "loss": 0.1701, "lr": 3.007443859145087e-07, "epoch": 4.742162507997441, "percentage": 95.03, "elapsed_time": "19:29:56", "remaining_time": "1:01:14"}
1854
+ {"current_steps": 1854, "total_steps": 1950, "loss": 0.193, "lr": 2.9459062378799806e-07, "epoch": 4.744721689059501, "percentage": 95.08, "elapsed_time": "19:30:34", "remaining_time": "1:00:36"}
1855
+ {"current_steps": 1855, "total_steps": 1950, "loss": 0.1645, "lr": 2.8850000548115155e-07, "epoch": 4.747280870121561, "percentage": 95.13, "elapsed_time": "19:31:15", "remaining_time": "0:59:59"}
1856
+ {"current_steps": 1856, "total_steps": 1950, "loss": 0.1711, "lr": 2.8247255051068845e-07, "epoch": 4.749840051183622, "percentage": 95.18, "elapsed_time": "19:31:56", "remaining_time": "0:59:21"}
1857
+ {"current_steps": 1857, "total_steps": 1950, "loss": 0.1699, "lr": 2.7650827819093005e-07, "epoch": 4.752399232245681, "percentage": 95.23, "elapsed_time": "19:32:33", "remaining_time": "0:58:43"}
1858
+ {"current_steps": 1858, "total_steps": 1950, "loss": 0.1648, "lr": 2.706072076337285e-07, "epoch": 4.754958413307741, "percentage": 95.28, "elapsed_time": "19:33:04", "remaining_time": "0:58:05"}
1859
+ {"current_steps": 1859, "total_steps": 1950, "loss": 0.1887, "lr": 2.647693577484156e-07, "epoch": 4.757517594369801, "percentage": 95.33, "elapsed_time": "19:33:47", "remaining_time": "0:57:27"}
1860
+ {"current_steps": 1860, "total_steps": 1950, "loss": 0.1822, "lr": 2.5899474724174313e-07, "epoch": 4.760076775431862, "percentage": 95.38, "elapsed_time": "19:34:24", "remaining_time": "0:56:49"}
1861
+ {"current_steps": 1861, "total_steps": 1950, "loss": 0.1833, "lr": 2.532833946178137e-07, "epoch": 4.762635956493922, "percentage": 95.44, "elapsed_time": "19:34:58", "remaining_time": "0:56:11"}
1862
+ {"current_steps": 1862, "total_steps": 1950, "loss": 0.1634, "lr": 2.4763531817802777e-07, "epoch": 4.765195137555982, "percentage": 95.49, "elapsed_time": "19:35:39", "remaining_time": "0:55:33"}
1863
+ {"current_steps": 1863, "total_steps": 1950, "loss": 0.1716, "lr": 2.4205053602103015e-07, "epoch": 4.767754318618042, "percentage": 95.54, "elapsed_time": "19:36:17", "remaining_time": "0:54:55"}
1864
+ {"current_steps": 1864, "total_steps": 1950, "loss": 0.1804, "lr": 2.365290660426389e-07, "epoch": 4.770313499680102, "percentage": 95.59, "elapsed_time": "19:36:53", "remaining_time": "0:54:17"}
1865
+ {"current_steps": 1865, "total_steps": 1950, "loss": 0.17, "lr": 2.3107092593579905e-07, "epoch": 4.772872680742163, "percentage": 95.64, "elapsed_time": "19:37:22", "remaining_time": "0:53:39"}
1866
+ {"current_steps": 1866, "total_steps": 1950, "loss": 0.1624, "lr": 2.2567613319051997e-07, "epoch": 4.775431861804223, "percentage": 95.69, "elapsed_time": "19:38:04", "remaining_time": "0:53:01"}
1867
+ {"current_steps": 1867, "total_steps": 1950, "loss": 0.1967, "lr": 2.2034470509382234e-07, "epoch": 4.777991042866283, "percentage": 95.74, "elapsed_time": "19:38:48", "remaining_time": "0:52:24"}
1868
+ {"current_steps": 1868, "total_steps": 1950, "loss": 0.1743, "lr": 2.1507665872968264e-07, "epoch": 4.780550223928343, "percentage": 95.79, "elapsed_time": "19:39:24", "remaining_time": "0:51:46"}
1869
+ {"current_steps": 1869, "total_steps": 1950, "loss": 0.1697, "lr": 2.0987201097897757e-07, "epoch": 4.7831094049904035, "percentage": 95.85, "elapsed_time": "19:40:01", "remaining_time": "0:51:08"}
1870
+ {"current_steps": 1870, "total_steps": 1950, "loss": 0.1692, "lr": 2.0473077851942858e-07, "epoch": 4.785668586052463, "percentage": 95.9, "elapsed_time": "19:40:43", "remaining_time": "0:50:30"}
1871
+ {"current_steps": 1871, "total_steps": 1950, "loss": 0.1594, "lr": 1.9965297782554848e-07, "epoch": 4.788227767114523, "percentage": 95.95, "elapsed_time": "19:41:21", "remaining_time": "0:49:52"}
1872
+ {"current_steps": 1872, "total_steps": 1950, "loss": 0.1862, "lr": 1.9463862516859277e-07, "epoch": 4.790786948176583, "percentage": 96.0, "elapsed_time": "19:42:05", "remaining_time": "0:49:15"}
1873
+ {"current_steps": 1873, "total_steps": 1950, "loss": 0.1625, "lr": 1.896877366165062e-07, "epoch": 4.7933461292386434, "percentage": 96.05, "elapsed_time": "19:42:40", "remaining_time": "0:48:37"}
1874
+ {"current_steps": 1874, "total_steps": 1950, "loss": 0.1647, "lr": 1.8480032803386505e-07, "epoch": 4.795905310300704, "percentage": 96.1, "elapsed_time": "19:43:15", "remaining_time": "0:47:59"}
1875
+ {"current_steps": 1875, "total_steps": 1950, "loss": 0.1556, "lr": 1.799764150818306e-07, "epoch": 4.798464491362764, "percentage": 96.15, "elapsed_time": "19:43:53", "remaining_time": "0:47:21"}
1876
+ {"current_steps": 1876, "total_steps": 1950, "loss": 0.1686, "lr": 1.7521601321810687e-07, "epoch": 4.801023672424824, "percentage": 96.21, "elapsed_time": "19:44:25", "remaining_time": "0:46:43"}
1877
+ {"current_steps": 1877, "total_steps": 1950, "loss": 0.1549, "lr": 1.7051913769687623e-07, "epoch": 4.803582853486884, "percentage": 96.26, "elapsed_time": "19:45:04", "remaining_time": "0:46:05"}
1878
+ {"current_steps": 1878, "total_steps": 1950, "loss": 0.1796, "lr": 1.658858035687594e-07, "epoch": 4.8061420345489445, "percentage": 96.31, "elapsed_time": "19:45:39", "remaining_time": "0:45:27"}
1879
+ {"current_steps": 1879, "total_steps": 1950, "loss": 0.1723, "lr": 1.6131602568076887e-07, "epoch": 4.808701215611005, "percentage": 96.36, "elapsed_time": "19:46:15", "remaining_time": "0:44:49"}
1880
+ {"current_steps": 1880, "total_steps": 1950, "loss": 0.1631, "lr": 1.5680981867625566e-07, "epoch": 4.811260396673065, "percentage": 96.41, "elapsed_time": "19:46:49", "remaining_time": "0:44:11"}
1881
+ {"current_steps": 1881, "total_steps": 1950, "loss": 0.1595, "lr": 1.5236719699486256e-07, "epoch": 4.813819577735125, "percentage": 96.46, "elapsed_time": "19:47:31", "remaining_time": "0:43:33"}
1882
+ {"current_steps": 1882, "total_steps": 1950, "loss": 0.174, "lr": 1.479881748724865e-07, "epoch": 4.816378758797185, "percentage": 96.51, "elapsed_time": "19:48:07", "remaining_time": "0:42:55"}
1883
+ {"current_steps": 1883, "total_steps": 1950, "loss": 0.1733, "lr": 1.4367276634122073e-07, "epoch": 4.818937939859245, "percentage": 96.56, "elapsed_time": "19:48:42", "remaining_time": "0:42:17"}
1884
+ {"current_steps": 1884, "total_steps": 1950, "loss": 0.1524, "lr": 1.3942098522931491e-07, "epoch": 4.821497120921305, "percentage": 96.62, "elapsed_time": "19:49:16", "remaining_time": "0:41:39"}
1885
+ {"current_steps": 1885, "total_steps": 1950, "loss": 0.1801, "lr": 1.3523284516113955e-07, "epoch": 4.824056301983365, "percentage": 96.67, "elapsed_time": "19:49:55", "remaining_time": "0:41:01"}
1886
+ {"current_steps": 1886, "total_steps": 1950, "loss": 0.1789, "lr": 1.3110835955712831e-07, "epoch": 4.826615483045425, "percentage": 96.72, "elapsed_time": "19:50:33", "remaining_time": "0:40:24"}
1887
+ {"current_steps": 1887, "total_steps": 1950, "loss": 0.1643, "lr": 1.2704754163374022e-07, "epoch": 4.8291746641074855, "percentage": 96.77, "elapsed_time": "19:51:13", "remaining_time": "0:39:46"}
1888
+ {"current_steps": 1888, "total_steps": 1950, "loss": 0.1417, "lr": 1.2305040440342198e-07, "epoch": 4.831733845169546, "percentage": 96.82, "elapsed_time": "19:51:41", "remaining_time": "0:39:08"}
1889
+ {"current_steps": 1889, "total_steps": 1950, "loss": 0.1862, "lr": 1.1911696067455902e-07, "epoch": 4.834293026231606, "percentage": 96.87, "elapsed_time": "19:52:12", "remaining_time": "0:38:29"}
1890
+ {"current_steps": 1890, "total_steps": 1950, "loss": 0.1671, "lr": 1.1524722305144231e-07, "epoch": 4.836852207293666, "percentage": 96.92, "elapsed_time": "19:52:50", "remaining_time": "0:37:52"}
1891
+ {"current_steps": 1891, "total_steps": 1950, "loss": 0.1583, "lr": 1.114412039342172e-07, "epoch": 4.839411388355726, "percentage": 96.97, "elapsed_time": "19:53:26", "remaining_time": "0:37:14"}
1892
+ {"current_steps": 1892, "total_steps": 1950, "loss": 0.1689, "lr": 1.0769891551885903e-07, "epoch": 4.841970569417787, "percentage": 97.03, "elapsed_time": "19:54:02", "remaining_time": "0:36:36"}
1893
+ {"current_steps": 1893, "total_steps": 1950, "loss": 0.1901, "lr": 1.0402036979711317e-07, "epoch": 4.844529750479847, "percentage": 97.08, "elapsed_time": "19:54:48", "remaining_time": "0:35:58"}
1894
+ {"current_steps": 1894, "total_steps": 1950, "loss": 0.1628, "lr": 1.0040557855648169e-07, "epoch": 4.847088931541906, "percentage": 97.13, "elapsed_time": "19:55:30", "remaining_time": "0:35:20"}
1895
+ {"current_steps": 1895, "total_steps": 1950, "loss": 0.1769, "lr": 9.685455338016347e-08, "epoch": 4.849648112603967, "percentage": 97.18, "elapsed_time": "19:56:10", "remaining_time": "0:34:43"}
1896
+ {"current_steps": 1896, "total_steps": 1950, "loss": 0.163, "lr": 9.336730564702745e-08, "epoch": 4.8522072936660265, "percentage": 97.23, "elapsed_time": "19:56:43", "remaining_time": "0:34:05"}
1897
+ {"current_steps": 1897, "total_steps": 1950, "loss": 0.1748, "lr": 8.994384653157718e-08, "epoch": 4.854766474728087, "percentage": 97.28, "elapsed_time": "19:57:25", "remaining_time": "0:33:27"}
1898
+ {"current_steps": 1898, "total_steps": 1950, "loss": 0.1658, "lr": 8.658418700391302e-08, "epoch": 4.857325655790147, "percentage": 97.33, "elapsed_time": "19:58:08", "remaining_time": "0:32:49"}
1899
+ {"current_steps": 1899, "total_steps": 1950, "loss": 0.166, "lr": 8.328833782969003e-08, "epoch": 4.859884836852207, "percentage": 97.38, "elapsed_time": "19:58:48", "remaining_time": "0:32:11"}
1900
+ {"current_steps": 1900, "total_steps": 1950, "loss": 0.1832, "lr": 8.005630957010014e-08, "epoch": 4.862444017914267, "percentage": 97.44, "elapsed_time": "19:59:26", "remaining_time": "0:31:33"}
1901
+ {"current_steps": 1901, "total_steps": 1950, "loss": 0.1838, "lr": 7.688811258181883e-08, "epoch": 4.865003198976328, "percentage": 97.49, "elapsed_time": "20:00:12", "remaining_time": "0:30:56"}
1902
+ {"current_steps": 1902, "total_steps": 1950, "loss": 0.1898, "lr": 7.378375701698748e-08, "epoch": 4.867562380038388, "percentage": 97.54, "elapsed_time": "20:00:40", "remaining_time": "0:30:18"}
1903
+ {"current_steps": 1903, "total_steps": 1950, "loss": 0.1754, "lr": 7.074325282317329e-08, "epoch": 4.870121561100448, "percentage": 97.59, "elapsed_time": "20:01:19", "remaining_time": "0:29:40"}
1904
+ {"current_steps": 1904, "total_steps": 1950, "loss": 0.1572, "lr": 6.776660974333605e-08, "epoch": 4.872680742162508, "percentage": 97.64, "elapsed_time": "20:01:56", "remaining_time": "0:29:02"}
1905
+ {"current_steps": 1905, "total_steps": 1950, "loss": 0.1766, "lr": 6.485383731580142e-08, "epoch": 4.8752399232245685, "percentage": 97.69, "elapsed_time": "20:02:35", "remaining_time": "0:28:24"}
1906
+ {"current_steps": 1906, "total_steps": 1950, "loss": 0.1794, "lr": 6.200494487422771e-08, "epoch": 4.877799104286629, "percentage": 97.74, "elapsed_time": "20:03:19", "remaining_time": "0:27:46"}
1907
+ {"current_steps": 1907, "total_steps": 1950, "loss": 0.17, "lr": 5.921994154758137e-08, "epoch": 4.880358285348688, "percentage": 97.79, "elapsed_time": "20:03:55", "remaining_time": "0:27:08"}
1908
+ {"current_steps": 1908, "total_steps": 1950, "loss": 0.1415, "lr": 5.649883626009933e-08, "epoch": 4.882917466410748, "percentage": 97.85, "elapsed_time": "20:04:35", "remaining_time": "0:26:30"}
1909
+ {"current_steps": 1909, "total_steps": 1950, "loss": 0.1637, "lr": 5.3841637731260054e-08, "epoch": 4.885476647472808, "percentage": 97.9, "elapsed_time": "20:05:12", "remaining_time": "0:25:53"}
1910
+ {"current_steps": 1910, "total_steps": 1950, "loss": 0.1856, "lr": 5.1248354475768034e-08, "epoch": 4.888035828534869, "percentage": 97.95, "elapsed_time": "20:05:47", "remaining_time": "0:25:15"}
1911
+ {"current_steps": 1911, "total_steps": 1950, "loss": 0.1833, "lr": 4.871899480351605e-08, "epoch": 4.890595009596929, "percentage": 98.0, "elapsed_time": "20:06:27", "remaining_time": "0:24:37"}
1912
+ {"current_steps": 1912, "total_steps": 1950, "loss": 0.1646, "lr": 4.6253566819554066e-08, "epoch": 4.893154190658989, "percentage": 98.05, "elapsed_time": "20:07:01", "remaining_time": "0:23:59"}
1913
+ {"current_steps": 1913, "total_steps": 1950, "loss": 0.1688, "lr": 4.385207842407813e-08, "epoch": 4.895713371721049, "percentage": 98.1, "elapsed_time": "20:07:36", "remaining_time": "0:23:21"}
1914
+ {"current_steps": 1914, "total_steps": 1950, "loss": 0.1889, "lr": 4.151453731239707e-08, "epoch": 4.8982725527831095, "percentage": 98.15, "elapsed_time": "20:08:18", "remaining_time": "0:22:43"}
1915
+ {"current_steps": 1915, "total_steps": 1950, "loss": 0.1771, "lr": 3.924095097489922e-08, "epoch": 4.90083173384517, "percentage": 98.21, "elapsed_time": "20:08:59", "remaining_time": "0:22:05"}
1916
+ {"current_steps": 1916, "total_steps": 1950, "loss": 0.1767, "lr": 3.703132669704568e-08, "epoch": 4.90339091490723, "percentage": 98.26, "elapsed_time": "20:09:37", "remaining_time": "0:21:27"}
1917
+ {"current_steps": 1917, "total_steps": 1950, "loss": 0.1698, "lr": 3.4885671559332645e-08, "epoch": 4.90595009596929, "percentage": 98.31, "elapsed_time": "20:10:18", "remaining_time": "0:20:50"}
1918
+ {"current_steps": 1918, "total_steps": 1950, "loss": 0.1434, "lr": 3.280399243727806e-08, "epoch": 4.90850927703135, "percentage": 98.36, "elapsed_time": "20:10:51", "remaining_time": "0:20:12"}
1919
+ {"current_steps": 1919, "total_steps": 1950, "loss": 0.1738, "lr": 3.078629600139271e-08, "epoch": 4.9110684580934105, "percentage": 98.41, "elapsed_time": "20:11:32", "remaining_time": "0:19:34"}
1920
+ {"current_steps": 1920, "total_steps": 1950, "loss": 0.1698, "lr": 2.8832588717164766e-08, "epoch": 4.91362763915547, "percentage": 98.46, "elapsed_time": "20:12:12", "remaining_time": "0:18:56"}
1921
+ {"current_steps": 1921, "total_steps": 1950, "loss": 0.1803, "lr": 2.694287684503083e-08, "epoch": 4.91618682021753, "percentage": 98.51, "elapsed_time": "20:12:47", "remaining_time": "0:18:18"}
1922
+ {"current_steps": 1922, "total_steps": 1950, "loss": 0.2076, "lr": 2.511716644036932e-08, "epoch": 4.91874600127959, "percentage": 98.56, "elapsed_time": "20:13:22", "remaining_time": "0:17:40"}
1923
+ {"current_steps": 1923, "total_steps": 1950, "loss": 0.1737, "lr": 2.3355463353467168e-08, "epoch": 4.9213051823416505, "percentage": 98.62, "elapsed_time": "20:13:56", "remaining_time": "0:17:02"}
1924
+ {"current_steps": 1924, "total_steps": 1950, "loss": 0.1525, "lr": 2.1657773229508684e-08, "epoch": 4.923864363403711, "percentage": 98.67, "elapsed_time": "20:14:30", "remaining_time": "0:16:24"}
1925
+ {"current_steps": 1925, "total_steps": 1950, "loss": 0.1611, "lr": 2.0024101508555604e-08, "epoch": 4.926423544465771, "percentage": 98.72, "elapsed_time": "20:15:08", "remaining_time": "0:15:46"}
1926
+ {"current_steps": 1926, "total_steps": 1950, "loss": 0.149, "lr": 1.8454453425527098e-08, "epoch": 4.928982725527831, "percentage": 98.77, "elapsed_time": "20:15:45", "remaining_time": "0:15:08"}
1927
+ {"current_steps": 1927, "total_steps": 1950, "loss": 0.1928, "lr": 1.6948834010190874e-08, "epoch": 4.931541906589891, "percentage": 98.82, "elapsed_time": "20:16:21", "remaining_time": "0:14:31"}
1928
+ {"current_steps": 1928, "total_steps": 1950, "loss": 0.1885, "lr": 1.550724808713877e-08, "epoch": 4.9341010876519515, "percentage": 98.87, "elapsed_time": "20:17:00", "remaining_time": "0:13:53"}
1929
+ {"current_steps": 1929, "total_steps": 1950, "loss": 0.1466, "lr": 1.4129700275771208e-08, "epoch": 4.936660268714012, "percentage": 98.92, "elapsed_time": "20:17:24", "remaining_time": "0:13:15"}
1930
+ {"current_steps": 1930, "total_steps": 1950, "loss": 0.1844, "lr": 1.281619499029274e-08, "epoch": 4.939219449776072, "percentage": 98.97, "elapsed_time": "20:18:07", "remaining_time": "0:12:37"}
1931
+ {"current_steps": 1931, "total_steps": 1950, "loss": 0.1687, "lr": 1.1566736439685422e-08, "epoch": 4.941778630838132, "percentage": 99.03, "elapsed_time": "20:18:48", "remaining_time": "0:11:59"}
1932
+ {"current_steps": 1932, "total_steps": 1950, "loss": 0.1398, "lr": 1.0381328627702136e-08, "epoch": 4.944337811900192, "percentage": 99.08, "elapsed_time": "20:19:25", "remaining_time": "0:11:21"}
1933
+ {"current_steps": 1933, "total_steps": 1950, "loss": 0.1665, "lr": 9.259975352848838e-09, "epoch": 4.946896992962252, "percentage": 99.13, "elapsed_time": "20:20:03", "remaining_time": "0:10:43"}
1934
+ {"current_steps": 1934, "total_steps": 1950, "loss": 0.1632, "lr": 8.20268020838455e-09, "epoch": 4.949456174024312, "percentage": 99.18, "elapsed_time": "20:20:40", "remaining_time": "0:10:05"}
1935
+ {"current_steps": 1935, "total_steps": 1950, "loss": 0.1563, "lr": 7.209446582292501e-09, "epoch": 4.952015355086372, "percentage": 99.23, "elapsed_time": "20:21:15", "remaining_time": "0:09:28"}
1936
+ {"current_steps": 1936, "total_steps": 1950, "loss": 0.1467, "lr": 6.2802776572779005e-09, "epoch": 4.954574536148432, "percentage": 99.28, "elapsed_time": "20:21:51", "remaining_time": "0:08:50"}
1937
+ {"current_steps": 1937, "total_steps": 1950, "loss": 0.1586, "lr": 5.415176410765721e-09, "epoch": 4.957133717210493, "percentage": 99.33, "elapsed_time": "20:22:26", "remaining_time": "0:08:12"}
1938
+ {"current_steps": 1938, "total_steps": 1950, "loss": 0.175, "lr": 4.614145614876275e-09, "epoch": 4.959692898272553, "percentage": 99.38, "elapsed_time": "20:23:05", "remaining_time": "0:07:34"}
1939
+ {"current_steps": 1939, "total_steps": 1950, "loss": 0.1893, "lr": 3.877187836422991e-09, "epoch": 4.962252079334613, "percentage": 99.44, "elapsed_time": "20:23:44", "remaining_time": "0:06:56"}
1940
+ {"current_steps": 1940, "total_steps": 1950, "loss": 0.1928, "lr": 3.2043054369057523e-09, "epoch": 4.964811260396673, "percentage": 99.49, "elapsed_time": "20:24:26", "remaining_time": "0:06:18"}
1941
+ {"current_steps": 1941, "total_steps": 1950, "loss": 0.1714, "lr": 2.5955005725064597e-09, "epoch": 4.967370441458733, "percentage": 99.54, "elapsed_time": "20:25:07", "remaining_time": "0:05:40"}
1942
+ {"current_steps": 1942, "total_steps": 1950, "loss": 0.1648, "lr": 2.0507751940690434e-09, "epoch": 4.969929622520794, "percentage": 99.59, "elapsed_time": "20:25:39", "remaining_time": "0:05:02"}
1943
+ {"current_steps": 1943, "total_steps": 1950, "loss": 0.1591, "lr": 1.5701310471083476e-09, "epoch": 4.972488803582854, "percentage": 99.64, "elapsed_time": "20:26:12", "remaining_time": "0:04:25"}
1944
+ {"current_steps": 1944, "total_steps": 1950, "loss": 0.1437, "lr": 1.1535696717945855e-09, "epoch": 4.975047984644913, "percentage": 99.69, "elapsed_time": "20:26:47", "remaining_time": "0:03:47"}
1945
+ {"current_steps": 1945, "total_steps": 1950, "loss": 0.1491, "lr": 8.010924029533406e-10, "epoch": 4.977607165706974, "percentage": 99.74, "elapsed_time": "20:27:16", "remaining_time": "0:03:09"}
1946
+ {"current_steps": 1946, "total_steps": 1950, "loss": 0.1584, "lr": 5.127003700589051e-10, "epoch": 4.980166346769034, "percentage": 99.79, "elapsed_time": "20:27:55", "remaining_time": "0:02:31"}
1947
+ {"current_steps": 1947, "total_steps": 1950, "loss": 0.1975, "lr": 2.8839449723205847e-10, "epoch": 4.982725527831094, "percentage": 99.85, "elapsed_time": "20:28:33", "remaining_time": "0:01:53"}
1948
+ {"current_steps": 1948, "total_steps": 1950, "loss": 0.2008, "lr": 1.2817550323784843e-10, "epoch": 4.985284708893154, "percentage": 99.9, "elapsed_time": "20:29:14", "remaining_time": "0:01:15"}
1949
+ {"current_steps": 1949, "total_steps": 1950, "loss": 0.1795, "lr": 3.2043901478928666e-11, "epoch": 4.987843889955214, "percentage": 99.95, "elapsed_time": "20:29:55", "remaining_time": "0:00:37"}
1950
+ {"current_steps": 1950, "total_steps": 1950, "loss": 0.1707, "lr": 0.0, "epoch": 4.990403071017274, "percentage": 100.0, "elapsed_time": "20:30:33", "remaining_time": "0:00:00"}
1951
+ {"current_steps": 1950, "total_steps": 1950, "epoch": 4.990403071017274, "percentage": 100.0, "elapsed_time": "20:32:05", "remaining_time": "0:00:00"}