CHEMISTral7Bv0.3 / runseed42 /metrics.train.jsonl
Clemspace's picture
Initial model upload
cb9e677
raw
history blame
150 kB
{"lr": 2.3999999999999974e-06, "step": 1, "loss": 2.0899362564086914, "percent_done": 0.2, "peak_allocated_mem": 63.57235288619995, "allocated_mem": 24.13792896270752, "wps": 87.55304532290906, "avg_wps": 87.55304532290906, "eta_in_seconds": 373516.00825977325, "at": "2024-05-26T00:03:21.270750"}
{"lr": 2.646387992434257e-06, "step": 2, "loss": 2.524580478668213, "percent_done": 0.4, "peak_allocated_mem": 64.8545789718628, "allocated_mem": 24.138355255126953, "wps": 5626.73457304892, "avg_wps": 172.42315402895264, "eta_in_seconds": 189283.90553927422, "at": "2024-05-26T00:03:32.919173"}
{"lr": 3.3813362028748325e-06, "step": 3, "loss": 2.1502745151519775, "percent_done": 0.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1372709274292, "wps": 5601.028629241724, "avg_wps": 254.71414615069997, "eta_in_seconds": 127874.29552785555, "at": "2024-05-26T00:03:44.621084"}
{"lr": 4.592269463674938e-06, "step": 4, "loss": 2.0348753929138184, "percent_done": 0.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1399564743042, "wps": 5526.5897570007055, "avg_wps": 334.48025845457653, "eta_in_seconds": 97183.18249988556, "at": "2024-05-26T00:03:56.480504"}
{"lr": 6.258468371008163e-06, "step": 5, "loss": 2.400183916091919, "percent_done": 1.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5562.432567416476, "avg_wps": 411.9081073188292, "eta_in_seconds": 78756.20659947395, "at": "2024-05-26T00:04:08.263517"}
{"lr": 8.351423799612423e-06, "step": 6, "loss": 2.1549015045166016, "percent_done": 1.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.138590335845947, "wps": 5558.27034773041, "avg_wps": 487.07063610458806, "eta_in_seconds": 66468.3551012675, "at": "2024-05-26T00:04:20.055323"}
{"lr": 1.0835324701827431e-05, "step": 7, "loss": 2.195272922515869, "percent_done": 1.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1382474899292, "wps": 5542.565544724134, "avg_wps": 560.0464308757615, "eta_in_seconds": 57690.3024798802, "at": "2024-05-26T00:04:31.880537"}
{"lr": 1.3667670844548846e-05, "step": 8, "loss": 2.157195568084717, "percent_done": 1.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5545.683469111278, "avg_wps": 630.9504489538973, "eta_in_seconds": 51103.39814078808, "at": "2024-05-26T00:04:43.699113"}
{"lr": 1.6799999999999995e-05, "step": 9, "loss": 1.9964332580566406, "percent_done": 1.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1372709274292, "wps": 5545.264269198486, "avg_wps": 699.8652592379805, "eta_in_seconds": 45977.67295241356, "at": "2024-05-26T00:04:55.518644"}
{"lr": 2.017871714788541e-05, "step": 10, "loss": 2.042534351348877, "percent_done": 2.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5535.939583040763, "avg_wps": 766.8561123607292, "eta_in_seconds": 41875.7045583725, "at": "2024-05-26T00:05:07.358144"}
{"lr": 2.37460115010474e-05, "step": 11, "loss": 2.069523811340332, "percent_done": 2.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5536.518620411838, "avg_wps": 832.0175548675699, "eta_in_seconds": 38517.34114564549, "at": "2024-05-26T00:05:19.196394"}
{"lr": 2.7440845664062507e-05, "step": 12, "loss": 2.052086353302002, "percent_done": 2.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.141798496246338, "wps": 5537.652180456069, "avg_wps": 895.4250382708717, "eta_in_seconds": 35716.633590857185, "at": "2024-05-26T00:05:31.032277"}
{"lr": 3.12e-05, "step": 13, "loss": 1.8192474842071533, "percent_done": 2.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.14063787460327, "wps": 5535.187561665465, "avg_wps": 957.1407687539536, "eta_in_seconds": 33345.18081551332, "at": "2024-05-26T00:05:42.873465"}
{"lr": 3.495915433593748e-05, "step": 14, "loss": 1.946042537689209, "percent_done": 2.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.14157009124756, "wps": 5542.429649320902, "avg_wps": 1017.2536778805361, "eta_in_seconds": 31310.27853972571, "at": "2024-05-26T00:05:54.699126"}
{"lr": 3.86539884989526e-05, "step": 15, "loss": 1.7829875946044922, "percent_done": 3.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5543.334775724542, "avg_wps": 1075.8131015326833, "eta_in_seconds": 29545.057552019753, "at": "2024-05-26T00:06:06.522826"}
{"lr": 4.222128285211459e-05, "step": 16, "loss": 2.223297119140625, "percent_done": 3.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1397123336792, "wps": 5542.737882195839, "avg_wps": 1132.8750127130904, "eta_in_seconds": 27999.049889922142, "at": "2024-05-26T00:06:18.347795"}
{"lr": 4.56e-05, "step": 17, "loss": 1.4540331363677979, "percent_done": 3.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1370267868042, "wps": 5544.523580319454, "avg_wps": 1188.502286267241, "eta_in_seconds": 26633.426259040833, "at": "2024-05-26T00:06:30.168902"}
{"lr": 4.873232915545115e-05, "step": 18, "loss": 1.5981942415237427, "percent_done": 3.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5539.665356843985, "avg_wps": 1242.7306282749407, "eta_in_seconds": 25418.50283665127, "at": "2024-05-26T00:06:42.000450"}
{"lr": 5.156467529817257e-05, "step": 19, "loss": 1.4388254880905151, "percent_done": 3.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13890552520752, "wps": 5535.4164015669085, "avg_wps": 1295.6116764956253, "eta_in_seconds": 24330.450683543557, "at": "2024-05-26T00:06:53.841037"}
{"lr": 5.404857620038757e-05, "step": 20, "loss": 2.101304054260254, "percent_done": 4.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13890504837036, "wps": 5535.553625409448, "avg_wps": 1347.2061159255522, "eta_in_seconds": 23350.012762069702, "at": "2024-05-26T00:07:05.681392"}
{"lr": 5.6141531628991836e-05, "step": 21, "loss": 1.871744990348816, "percent_done": 4.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13712167739868, "wps": 5537.535267234748, "avg_wps": 1397.565993168832, "eta_in_seconds": 22461.72570986975, "at": "2024-05-26T00:07:17.517503"}
{"lr": 5.780773053632506e-05, "step": 22, "loss": 1.5911368131637573, "percent_done": 4.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5540.108387338111, "avg_wps": 1446.7377626459229, "eta_in_seconds": 21652.99669976668, "at": "2024-05-26T00:07:29.348185"}
{"lr": 5.9018663797125166e-05, "step": 23, "loss": 1.609352707862854, "percent_done": 4.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792896270752, "wps": 5547.958456519078, "avg_wps": 1494.7807037776133, "eta_in_seconds": 20913.216180137966, "at": "2024-05-26T00:07:41.162052"}
{"lr": 5.975361200756574e-05, "step": 24, "loss": 1.9449068307876587, "percent_done": 4.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5535.518287668786, "avg_wps": 1541.670982436515, "eta_in_seconds": 20234.626165628433, "at": "2024-05-26T00:07:53.002301"}
{"lr": 6e-05, "step": 25, "loss": 1.9009581804275513, "percent_done": 5.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1372709274292, "wps": 5540.029779982879, "avg_wps": 1587.5003088337653, "eta_in_seconds": 19609.19303560257, "at": "2024-05-26T00:08:04.833075"}
{"lr": 5.9999343854031334e-05, "step": 26, "loss": 2.0498569011688232, "percent_done": 5.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5537.299670855712, "avg_wps": 1632.2818262005753, "eta_in_seconds": 19031.066511539313, "at": "2024-05-26T00:08:16.669672"}
{"lr": 5.999737544482728e-05, "step": 27, "loss": 1.349915862083435, "percent_done": 5.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1389799118042, "wps": 5532.232178571703, "avg_wps": 1676.0420801840273, "eta_in_seconds": 18495.07740079915, "at": "2024-05-26T00:08:28.517110"}
{"lr": 5.999409485849245e-05, "step": 28, "loss": 1.783543586730957, "percent_done": 5.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139604091644287, "wps": 5529.9537137257485, "avg_wps": 1718.823329676492, "eta_in_seconds": 17996.60934659413, "at": "2024-05-26T00:08:40.369421"}
{"lr": 5.9989502238530296e-05, "step": 29, "loss": 1.620679259300232, "percent_done": 5.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13735866546631, "wps": 5522.544560390815, "avg_wps": 1760.6392671318408, "eta_in_seconds": 17531.959315143784, "at": "2024-05-26T00:08:52.237600"}
{"lr": 5.99835977858369e-05, "step": 30, "loss": 1.3995318412780762, "percent_done": 6.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1380033493042, "wps": 5539.8447711905565, "avg_wps": 1801.6069794911675, "eta_in_seconds": 17096.914227485657, "at": "2024-05-26T00:09:04.068718"}
{"lr": 5.9976381758692166e-05, "step": 31, "loss": 1.4312913417816162, "percent_done": 6.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5547.84189151848, "avg_wps": 1841.7244829614674, "eta_in_seconds": 16688.915353167442, "at": "2024-05-26T00:09:15.882864"}
{"lr": 5.9967854472748474e-05, "step": 32, "loss": 1.5339837074279785, "percent_done": 6.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817262649536, "wps": 5519.576169787376, "avg_wps": 1880.8898191051344, "eta_in_seconds": 16306.562823861837, "at": "2024-05-26T00:09:27.757474"}
{"lr": 5.9958016301016944e-05, "step": 33, "loss": 1.7230792045593262, "percent_done": 6.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1387357711792, "wps": 5532.143774040797, "avg_wps": 1919.2757446824705, "eta_in_seconds": 15946.281864289082, "at": "2024-05-26T00:09:39.605130"}
{"lr": 5.994686767385109e-05, "step": 34, "loss": 1.7153072357177734, "percent_done": 6.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963747024536, "wps": 5533.034517617992, "avg_wps": 1956.8662360217147, "eta_in_seconds": 15606.470916523655, "at": "2024-05-26T00:09:51.450911"}
{"lr": 5.993440907892797e-05, "step": 35, "loss": 1.494494915008545, "percent_done": 7.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.138137340545654, "wps": 5540.615145675467, "avg_wps": 1993.7108246045661, "eta_in_seconds": 15285.185606615883, "at": "2024-05-26T00:10:03.280422"}
{"lr": 5.9920641061226885e-05, "step": 36, "loss": 1.7100409269332886, "percent_done": 7.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13980770111084, "wps": 5534.4324016424225, "avg_wps": 2029.782447507116, "eta_in_seconds": 14981.262665536668, "at": "2024-05-26T00:10:15.123147"}
{"lr": 5.9905564223005546e-05, "step": 37, "loss": 1.5540026426315308, "percent_done": 7.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1370267868042, "wps": 5525.468940137315, "avg_wps": 2065.0927280221586, "eta_in_seconds": 14693.3682871767, "at": "2024-05-26T00:10:26.985070"}
{"lr": 5.988917922377368e-05, "step": 38, "loss": 1.7690261602401733, "percent_done": 7.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1406888961792, "wps": 5539.526477800049, "avg_wps": 2099.75008205116, "eta_in_seconds": 14419.636059936724, "at": "2024-05-26T00:10:38.816769"}
{"lr": 5.9871486780264246e-05, "step": 39, "loss": 1.610843300819397, "percent_done": 7.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137158393859863, "wps": 5524.0498246239495, "avg_wps": 2133.6638130239685, "eta_in_seconds": 14159.726483424505, "at": "2024-05-26T00:10:50.681769"}
{"lr": 5.985248766640204e-05, "step": 40, "loss": 1.6625176668167114, "percent_done": 8.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5544.099411977706, "avg_wps": 2166.989231035533, "eta_in_seconds": 13911.725802898407, "at": "2024-05-26T00:11:02.503842"}
{"lr": 5.983218271326983e-05, "step": 41, "loss": 1.5587224960327148, "percent_done": 8.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1389799118042, "wps": 5535.130493970461, "avg_wps": 2199.6351751730604, "eta_in_seconds": 13675.460521599141, "at": "2024-05-26T00:11:14.345102"}
{"lr": 5.981057280907208e-05, "step": 42, "loss": 1.6394068002700806, "percent_done": 8.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5542.058876517238, "avg_wps": 2231.6811301296284, "eta_in_seconds": 13449.72074852671, "at": "2024-05-26T00:11:26.171525"}
{"lr": 5.978765889909597e-05, "step": 43, "loss": 1.8504140377044678, "percent_done": 8.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5537.244232765539, "avg_wps": 2263.099743394272, "eta_in_seconds": 13234.039766660957, "at": "2024-05-26T00:11:38.008052"}
{"lr": 5.976344198567018e-05, "step": 44, "loss": 1.6190497875213623, "percent_done": 8.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1387357711792, "wps": 5530.863783795987, "avg_wps": 2293.901811341495, "eta_in_seconds": 13027.765989043497, "at": "2024-05-26T00:11:49.858501"}
{"lr": 5.9737923128120935e-05, "step": 45, "loss": 1.6997615098953247, "percent_done": 9.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137300491333008, "wps": 5523.228225775809, "avg_wps": 2324.0986163203415, "eta_in_seconds": 12830.298934221268, "at": "2024-05-26T00:12:01.725220"}
{"lr": 5.971110344272575e-05, "step": 46, "loss": 1.7731759548187256, "percent_done": 9.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1370849609375, "wps": 5546.081359300658, "avg_wps": 2353.8257788054875, "eta_in_seconds": 12640.418958746868, "at": "2024-05-26T00:12:13.543067"}
{"lr": 5.968298410266454e-05, "step": 47, "loss": 1.6038544178009033, "percent_done": 9.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1380033493042, "wps": 5530.973292789456, "avg_wps": 2382.9499028627824, "eta_in_seconds": 12458.427247813408, "at": "2024-05-26T00:12:25.393198"}
{"lr": 5.9653566337968336e-05, "step": 48, "loss": 1.5806320905685425, "percent_done": 9.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1372709274292, "wps": 5538.426185704312, "avg_wps": 2411.5744073380824, "eta_in_seconds": 12283.374674181143, "at": "2024-05-26T00:12:37.227423"}
{"lr": 5.9622851435465466e-05, "step": 49, "loss": 1.4341806173324585, "percent_done": 9.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137271404266357, "wps": 5547.794415919143, "avg_wps": 2439.7212897046975, "eta_in_seconds": 12114.800212928227, "at": "2024-05-26T00:12:49.041635"}
{"lr": 5.9590840738725265e-05, "step": 50, "loss": 1.4500197172164917, "percent_done": 10.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139648914337158, "wps": 5539.750540924846, "avg_wps": 2467.3355744887713, "eta_in_seconds": 11952.650585889816, "at": "2024-05-26T00:13:00.872857"}
{"lr": 5.955753564799931e-05, "step": 51, "loss": 1.5096863508224487, "percent_done": 10.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5539.978083463767, "avg_wps": 2494.463145163946, "eta_in_seconds": 11796.391563069586, "at": "2024-05-26T00:13:12.703674"}
{"lr": 5.9522937620160167e-05, "step": 52, "loss": 1.7216428518295288, "percent_done": 10.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5543.565295984434, "avg_wps": 2521.1301803976307, "eta_in_seconds": 11645.621566185586, "at": "2024-05-26T00:13:24.526852"}
{"lr": 5.9487048168637646e-05, "step": 53, "loss": 1.7031399011611938, "percent_done": 10.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5537.898963882401, "avg_wps": 2547.312209734005, "eta_in_seconds": 11500.196908748374, "at": "2024-05-26T00:13:36.362193"}
{"lr": 5.944986886335264e-05, "step": 54, "loss": 1.7923967838287354, "percent_done": 10.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13988208770752, "wps": 5540.3491362407385, "avg_wps": 2573.05348120662, "eta_in_seconds": 11359.676825020048, "at": "2024-05-26T00:13:48.192136"}
{"lr": 5.941140133064838e-05, "step": 55, "loss": 1.6145018339157104, "percent_done": 11.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13819980621338, "wps": 5532.177287264699, "avg_wps": 2598.3230307292242, "eta_in_seconds": 11223.97779456052, "at": "2024-05-26T00:14:00.039674"}
{"lr": 5.937164725321938e-05, "step": 56, "loss": 1.493621587753296, "percent_done": 11.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13995599746704, "wps": 5519.523524306861, "avg_wps": 2623.1137353743584, "eta_in_seconds": 11092.917401024273, "at": "2024-05-26T00:14:11.914303"}
{"lr": 5.933060837003778e-05, "step": 57, "loss": 1.4488284587860107, "percent_done": 11.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792896270752, "wps": 5551.856517024938, "avg_wps": 2647.6169631340003, "eta_in_seconds": 10965.501582840032, "at": "2024-05-26T00:14:23.719679"}
{"lr": 5.928828647627726e-05, "step": 58, "loss": 1.8310798406600952, "percent_done": 11.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5531.945041172631, "avg_wps": 2671.6337960073306, "eta_in_seconds": 10842.39615597396, "at": "2024-05-26T00:14:35.567699"}
{"lr": 5.924468342323457e-05, "step": 59, "loss": 1.8137357234954834, "percent_done": 11.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13896083831787, "wps": 5527.583975032376, "avg_wps": 2695.2364115035157, "eta_in_seconds": 10723.13206984229, "at": "2024-05-26T00:14:47.424891"}
{"lr": 5.919980111824851e-05, "step": 60, "loss": 1.512571930885315, "percent_done": 12.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5537.72079118129, "avg_wps": 2718.492891536368, "eta_in_seconds": 10607.289093812307, "at": "2024-05-26T00:14:59.260447"}
{"lr": 5.915364152461648e-05, "step": 61, "loss": 1.5166411399841309, "percent_done": 12.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5539.386712673805, "avg_wps": 2741.3785934414523, "eta_in_seconds": 10494.830618737173, "at": "2024-05-26T00:15:11.092581"}
{"lr": 5.9106206661508645e-05, "step": 62, "loss": 1.6018924713134766, "percent_done": 12.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13873529434204, "wps": 5532.074856095626, "avg_wps": 2763.8665452701775, "eta_in_seconds": 10385.72866302921, "at": "2024-05-26T00:15:22.940259"}
{"lr": 5.90574986038796e-05, "step": 63, "loss": 1.4618632793426514, "percent_done": 12.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5529.793850942314, "avg_wps": 2785.985783546574, "eta_in_seconds": 10279.748076654616, "at": "2024-05-26T00:15:34.792730"}
{"lr": 5.9007519482377565e-05, "step": 64, "loss": 1.7917994260787964, "percent_done": 12.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1380033493042, "wps": 5531.270235335729, "avg_wps": 2807.7599972922703, "eta_in_seconds": 10176.687475979328, "at": "2024-05-26T00:15:46.642121"}
{"lr": 5.8956271483251227e-05, "step": 65, "loss": 1.5388588905334473, "percent_done": 13.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13727045059204, "wps": 5541.480467211162, "avg_wps": 2829.2325455082782, "eta_in_seconds": 10076.287311645654, "at": "2024-05-26T00:15:58.469684"}
{"lr": 5.8903756848254094e-05, "step": 66, "loss": 1.5354622602462769, "percent_done": 13.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817262649536, "wps": 5534.298576151526, "avg_wps": 2850.3415745242264, "eta_in_seconds": 9978.672119234547, "at": "2024-05-26T00:16:10.312548"}
{"lr": 5.884997787454641e-05, "step": 67, "loss": 1.551658272743225, "percent_done": 13.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1372709274292, "wps": 5545.073876931426, "avg_wps": 2871.1669062811698, "eta_in_seconds": 9883.468612681574, "at": "2024-05-26T00:16:22.132505"}
{"lr": 5.879493691459472e-05, "step": 68, "loss": 1.5081156492233276, "percent_done": 13.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1384916305542, "wps": 5543.528178915346, "avg_wps": 2891.6666401015896, "eta_in_seconds": 9790.7385337493, "at": "2024-05-26T00:16:33.955697"}
{"lr": 5.873863637606892e-05, "step": 69, "loss": 1.6811738014221191, "percent_done": 13.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13744831085205, "wps": 5540.486158061833, "avg_wps": 2911.8420897351943, "eta_in_seconds": 9700.394159275553, "at": "2024-05-26T00:16:45.785296"}
{"lr": 5.868107872173695e-05, "step": 70, "loss": 2.0245096683502197, "percent_done": 14.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139193534851074, "wps": 5534.936784672989, "avg_wps": 2931.690300093053, "eta_in_seconds": 9612.36594435147, "at": "2024-05-26T00:16:57.627088"}
{"lr": 5.862226646935706e-05, "step": 71, "loss": 1.291055679321289, "percent_done": 14.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5535.811816409992, "avg_wps": 2951.2438980309184, "eta_in_seconds": 9526.472555778397, "at": "2024-05-26T00:17:09.466927"}
{"lr": 5.856220219156771e-05, "step": 72, "loss": 1.696504831314087, "percent_done": 14.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1387357711792, "wps": 5533.233106007674, "avg_wps": 2970.4957223928614, "eta_in_seconds": 9442.669042931664, "at": "2024-05-26T00:17:21.312194"}
{"lr": 5.8500888515774985e-05, "step": 73, "loss": 1.2231526374816895, "percent_done": 14.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1399564743042, "wps": 5514.1967865476645, "avg_wps": 2989.3862016528365, "eta_in_seconds": 9361.076191670274, "at": "2024-05-26T00:17:33.198309"}
{"lr": 5.84383281240377e-05, "step": 74, "loss": 1.5708428621292114, "percent_done": 14.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5538.367712134215, "avg_wps": 3008.094949394964, "eta_in_seconds": 9281.068739407772, "at": "2024-05-26T00:17:45.032506"}
{"lr": 5.8374523752950034e-05, "step": 75, "loss": 1.6024234294891357, "percent_done": 15.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5545.841902233415, "avg_wps": 3026.5607851097043, "eta_in_seconds": 9202.788900534313, "at": "2024-05-26T00:17:56.850793"}
{"lr": 5.830947819352191e-05, "step": 76, "loss": 1.9813722372055054, "percent_done": 15.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1372709274292, "wps": 5544.453011562738, "avg_wps": 3044.7543202052316, "eta_in_seconds": 9126.274594833976, "at": "2024-05-26T00:18:08.672042"}
{"lr": 5.8243194291056786e-05, "step": 77, "loss": 1.57261323928833, "percent_done": 15.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5534.243420984151, "avg_wps": 3062.646287207252, "eta_in_seconds": 9051.560448163516, "at": "2024-05-26T00:18:20.515204"}
{"lr": 5.817567494502731e-05, "step": 78, "loss": 1.5319303274154663, "percent_done": 15.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5548.882527821081, "avg_wps": 3080.3408991020083, "eta_in_seconds": 8978.289386107372, "at": "2024-05-26T00:18:32.342630"}
{"lr": 5.810692310894839e-05, "step": 79, "loss": 1.504271149635315, "percent_done": 15.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1404447555542, "wps": 5547.128611462899, "avg_wps": 3097.778503134207, "eta_in_seconds": 8906.594184214555, "at": "2024-05-26T00:18:44.158288"}
{"lr": 5.8036941790248074e-05, "step": 80, "loss": 1.537473201751709, "percent_done": 16.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139437198638916, "wps": 5547.05663309866, "avg_wps": 3114.971022758016, "eta_in_seconds": 8836.396807193756, "at": "2024-05-26T00:18:55.974075"}
{"lr": 5.796573405013595e-05, "step": 81, "loss": 1.5852731466293335, "percent_done": 16.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13890552520752, "wps": 5529.699072362179, "avg_wps": 3131.8553361215204, "eta_in_seconds": 8767.83281887019, "at": "2024-05-26T00:19:07.826949"}
{"lr": 5.7893303003469235e-05, "step": 82, "loss": 1.5945942401885986, "percent_done": 16.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139241218566895, "wps": 5530.273912078115, "avg_wps": 3148.507443738734, "eta_in_seconds": 8700.645778836273, "at": "2024-05-26T00:19:19.678572"}
{"lr": 5.7819651818616575e-05, "step": 83, "loss": 1.7726037502288818, "percent_done": 16.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5544.20799199795, "avg_wps": 3164.984762706722, "eta_in_seconds": 8634.642517718925, "at": "2024-05-26T00:19:31.500393"}
{"lr": 5.774478371731938e-05, "step": 84, "loss": 1.5255744457244873, "percent_done": 16.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13762378692627, "wps": 5534.432735935683, "avg_wps": 3181.1985906088116, "eta_in_seconds": 8570.032716751099, "at": "2024-05-26T00:19:43.343105"}
{"lr": 5.766870197455095e-05, "step": 85, "loss": 1.5827147960662842, "percent_done": 17.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13866138458252, "wps": 5523.826585731917, "avg_wps": 3197.150307066719, "eta_in_seconds": 8506.775530660854, "at": "2024-05-26T00:19:55.208549"}
{"lr": 5.759140991837317e-05, "step": 86, "loss": 1.3610950708389282, "percent_done": 17.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13801145553589, "wps": 5541.5615735421, "avg_wps": 3212.9557960341403, "eta_in_seconds": 8444.530744397363, "at": "2024-05-26T00:20:07.036006"}
{"lr": 5.751291092979098e-05, "step": 87, "loss": 1.4847681522369385, "percent_done": 17.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5531.706357934675, "avg_wps": 3228.511079960922, "eta_in_seconds": 8383.5450242059, "at": "2024-05-26T00:20:18.884533"}
{"lr": 5.743320844260443e-05, "step": 88, "loss": 1.0767104625701904, "percent_done": 17.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1387357711792, "wps": 5531.295612714277, "avg_wps": 3243.8574449359435, "eta_in_seconds": 8323.680204304783, "at": "2024-05-26T00:20:30.733993"}
{"lr": 5.735230594325853e-05, "step": 89, "loss": 1.5505489110946655, "percent_done": 17.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1372709274292, "wps": 5531.027047266254, "avg_wps": 3258.999571955979, "eta_in_seconds": 8264.89706589131, "at": "2024-05-26T00:20:42.583973"}
{"lr": 5.727020697069067e-05, "step": 90, "loss": 1.7600947618484497, "percent_done": 18.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.138655185699463, "wps": 5529.237685026854, "avg_wps": 3273.935553483542, "eta_in_seconds": 8207.174381123648, "at": "2024-05-26T00:20:54.437824"}
{"lr": 5.718691511617588e-05, "step": 91, "loss": 1.317226529121399, "percent_done": 18.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13856601715088, "wps": 5502.959403593815, "avg_wps": 3288.573649336026, "eta_in_seconds": 8150.71421782263, "at": "2024-05-26T00:21:06.348233"}
{"lr": 5.7102434023169716e-05, "step": 92, "loss": 1.2027145624160767, "percent_done": 18.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13890552520752, "wps": 5531.824695043968, "avg_wps": 3303.1331918472656, "eta_in_seconds": 8094.946963082189, "at": "2024-05-26T00:21:18.196493"}
{"lr": 5.701676738714885e-05, "step": 93, "loss": 1.7757294178009033, "percent_done": 18.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13897943496704, "wps": 5513.260013664116, "avg_wps": 3317.4329246403618, "eta_in_seconds": 8040.29881113319, "at": "2024-05-26T00:21:30.084656"}
{"lr": 5.6929918955449466e-05, "step": 94, "loss": 1.6398133039474487, "percent_done": 18.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13995599746704, "wps": 5503.530239684291, "avg_wps": 3331.5109429036474, "eta_in_seconds": 7986.651239034977, "at": "2024-05-26T00:21:41.993855"}
{"lr": 5.6841892527103325e-05, "step": 95, "loss": 1.6421366930007935, "percent_done": 19.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1372709274292, "wps": 5539.134773708763, "avg_wps": 3345.546401059732, "eta_in_seconds": 7933.556082675331, "at": "2024-05-26T00:21:53.826550"}
{"lr": 5.675269195267157e-05, "step": 96, "loss": 1.535171389579773, "percent_done": 19.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13759183883667, "wps": 5519.26064443039, "avg_wps": 3359.3280993101475, "eta_in_seconds": 7881.499876548847, "at": "2024-05-26T00:22:05.701819"}
{"lr": 5.6662321134076275e-05, "step": 97, "loss": 1.289878249168396, "percent_done": 19.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13732147216797, "wps": 5544.5440467133, "avg_wps": 3373.033047095898, "eta_in_seconds": 7830.047210103458, "at": "2024-05-26T00:22:17.522970"}
{"lr": 5.657078402442983e-05, "step": 98, "loss": 1.6153517961502075, "percent_done": 19.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137089729309082, "wps": 5523.603253886858, "avg_wps": 3386.4871425174815, "eta_in_seconds": 7779.587192058563, "at": "2024-05-26T00:22:29.388874"}
{"lr": 5.6478084627861946e-05, "step": 99, "loss": 1.7160063982009888, "percent_done": 19.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5532.454204423485, "avg_wps": 3399.8077610196756, "eta_in_seconds": 7729.829992539955, "at": "2024-05-26T00:22:41.235797"}
{"lr": 5.638422699934453e-05, "step": 100, "loss": 1.4796698093414307, "percent_done": 20.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139036655426025, "wps": 5539.2885910522355, "avg_wps": 3412.9900073928015, "eta_in_seconds": 7680.772561073303, "at": "2024-05-26T00:22:53.068126"}
{"lr": 5.62892152445143e-05, "step": 101, "loss": 1.5540027618408203, "percent_done": 20.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1372709274292, "wps": 5597.059642797446, "avg_wps": 3426.227366541052, "eta_in_seconds": 7631.969861474368, "at": "2024-05-26T00:23:19.492117"}
{"lr": 5.619305351949323e-05, "step": 102, "loss": 1.1712055206298828, "percent_done": 20.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137778759002686, "wps": 5565.942533352121, "avg_wps": 3439.18940091804, "eta_in_seconds": 7584.149914231954, "at": "2024-05-26T00:23:31.267769"}
{"lr": 5.609574603070667e-05, "step": 103, "loss": 1.5182369947433472, "percent_done": 20.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.14134693145752, "wps": 5553.062441781844, "avg_wps": 3451.947126415252, "eta_in_seconds": 7537.135143497616, "at": "2024-05-26T00:23:43.070636"}
{"lr": 5.599729703469942e-05, "step": 104, "loss": 1.539081335067749, "percent_done": 20.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5539.45056615357, "avg_wps": 3464.5007130604386, "eta_in_seconds": 7490.907968979616, "at": "2024-05-26T00:23:54.902547"}
{"lr": 5.589771083794951e-05, "step": 105, "loss": 1.3853428363800049, "percent_done": 21.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13897943496704, "wps": 5532.474693163494, "avg_wps": 3476.8780093736523, "eta_in_seconds": 7445.3920816921045, "at": "2024-05-26T00:24:06.749359"}
{"lr": 5.579699179667977e-05, "step": 106, "loss": 1.746046781539917, "percent_done": 21.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1397123336792, "wps": 5529.919893688251, "avg_wps": 3489.098434826783, "eta_in_seconds": 7400.531822852368, "at": "2024-05-26T00:24:18.601620"}
{"lr": 5.569514431666738e-05, "step": 107, "loss": 1.4366753101348877, "percent_done": 21.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 3110.3677494049234, "avg_wps": 3485.1324206697495, "eta_in_seconds": 7390.149036302745, "at": "2024-05-26T00:24:39.672844"}
{"lr": 5.559217285305104e-05, "step": 108, "loss": 1.4705623388290405, "percent_done": 21.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1406888961792, "wps": 5568.263503384901, "avg_wps": 3497.246748995588, "eta_in_seconds": 7345.810531492587, "at": "2024-05-26T00:24:51.443525"}
{"lr": 5.548808191013616e-05, "step": 109, "loss": 1.511877417564392, "percent_done": 21.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5544.419461278335, "avg_wps": 3509.133737064294, "eta_in_seconds": 7302.251187906352, "at": "2024-05-26T00:25:03.264777"}
{"lr": 5.538287604119777e-05, "step": 110, "loss": 1.631191611289978, "percent_done": 22.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5539.096934612043, "avg_wps": 3520.863946254514, "eta_in_seconds": 7259.309189493007, "at": "2024-05-26T00:25:15.097574"}
{"lr": 5.5276559848281426e-05, "step": 111, "loss": 1.1168304681777954, "percent_done": 22.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139692783355713, "wps": 5535.312512817423, "avg_wps": 3532.4454920385933, "eta_in_seconds": 7216.956088199272, "at": "2024-05-26T00:25:26.938291"}
{"lr": 5.516913798200181e-05, "step": 112, "loss": 1.3504208326339722, "percent_done": 22.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137049674987793, "wps": 5524.111104691364, "avg_wps": 3543.853551182154, "eta_in_seconds": 7175.231039532594, "at": "2024-05-26T00:25:38.803137"}
{"lr": 5.506061514133933e-05, "step": 113, "loss": 1.6625151634216309, "percent_done": 22.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13819980621338, "wps": 5537.484732799822, "avg_wps": 3555.1805667044105, "eta_in_seconds": 7133.936384983822, "at": "2024-05-26T00:25:50.639233"}
{"lr": 5.495099607343464e-05, "step": 114, "loss": 1.089699625968933, "percent_done": 22.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5526.334425393153, "avg_wps": 3566.3389461793854, "eta_in_seconds": 7093.239420526906, "at": "2024-05-26T00:26:02.499237"}
{"lr": 5.4840285573380864e-05, "step": 115, "loss": 1.5184028148651123, "percent_done": 23.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1370267868042, "wps": 5530.564993204644, "avg_wps": 3577.387108918421, "eta_in_seconds": 7053.013619101566, "at": "2024-05-26T00:26:14.350294"}
{"lr": 5.4728488484013935e-05, "step": 116, "loss": 1.607438325881958, "percent_done": 23.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1372709274292, "wps": 5537.610457041481, "avg_wps": 3588.337217255435, "eta_in_seconds": 7013.227151278791, "at": "2024-05-26T00:26:26.186115"}
{"lr": 5.46156096957007e-05, "step": 117, "loss": 1.5858045816421509, "percent_done": 23.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1404447555542, "wps": 5532.53783061558, "avg_wps": 3599.147335569262, "eta_in_seconds": 6973.954011813188, "at": "2024-05-26T00:26:38.032820"}
{"lr": 5.450165414612506e-05, "step": 118, "loss": 1.2271007299423218, "percent_done": 23.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5536.211859357799, "avg_wps": 3609.851152518804, "eta_in_seconds": 6935.120297836044, "at": "2024-05-26T00:26:49.871724"}
{"lr": 5.43866268200719e-05, "step": 119, "loss": 1.3237642049789429, "percent_done": 23.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13933229446411, "wps": 5533.040977363736, "avg_wps": 3620.42592349851, "eta_in_seconds": 6896.762018506266, "at": "2024-05-26T00:27:01.717493"}
{"lr": 5.42705327492091e-05, "step": 120, "loss": 1.3115874528884888, "percent_done": 24.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5538.231129826692, "avg_wps": 3630.903646067428, "eta_in_seconds": 6858.810485641161, "at": "2024-05-26T00:27:13.552094"}
{"lr": 5.415337701186742e-05, "step": 121, "loss": 1.2221430540084839, "percent_done": 24.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137965202331543, "wps": 5531.733075183824, "avg_wps": 3641.244261196932, "eta_in_seconds": 6821.334197402985, "at": "2024-05-26T00:27:25.400449"}
{"lr": 5.403516473281833e-05, "step": 122, "loss": 1.6666512489318848, "percent_done": 24.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5535.974926160593, "avg_wps": 3651.4881163845907, "eta_in_seconds": 6784.2499305537485, "at": "2024-05-26T00:27:37.239789"}
{"lr": 5.391590108304989e-05, "step": 123, "loss": 1.5952054262161255, "percent_done": 24.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13706350326538, "wps": 5528.6313692000795, "avg_wps": 3661.595646751923, "eta_in_seconds": 6747.624364781186, "at": "2024-05-26T00:27:49.094976"}
{"lr": 5.3795591279540496e-05, "step": 124, "loss": 1.6903510093688965, "percent_done": 24.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5532.742396950077, "avg_wps": 3671.6095225837266, "eta_in_seconds": 6711.371633729626, "at": "2024-05-26T00:28:00.941314"}
{"lr": 5.3674240585030686e-05, "step": 125, "loss": 1.670830488204956, "percent_done": 25.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1413631439209, "wps": 5535.899446291045, "avg_wps": 3681.5279621076993, "eta_in_seconds": 6675.489159107208, "at": "2024-05-26T00:28:12.780885"}
{"lr": 5.3551854307792975e-05, "step": 126, "loss": 1.5355591773986816, "percent_done": 25.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13866138458252, "wps": 5526.040789881656, "avg_wps": 3691.3065729857167, "eta_in_seconds": 6640.051026749232, "at": "2024-05-26T00:28:24.641450"}
{"lr": 5.3428437801399596e-05, "step": 127, "loss": 1.3291274309158325, "percent_done": 25.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137056350708008, "wps": 5527.882332433383, "avg_wps": 3700.9885506962646, "eta_in_seconds": 6604.972608035005, "at": "2024-05-26T00:28:36.498128"}
{"lr": 5.3303996464488364e-05, "step": 128, "loss": 1.2499892711639404, "percent_done": 25.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5533.640351464532, "avg_wps": 3710.589229455752, "eta_in_seconds": 6570.221194647253, "at": "2024-05-26T00:28:48.342491"}
{"lr": 5.317853574052649e-05, "step": 129, "loss": 1.5997017621994019, "percent_done": 25.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5532.302993307046, "avg_wps": 3720.085156146638, "eta_in_seconds": 6535.833181083665, "at": "2024-05-26T00:29:00.189835"}
{"lr": 5.3052061117572476e-05, "step": 130, "loss": 1.2660155296325684, "percent_done": 26.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13866090774536, "wps": 5522.46223457303, "avg_wps": 3729.448136686874, "eta_in_seconds": 6501.8520465447355, "at": "2024-05-26T00:29:12.058235"}
{"lr": 5.292457812803603e-05, "step": 131, "loss": 1.473204255104065, "percent_done": 26.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.138676643371582, "wps": 5522.268745279879, "avg_wps": 3738.713665425786, "eta_in_seconds": 6468.209701008469, "at": "2024-05-26T00:29:23.926912"}
{"lr": 5.2796092348436136e-05, "step": 132, "loss": 1.4274117946624756, "percent_done": 26.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13702630996704, "wps": 5536.678649211735, "avg_wps": 3747.934068843009, "eta_in_seconds": 6434.811167167894, "at": "2024-05-26T00:29:35.764812"}
{"lr": 5.266660939915699e-05, "step": 133, "loss": 1.4024438858032227, "percent_done": 26.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5533.322659221424, "avg_wps": 3757.04875984181, "eta_in_seconds": 6401.756681223561, "at": "2024-05-26T00:29:47.609838"}
{"lr": 5.25361349442023e-05, "step": 134, "loss": 1.6963635683059692, "percent_done": 26.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13713550567627, "wps": 5533.485845105383, "avg_wps": 3766.0714237744305, "eta_in_seconds": 6369.017817500812, "at": "2024-05-26T00:29:59.454640"}
{"lr": 5.240467469094738e-05, "step": 135, "loss": 1.2273313999176025, "percent_done": 27.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1382474899292, "wps": 5538.345394303255, "avg_wps": 3775.019635857367, "eta_in_seconds": 6336.560417537336, "at": "2024-05-26T00:30:11.288854"}
{"lr": 5.227223438988959e-05, "step": 136, "loss": 1.3269773721694946, "percent_done": 27.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13995599746704, "wps": 5519.251778766513, "avg_wps": 3783.812183740026, "eta_in_seconds": 6304.515880178003, "at": "2024-05-26T00:30:23.164105"}
{"lr": 5.2138819834396735e-05, "step": 137, "loss": 1.6708487272262573, "percent_done": 27.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137944221496582, "wps": 5534.977353276828, "avg_wps": 3792.5705754854494, "eta_in_seconds": 6272.676414717724, "at": "2024-05-26T00:30:35.005563"}
{"lr": 5.200443686045369e-05, "step": 138, "loss": 1.2962806224822998, "percent_done": 27.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13866138458252, "wps": 5535.8934258287845, "avg_wps": 3801.2449240334345, "eta_in_seconds": 6241.121652015741, "at": "2024-05-26T00:30:46.845093"}
{"lr": 5.1869091346407056e-05, "step": 139, "loss": 1.3293571472167969, "percent_done": 27.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1399564743042, "wps": 5518.765651525683, "avg_wps": 3809.774835881176, "eta_in_seconds": 6209.945999217548, "at": "2024-05-26T00:30:58.721325"}
{"lr": 5.1732789212708097e-05, "step": 140, "loss": 1.4928131103515625, "percent_done": 28.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5544.100977467862, "avg_wps": 3818.306670118135, "eta_in_seconds": 6178.9065254075185, "at": "2024-05-26T00:31:10.543196"}
{"lr": 5.159553642165368e-05, "step": 141, "loss": 1.5970425605773926, "percent_done": 28.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5524.360790615043, "avg_wps": 3826.6880343733033, "eta_in_seconds": 6148.247201931392, "at": "2024-05-26T00:31:22.407369"}
{"lr": 5.145733897712554e-05, "step": 142, "loss": 1.7108588218688965, "percent_done": 28.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13866138458252, "wps": 5533.329008253335, "avg_wps": 3835.017837137935, "eta_in_seconds": 6117.804139734993, "at": "2024-05-26T00:31:34.252317"}
{"lr": 5.131820292432759e-05, "step": 143, "loss": 1.868727445602417, "percent_done": 28.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792896270752, "wps": 5528.080773501194, "avg_wps": 3843.2490002472596, "eta_in_seconds": 6087.649277602042, "at": "2024-05-26T00:31:46.108465"}
{"lr": 5.117813434952152e-05, "step": 144, "loss": 1.8097214698791504, "percent_done": 28.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5537.813502032706, "avg_wps": 3851.433264880849, "eta_in_seconds": 6057.697068969408, "at": "2024-05-26T00:31:57.943884"}
{"lr": 5.103713937976054e-05, "step": 145, "loss": 1.6488709449768066, "percent_done": 29.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5535.326557634993, "avg_wps": 3859.5305195212936, "eta_in_seconds": 6028.007780305271, "at": "2024-05-26T00:32:09.784516"}
{"lr": 5.0895224182621414e-05, "step": 146, "loss": 1.6172908544540405, "percent_done": 29.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5533.640685662114, "avg_wps": 3867.54463427126, "eta_in_seconds": 5998.5717538774825, "at": "2024-05-26T00:32:21.628812"}
{"lr": 5.075239496593458e-05, "step": 147, "loss": 1.806726336479187, "percent_done": 29.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13849115371704, "wps": 5530.702533019881, "avg_wps": 3875.4725772056986, "eta_in_seconds": 5969.390194132215, "at": "2024-05-26T00:32:33.479389"}
{"lr": 5.0608657977512685e-05, "step": 148, "loss": 1.3950109481811523, "percent_done": 29.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5533.683463286032, "avg_wps": 3883.3352212573154, "eta_in_seconds": 5940.427669937546, "at": "2024-05-26T00:32:45.323748"}
{"lr": 5.0464019504877256e-05, "step": 149, "loss": 1.685523509979248, "percent_done": 29.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13904047012329, "wps": 5525.507592916948, "avg_wps": 3891.096482327046, "eta_in_seconds": 5911.736217407572, "at": "2024-05-26T00:32:57.185460"}
{"lr": 5.031848587498364e-05, "step": 150, "loss": 1.3426657915115356, "percent_done": 30.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5540.3617549189175, "avg_wps": 3898.8338968788635, "eta_in_seconds": 5883.194977442424, "at": "2024-05-26T00:33:09.015393"}
{"lr": 5.017206345394427e-05, "step": 151, "loss": 1.1932377815246582, "percent_done": 30.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5530.696301294541, "avg_wps": 3906.4671727362975, "eta_in_seconds": 5854.922872417021, "at": "2024-05-26T00:33:20.866100"}
{"lr": 5.00247586467502e-05, "step": 152, "loss": 1.5188419818878174, "percent_done": 30.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5534.958963588762, "avg_wps": 3914.0434039079178, "eta_in_seconds": 5826.84596119429, "at": "2024-05-26T00:33:32.707611"}
{"lr": 4.987657789699088e-05, "step": 153, "loss": 1.699030876159668, "percent_done": 30.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13727045059204, "wps": 5534.990616218613, "avg_wps": 3921.5495715785733, "eta_in_seconds": 5798.981138684392, "at": "2024-05-26T00:33:44.549171"}
{"lr": 4.9727527686572356e-05, "step": 154, "loss": 1.4579997062683105, "percent_done": 30.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1389799118042, "wps": 5533.561593359805, "avg_wps": 3928.9818647318493, "eta_in_seconds": 5771.331296676165, "at": "2024-05-26T00:33:56.393598"}
{"lr": 4.957761453543368e-05, "step": 155, "loss": 1.5616415739059448, "percent_done": 31.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13918399810791, "wps": 5546.354522258468, "avg_wps": 3936.387607590215, "eta_in_seconds": 5743.824606195573, "at": "2024-05-26T00:34:08.210887"}
{"lr": 4.942684500126173e-05, "step": 156, "loss": 1.636575698852539, "percent_done": 31.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5536.919434711029, "avg_wps": 3943.6952090659074, "eta_in_seconds": 5716.563477870745, "at": "2024-05-26T00:34:20.048148"}
{"lr": 4.927522567920438e-05, "step": 157, "loss": 1.8378536701202393, "percent_done": 31.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792896270752, "wps": 5541.3607112397085, "avg_wps": 3950.9507768392773, "eta_in_seconds": 5689.478120500115, "at": "2024-05-26T00:34:31.876008"}
{"lr": 4.9122763201581924e-05, "step": 158, "loss": 1.624532699584961, "percent_done": 31.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963747024536, "wps": 5538.455646138669, "avg_wps": 3958.1313564214447, "eta_in_seconds": 5662.599338356453, "at": "2024-05-26T00:34:43.710158"}
{"lr": 4.8969464237597066e-05, "step": 159, "loss": 1.4007322788238525, "percent_done": 31.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13916015625, "wps": 5547.36918723339, "avg_wps": 3965.2759596814326, "eta_in_seconds": 5635.869035908261, "at": "2024-05-26T00:34:55.525135"}
{"lr": 4.8815335493043095e-05, "step": 160, "loss": 1.5568217039108276, "percent_done": 32.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.14060926437378, "wps": 5542.0574239184625, "avg_wps": 3972.3395722173827, "eta_in_seconds": 5609.349249958991, "at": "2024-05-26T00:35:07.351538"}
{"lr": 4.866038371001062e-05, "step": 161, "loss": 1.3363252878189087, "percent_done": 32.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5545.6341284409145, "avg_wps": 3979.351626452097, "eta_in_seconds": 5582.9959464547055, "at": "2024-05-26T00:35:19.170367"}
{"lr": 4.850461566659259e-05, "step": 162, "loss": 1.338950276374817, "percent_done": 32.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13995599746704, "wps": 5506.948587611595, "avg_wps": 3986.177203137962, "eta_in_seconds": 5556.995304313707, "at": "2024-05-26T00:35:31.072109"}
{"lr": 4.834803817658786e-05, "step": 163, "loss": 1.2776546478271484, "percent_done": 32.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1387357711792, "wps": 5542.646794583385, "avg_wps": 3993.056456146613, "eta_in_seconds": 5531.009201235566, "at": "2024-05-26T00:35:42.897260"}
{"lr": 4.819065808920307e-05, "step": 164, "loss": 1.4070043563842773, "percent_done": 32.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1372709274292, "wps": 5540.459467868356, "avg_wps": 3999.8682185431176, "eta_in_seconds": 5505.205370996056, "at": "2024-05-26T00:35:54.726921"}
{"lr": 4.803248228875308e-05, "step": 165, "loss": 1.471192717552185, "percent_done": 33.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.141496658325195, "wps": 5542.936944196005, "avg_wps": 4006.6281208824953, "eta_in_seconds": 5479.5602031476565, "at": "2024-05-26T00:36:06.551378"}
{"lr": 4.7873517694359834e-05, "step": 166, "loss": 1.555643081665039, "percent_done": 33.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139355182647705, "wps": 5540.876489640953, "avg_wps": 4013.322544294357, "eta_in_seconds": 5454.090409732727, "at": "2024-05-26T00:36:18.380298"}
{"lr": 4.7713771259649654e-05, "step": 167, "loss": 1.4674922227859497, "percent_done": 33.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137837886810303, "wps": 5530.920318385281, "avg_wps": 4019.927364713092, "eta_in_seconds": 5428.826448847434, "at": "2024-05-26T00:36:30.230598"}
{"lr": 4.755324997244911e-05, "step": 168, "loss": 1.5082496404647827, "percent_done": 33.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.140522956848145, "wps": 5549.663373325819, "avg_wps": 4026.53387208514, "eta_in_seconds": 5403.643106256212, "at": "2024-05-26T00:36:42.040702"}
{"lr": 4.739196085447931e-05, "step": 169, "loss": 1.4904391765594482, "percent_done": 33.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1380033493042, "wps": 5523.3548572738, "avg_wps": 4033.000956615353, "eta_in_seconds": 5378.728205957356, "at": "2024-05-26T00:36:53.907068"}
{"lr": 4.722991096104879e-05, "step": 170, "loss": 1.4823875427246094, "percent_done": 34.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5537.428733245111, "avg_wps": 4039.4565655614915, "eta_in_seconds": 5353.908291620367, "at": "2024-05-26T00:37:05.743274"}
{"lr": 4.706710738074485e-05, "step": 171, "loss": 1.6395151615142822, "percent_done": 34.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13873529434204, "wps": 5531.952166362009, "avg_wps": 4045.839894515075, "eta_in_seconds": 5329.262788977539, "at": "2024-05-26T00:37:17.591244"}
{"lr": 4.6903557235123503e-05, "step": 172, "loss": 1.6742452383041382, "percent_done": 34.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13702630996704, "wps": 5530.9124168279295, "avg_wps": 4052.1656095073636, "eta_in_seconds": 5304.770355280055, "at": "2024-05-26T00:37:29.441588"}
{"lr": 4.673926767839795e-05, "step": 173, "loss": 1.2659401893615723, "percent_done": 34.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1384916305542, "wps": 5533.1006750381885, "avg_wps": 4058.444471670209, "eta_in_seconds": 5280.41523041477, "at": "2024-05-26T00:37:41.287088"}
{"lr": 4.6574245897125624e-05, "step": 174, "loss": 1.0927540063858032, "percent_done": 34.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13739776611328, "wps": 5530.781432328368, "avg_wps": 4064.6631204199402, "eta_in_seconds": 5256.213213013507, "at": "2024-05-26T00:37:53.137554"}
{"lr": 4.640849910989384e-05, "step": 175, "loss": 1.337214469909668, "percent_done": 35.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5552.215929196103, "avg_wps": 4070.8955582678295, "eta_in_seconds": 5232.067414930888, "at": "2024-05-26T00:38:04.942264"}
{"lr": 4.6242034567004e-05, "step": 176, "loss": 1.5160088539123535, "percent_done": 35.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137300491333008, "wps": 5531.864772729148, "avg_wps": 4077.013410479484, "eta_in_seconds": 5208.141809252175, "at": "2024-05-26T00:38:16.813569"}
{"lr": 4.60748595501545e-05, "step": 177, "loss": 1.3292492628097534, "percent_done": 35.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1370267868042, "wps": 5534.255231897187, "avg_wps": 4083.0875934900823, "eta_in_seconds": 5184.343346870552, "at": "2024-05-26T00:38:28.656672"}
{"lr": 4.590698137212215e-05, "step": 178, "loss": 1.4860689640045166, "percent_done": 35.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792896270752, "wps": 5538.810981517906, "avg_wps": 4089.125310203, "eta_in_seconds": 5160.661608326301, "at": "2024-05-26T00:38:40.489929"}
{"lr": 4.5738407376442294e-05, "step": 179, "loss": 1.2346954345703125, "percent_done": 35.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13824987411499, "wps": 5536.797087632224, "avg_wps": 4095.106997732116, "eta_in_seconds": 5137.119985302067, "at": "2024-05-26T00:38:52.327495"}
{"lr": 4.5569144937087604e-05, "step": 180, "loss": 1.4844282865524292, "percent_done": 36.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792896270752, "wps": 5536.149641524129, "avg_wps": 4101.037483197592, "eta_in_seconds": 5113.7108807033965, "at": "2024-05-26T00:39:04.166490"}
{"lr": 4.5399201458145525e-05, "step": 181, "loss": 1.6267871856689453, "percent_done": 36.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1382474899292, "wps": 5543.4886028289675, "avg_wps": 4106.94164027059, "eta_in_seconds": 5090.402014727092, "at": "2024-05-26T00:39:15.989880"}
{"lr": 4.522858437349436e-05, "step": 182, "loss": 1.6486303806304932, "percent_done": 36.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5544.838421617288, "avg_wps": 4112.801742647404, "eta_in_seconds": 5067.214347800056, "at": "2024-05-26T00:39:27.810368"}
{"lr": 4.505730114647811e-05, "step": 183, "loss": 1.3425076007843018, "percent_done": 36.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1370267868042, "wps": 5541.176395465127, "avg_wps": 4118.603225659315, "eta_in_seconds": 5044.164456185096, "at": "2024-05-26T00:39:39.638662"}
{"lr": 4.488535926958002e-05, "step": 184, "loss": 1.781583547592163, "percent_done": 36.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13717746734619, "wps": 5543.097344249737, "avg_wps": 4124.363554443577, "eta_in_seconds": 5021.229512536007, "at": "2024-05-26T00:39:51.462856"}
{"lr": 4.471276626409479e-05, "step": 185, "loss": 1.369985818862915, "percent_done": 37.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5539.250414978418, "avg_wps": 4130.06593202918, "eta_in_seconds": 4998.428678802542, "at": "2024-05-26T00:40:03.295248"}
{"lr": 4.45395296797996e-05, "step": 186, "loss": 1.2858965396881104, "percent_done": 37.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13800287246704, "wps": 5531.820130677768, "avg_wps": 4135.700231455384, "eta_in_seconds": 4975.772625753956, "at": "2024-05-26T00:40:15.143534"}
{"lr": 4.4365657094623857e-05, "step": 187, "loss": 1.61137056350708, "percent_done": 37.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13840961456299, "wps": 5524.408643184817, "avg_wps": 4141.267176238552, "eta_in_seconds": 4953.258779751426, "at": "2024-05-26T00:40:27.007606"}
{"lr": 4.419115611431772e-05, "step": 188, "loss": 1.7724450826644897, "percent_done": 37.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1387357711792, "wps": 5533.056458539925, "avg_wps": 4146.815544191923, "eta_in_seconds": 4930.827470404037, "at": "2024-05-26T00:40:38.853134"}
{"lr": 4.401603437211934e-05, "step": 189, "loss": 1.2718950510025024, "percent_done": 37.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5538.770579909343, "avg_wps": 4152.3368601983875, "eta_in_seconds": 4908.488084231735, "at": "2024-05-26T00:40:50.686456"}
{"lr": 4.384029952842108e-05, "step": 190, "loss": 1.0087783336639404, "percent_done": 38.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1397123336792, "wps": 5545.144349630792, "avg_wps": 4157.833429691444, "eta_in_seconds": 4886.237109673651, "at": "2024-05-26T00:41:02.506141"}
{"lr": 4.366395927043427e-05, "step": 191, "loss": 1.608473300933838, "percent_done": 38.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5542.126032107357, "avg_wps": 4163.277873645289, "eta_in_seconds": 4864.105787459468, "at": "2024-05-26T00:41:14.332385"}
{"lr": 4.348702131185308e-05, "step": 192, "loss": 1.3803850412368774, "percent_done": 38.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5544.102431138085, "avg_wps": 4168.685481094917, "eta_in_seconds": 4842.075059761603, "at": "2024-05-26T00:41:26.154264"}
{"lr": 4.3309493392517e-05, "step": 193, "loss": 1.5278865098953247, "percent_done": 38.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139034271240234, "wps": 5548.627596303829, "avg_wps": 4174.064178408998, "eta_in_seconds": 4820.13479909378, "at": "2024-05-26T00:41:37.966544"}
{"lr": 4.313138327807234e-05, "step": 194, "loss": 1.8288185596466064, "percent_done": 38.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13921880722046, "wps": 5536.45461148206, "avg_wps": 4179.3654305104155, "eta_in_seconds": 4798.3399234727485, "at": "2024-05-26T00:41:49.804810"}
{"lr": 4.2952698759632504e-05, "step": 195, "loss": 1.122506022453308, "percent_done": 39.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13830041885376, "wps": 5535.220108612204, "avg_wps": 4184.621969232516, "eta_in_seconds": 4776.651307326097, "at": "2024-05-26T00:42:01.645708"}
{"lr": 4.277344765343719e-05, "step": 196, "loss": 1.3557201623916626, "percent_done": 39.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1389799118042, "wps": 5528.652719222615, "avg_wps": 4189.81868605775, "eta_in_seconds": 4755.085003152186, "at": "2024-05-26T00:42:13.500731"}
{"lr": 4.2593637800510475e-05, "step": 197, "loss": 1.6514897346496582, "percent_done": 39.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139344215393066, "wps": 5537.284723655701, "avg_wps": 4195.000559111975, "eta_in_seconds": 4733.588880427598, "at": "2024-05-26T00:42:25.337177"}
{"lr": 4.241327706631782e-05, "step": 198, "loss": 1.0746054649353027, "percent_done": 39.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5543.368983630239, "avg_wps": 4200.160390036222, "eta_in_seconds": 4712.170527332961, "at": "2024-05-26T00:42:37.160614"}
{"lr": 4.223237334042203e-05, "step": 199, "loss": 1.47548508644104, "percent_done": 39.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13890552520752, "wps": 5529.567922854537, "avg_wps": 4205.240869946182, "eta_in_seconds": 4690.893247276095, "at": "2024-05-26T00:42:49.013627"}
{"lr": 4.205093453613813e-05, "step": 200, "loss": 1.526173710823059, "percent_done": 40.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139493942260742, "wps": 5540.243052281161, "avg_wps": 4210.313551529432, "eta_in_seconds": 4669.67596578598, "at": "2024-05-26T00:43:00.843868"}
{"lr": 4.186896859018719e-05, "step": 201, "loss": 1.4787572622299194, "percent_done": 40.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139551639556885, "wps": 5596.201714965491, "avg_wps": 4215.507392203633, "eta_in_seconds": 4648.376144765029, "at": "2024-05-26T00:43:27.376702"}
{"lr": 4.1686483462349175e-05, "step": 202, "loss": 1.4978930950164795, "percent_done": 40.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1372709274292, "wps": 5560.3849281835455, "avg_wps": 4220.560943614809, "eta_in_seconds": 4627.282548673083, "at": "2024-05-26T00:43:39.163958"}
{"lr": 4.1503487135114756e-05, "step": 203, "loss": 1.2025593519210815, "percent_done": 40.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.14137363433838, "wps": 5556.142213502009, "avg_wps": 4225.5645791954, "eta_in_seconds": 4606.293818305866, "at": "2024-05-26T00:43:50.960251"}
{"lr": 4.1319987613336105e-05, "step": 204, "loss": 1.8979005813598633, "percent_done": 40.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5541.944682228907, "avg_wps": 4230.490412043713, "eta_in_seconds": 4585.4390651198, "at": "2024-05-26T00:44:02.786871"}
{"lr": 4.113599292387675e-05, "step": 205, "loss": 1.567550778388977, "percent_done": 41.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1387357711792, "wps": 5529.45902565837, "avg_wps": 4235.343865045288, "eta_in_seconds": 4564.710827746043, "at": "2024-05-26T00:44:14.640109"}
{"lr": 4.095151111526049e-05, "step": 206, "loss": 1.1945691108703613, "percent_done": 41.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1372709274292, "wps": 5541.909598040349, "avg_wps": 4240.196645060535, "eta_in_seconds": 4544.030763866832, "at": "2024-05-26T00:44:26.466748"}
{"lr": 4.076655025731926e-05, "step": 207, "loss": 1.416570782661438, "percent_done": 41.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5526.984356291331, "avg_wps": 4244.971091888022, "eta_in_seconds": 4523.4814523694595, "at": "2024-05-26T00:44:38.325229"}
{"lr": 4.058111844084018e-05, "step": 208, "loss": 1.490580677986145, "percent_done": 41.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5535.710811362995, "avg_wps": 4249.7350046017655, "eta_in_seconds": 4502.989475644552, "at": "2024-05-26T00:44:50.165132"}
{"lr": 4.0395223777211613e-05, "step": 209, "loss": 1.667999029159546, "percent_done": 41.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.141624927520752, "wps": 5531.944261856157, "avg_wps": 4254.453228868484, "eta_in_seconds": 4482.591528000444, "at": "2024-05-26T00:45:02.012975"}
{"lr": 4.020887439806836e-05, "step": 210, "loss": 1.9307905435562134, "percent_done": 42.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5537.607779624579, "avg_wps": 4259.152826815559, "eta_in_seconds": 4462.258287690935, "at": "2024-05-26T00:45:13.848847"}
{"lr": 4.0022078454935966e-05, "step": 211, "loss": 1.26886785030365, "percent_done": 42.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792896270752, "wps": 5522.882654546504, "avg_wps": 4263.776641407079, "eta_in_seconds": 4442.048820303515, "at": "2024-05-26T00:45:25.716202"}
{"lr": 3.9834844118874095e-05, "step": 212, "loss": 1.5193549394607544, "percent_done": 42.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.141427040100098, "wps": 5533.928890404986, "avg_wps": 4268.397803839718, "eta_in_seconds": 4421.885884914758, "at": "2024-05-26T00:45:37.559889"}
{"lr": 3.964717958011919e-05, "step": 213, "loss": 1.251197338104248, "percent_done": 42.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1380033493042, "wps": 5534.057684293295, "avg_wps": 4272.985822552458, "eta_in_seconds": 4401.800703556884, "at": "2024-05-26T00:45:49.403218"}
{"lr": 3.9459093047726116e-05, "step": 214, "loss": 1.432743787765503, "percent_done": 42.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1382474899292, "wps": 5540.013813136418, "avg_wps": 4277.557308878169, "eta_in_seconds": 4381.775543041318, "at": "2024-05-26T00:46:01.233842"}
{"lr": 3.92705927492091e-05, "step": 215, "loss": 1.4782277345657349, "percent_done": 43.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1370267868042, "wps": 5536.510368306427, "avg_wps": 4282.086184191149, "eta_in_seconds": 4361.836543354877, "at": "2024-05-26T00:46:13.072043"}
{"lr": 3.908168693018187e-05, "step": 216, "loss": 1.644234299659729, "percent_done": 43.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817262649536, "wps": 5532.466453108508, "avg_wps": 4286.571361637611, "eta_in_seconds": 4341.983937691759, "at": "2024-05-26T00:46:24.918860"}
{"lr": 3.889238385399692e-05, "step": 217, "loss": 1.4462400674819946, "percent_done": 43.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13890552520752, "wps": 5528.062318436874, "avg_wps": 4291.012258137125, "eta_in_seconds": 4322.217435951057, "at": "2024-05-26T00:46:36.775121"}
{"lr": 3.870269180138406e-05, "step": 218, "loss": 1.675262689590454, "percent_done": 43.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1380033493042, "wps": 5534.44844776445, "avg_wps": 4295.43916347693, "eta_in_seconds": 4302.505819926569, "at": "2024-05-26T00:46:48.617609"}
{"lr": 3.851261907008817e-05, "step": 219, "loss": 1.3199164867401123, "percent_done": 43.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5535.384075250543, "avg_wps": 4299.837237477709, "eta_in_seconds": 4282.863509224974, "at": "2024-05-26T00:47:00.458258"}
{"lr": 3.8322173974506286e-05, "step": 220, "loss": 1.6845101118087769, "percent_done": 44.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13995599746704, "wps": 5510.513466249422, "avg_wps": 4304.135562061595, "eta_in_seconds": 4263.36014175415, "at": "2024-05-26T00:47:12.352268"}
{"lr": 3.813136484532385e-05, "step": 221, "loss": 1.387367606163025, "percent_done": 44.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1399564743042, "wps": 5527.326662083986, "avg_wps": 4308.449838288029, "eta_in_seconds": 4243.879976856223, "at": "2024-05-26T00:47:24.210069"}
{"lr": 3.794020002915029e-05, "step": 222, "loss": 1.4622544050216675, "percent_done": 44.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5520.525512400772, "avg_wps": 4312.715114006132, "eta_in_seconds": 4224.486783472267, "at": "2024-05-26T00:47:36.082497"}
{"lr": 3.774868788815397e-05, "step": 223, "loss": 1.635811448097229, "percent_done": 44.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792848587036, "wps": 5533.602810192979, "avg_wps": 4316.9862513436165, "eta_in_seconds": 4205.126202185593, "at": "2024-05-26T00:47:47.926910"}
{"lr": 3.755683679969634e-05, "step": 224, "loss": 1.5653899908065796, "percent_done": 44.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5528.7669224035835, "avg_wps": 4321.214432036123, "eta_in_seconds": 4185.84550350053, "at": "2024-05-26T00:47:59.781640"}
{"lr": 3.736465515596552e-05, "step": 225, "loss": 1.6065657138824463, "percent_done": 45.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1392240524292, "wps": 5529.020254575828, "avg_wps": 4325.413898247056, "eta_in_seconds": 4166.63015932507, "at": "2024-05-26T00:48:11.635839"}
{"lr": 3.717215136360919e-05, "step": 226, "loss": 1.5461000204086304, "percent_done": 45.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5533.510797242492, "avg_wps": 4329.596437122061, "eta_in_seconds": 4147.468305830407, "at": "2024-05-26T00:48:23.480410"}
{"lr": 3.697933384336687e-05, "step": 227, "loss": 1.3097504377365112, "percent_done": 45.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13995599746704, "wps": 5512.12259994092, "avg_wps": 4333.692098894464, "eta_in_seconds": 4128.426199121097, "at": "2024-05-26T00:48:35.370927"}
{"lr": 3.6786211029701516e-05, "step": 228, "loss": 1.6260541677474976, "percent_done": 45.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13849115371704, "wps": 2808.324622321751, "avg_wps": 4323.392578538777, "eta_in_seconds": 4123.102789343449, "at": "2024-05-26T00:48:58.708265"}
{"lr": 3.659279137043063e-05, "step": 229, "loss": 1.5031825304031372, "percent_done": 45.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5571.398671168329, "avg_wps": 4327.625758035511, "eta_in_seconds": 4103.926030808661, "at": "2024-05-26T00:49:10.472346"}
{"lr": 3.639908332635672e-05, "step": 230, "loss": 1.608676791191101, "percent_done": 46.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1387357711792, "wps": 5544.593703509994, "avg_wps": 4331.759524281279, "eta_in_seconds": 4084.880497362303, "at": "2024-05-26T00:49:22.293236"}
{"lr": 3.6205095370897137e-05, "step": 231, "loss": 1.805351734161377, "percent_done": 46.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.14140796661377, "wps": 5539.069699711945, "avg_wps": 4335.8506645206, "eta_in_seconds": 4065.9112511083677, "at": "2024-05-26T00:49:34.125896"}
{"lr": 3.601083598971351e-05, "step": 232, "loss": 1.4192653894424438, "percent_done": 46.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5532.713999521479, "avg_wps": 4339.89733473655, "eta_in_seconds": 4047.019236934596, "at": "2024-05-26T00:49:45.972161"}
{"lr": 3.581631368034047e-05, "step": 233, "loss": 1.5427579879760742, "percent_done": 46.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5538.066436591779, "avg_wps": 4343.930880044961, "eta_in_seconds": 4028.1745919076156, "at": "2024-05-26T00:49:57.806991"}
{"lr": 3.5621536951813995e-05, "step": 234, "loss": 1.4073643684387207, "percent_done": 46.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5539.973840595753, "avg_wps": 4347.94238181473, "eta_in_seconds": 4009.3852376958243, "at": "2024-05-26T00:50:09.637759"}
{"lr": 3.542651432429918e-05, "step": 235, "loss": 1.5565159320831299, "percent_done": 47.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.138086318969727, "wps": 5532.181295517999, "avg_wps": 4351.906573304648, "eta_in_seconds": 3990.673905210292, "at": "2024-05-26T00:50:21.485170"}
{"lr": 3.523125432871754e-05, "step": 236, "loss": 1.3352882862091064, "percent_done": 47.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5530.5869145454035, "avg_wps": 4355.840123953177, "eta_in_seconds": 3972.0245710712366, "at": "2024-05-26T00:50:33.335979"}
{"lr": 3.503576550637384e-05, "step": 237, "loss": 1.6341153383255005, "percent_done": 47.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13873529434204, "wps": 5522.12885120343, "avg_wps": 4359.725296590551, "eta_in_seconds": 3953.452758475195, "at": "2024-05-26T00:50:45.204959"}
{"lr": 3.484005640858246e-05, "step": 238, "loss": 1.425567865371704, "percent_done": 47.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.14134693145752, "wps": 5536.1170836452475, "avg_wps": 4363.621277418509, "eta_in_seconds": 3934.904270646953, "at": "2024-05-26T00:50:57.043930"}
{"lr": 3.464413559629336e-05, "step": 239, "loss": 1.2422451972961426, "percent_done": 47.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13768482208252, "wps": 5527.562522108759, "avg_wps": 4367.469226769415, "eta_in_seconds": 3916.43194533791, "at": "2024-05-26T00:51:08.901282"}
{"lr": 3.444801163971754e-05, "step": 240, "loss": 1.5461735725402832, "percent_done": 48.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1406888961792, "wps": 5531.341025446556, "avg_wps": 4371.301656899959, "eta_in_seconds": 3898.0059802333512, "at": "2024-05-26T00:51:20.750660"}
{"lr": 3.4251693117952235e-05, "step": 241, "loss": 1.6313444375991821, "percent_done": 48.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5528.268444044248, "avg_wps": 4375.10095004529, "eta_in_seconds": 3879.6416799992444, "at": "2024-05-26T00:51:32.606526"}
{"lr": 3.4055188618605555e-05, "step": 242, "loss": 1.125512719154358, "percent_done": 48.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5537.499569525027, "avg_wps": 4378.899264957602, "eta_in_seconds": 3861.3101094399603, "at": "2024-05-26T00:51:44.442624"}
{"lr": 3.3858506737420905e-05, "step": 243, "loss": 1.6871873140335083, "percent_done": 48.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1399564743042, "wps": 5516.1301769274905, "avg_wps": 4382.617539458016, "eta_in_seconds": 3843.080498893565, "at": "2024-05-26T00:51:56.324569"}
{"lr": 3.366165607790091e-05, "step": 244, "loss": 1.508838415145874, "percent_done": 48.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5536.8670155193395, "avg_wps": 4386.365116295409, "eta_in_seconds": 3824.856243196081, "at": "2024-05-26T00:52:08.161952"}
{"lr": 3.3464645250931154e-05, "step": 245, "loss": 1.526856541633606, "percent_done": 49.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13995599746704, "wps": 5511.6593887264935, "avg_wps": 4390.023459904286, "eta_in_seconds": 3806.740477046188, "at": "2024-05-26T00:52:20.053560"}
{"lr": 3.3267482874403404e-05, "step": 246, "loss": 1.343733310699463, "percent_done": 49.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.14134693145752, "wps": 5528.1191293001275, "avg_wps": 4393.70048605466, "eta_in_seconds": 3788.6387688086284, "at": "2024-05-26T00:52:31.909674"}
{"lr": 3.3070177572838744e-05, "step": 247, "loss": 1.6397329568862915, "percent_done": 49.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139309406280518, "wps": 5531.113857944268, "avg_wps": 4397.361496325575, "eta_in_seconds": 3770.5810663632533, "at": "2024-05-26T00:52:43.759385"}
{"lr": 3.287273797701024e-05, "step": 248, "loss": 1.7264926433563232, "percent_done": 49.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13873529434204, "wps": 5524.28418381858, "avg_wps": 4400.9815580735885, "eta_in_seconds": 3752.588321962664, "at": "2024-05-26T00:52:55.623726"}
{"lr": 3.267517272356543e-05, "step": 249, "loss": 1.706379771232605, "percent_done": 49.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.141398906707764, "wps": 5536.513713751602, "avg_wps": 4404.609590248677, "eta_in_seconds": 3734.6183953323516, "at": "2024-05-26T00:53:07.461861"}
{"lr": 3.247749045464852e-05, "step": 250, "loss": 1.6563538312911987, "percent_done": 50.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139185905456543, "wps": 5534.978802166535, "avg_wps": 4408.210619804437, "eta_in_seconds": 3716.7008142471313, "at": "2024-05-26T00:53:19.303283"}
{"lr": 3.227969981752235e-05, "step": 251, "loss": 1.1807035207748413, "percent_done": 50.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137569427490234, "wps": 5526.1845485071035, "avg_wps": 4411.766483353033, "eta_in_seconds": 3698.850349757776, "at": "2024-05-26T00:53:31.163558"}
{"lr": 3.208180946419016e-05, "step": 252, "loss": 1.2953325510025024, "percent_done": 50.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13995599746704, "wps": 5509.568005409552, "avg_wps": 4415.257579297445, "eta_in_seconds": 3681.082634047856, "at": "2024-05-26T00:53:43.059603"}
{"lr": 3.188382805101706e-05, "step": 253, "loss": 1.3787448406219482, "percent_done": 50.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5531.01647435701, "avg_wps": 4418.7808608415135, "eta_in_seconds": 3663.3163104896016, "at": "2024-05-26T00:53:54.909438"}
{"lr": 3.168576423835144e-05, "step": 254, "loss": 1.3832790851593018, "percent_done": 50.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13890552520752, "wps": 5528.566319366759, "avg_wps": 4422.275791900193, "eta_in_seconds": 3645.6016672521123, "at": "2024-05-26T00:54:06.764651"}
{"lr": 3.148762669014611e-05, "step": 255, "loss": 1.6247435808181763, "percent_done": 51.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5534.374123801316, "avg_wps": 4425.763359897295, "eta_in_seconds": 3627.9210374168324, "at": "2024-05-26T00:54:18.607391"}
{"lr": 3.12894240735793e-05, "step": 256, "loss": 1.197739839553833, "percent_done": 51.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1372709274292, "wps": 5532.6957362312305, "avg_wps": 4429.2249215600295, "eta_in_seconds": 3610.289448648691, "at": "2024-05-26T00:54:30.453702"}
{"lr": 3.109116505867555e-05, "step": 257, "loss": 1.3123215436935425, "percent_done": 51.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1372709274292, "wps": 5547.986786697155, "avg_wps": 4432.702986970204, "eta_in_seconds": 3592.67202129531, "at": "2024-05-26T00:54:42.267378"}
{"lr": 3.089285831792642e-05, "step": 258, "loss": 1.6977781057357788, "percent_done": 51.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5528.743125051717, "avg_wps": 4436.111640089365, "eta_in_seconds": 3575.1381585339245, "at": "2024-05-26T00:54:54.122156"}
{"lr": 3.0694512525911205e-05, "step": 259, "loss": 1.0950196981430054, "percent_done": 51.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1380033493042, "wps": 5534.838597738931, "avg_wps": 4439.514315447596, "eta_in_seconds": 3557.6360110030673, "at": "2024-05-26T00:55:05.963894"}
{"lr": 3.0496136358917387e-05, "step": 260, "loss": 1.3071869611740112, "percent_done": 52.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5535.010900840757, "avg_wps": 4442.896407211733, "eta_in_seconds": 3540.17707333198, "at": "2024-05-26T00:55:17.805265"}
{"lr": 3.029773849456115e-05, "step": 261, "loss": 1.543917179107666, "percent_done": 52.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963747024536, "wps": 5523.823033593049, "avg_wps": 4446.229964108923, "eta_in_seconds": 3522.7831503175685, "at": "2024-05-26T00:55:29.670622"}
{"lr": 3.009932761140782e-05, "step": 262, "loss": 1.5751579999923706, "percent_done": 52.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1372709274292, "wps": 5544.538007433828, "avg_wps": 4449.594133901399, "eta_in_seconds": 3505.391172907735, "at": "2024-05-26T00:55:41.491625"}
{"lr": 2.9900912388592177e-05, "step": 263, "loss": 1.1802653074264526, "percent_done": 52.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5536.393280272336, "avg_wps": 4452.917753268135, "eta_in_seconds": 3488.0572381110246, "at": "2024-05-26T00:55:53.329982"}
{"lr": 2.9702501505438846e-05, "step": 264, "loss": 1.4496034383773804, "percent_done": 52.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1405029296875, "wps": 5538.008863218723, "avg_wps": 4456.225069707394, "eta_in_seconds": 3470.761857415691, "at": "2024-05-26T00:56:05.165005"}
{"lr": 2.9504103641082615e-05, "step": 265, "loss": 1.2859277725219727, "percent_done": 53.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137210845947266, "wps": 5541.263971855777, "avg_wps": 4459.52024661947, "eta_in_seconds": 3453.5015311735983, "at": "2024-05-26T00:56:16.993024"}
{"lr": 2.93057274740888e-05, "step": 266, "loss": 1.5144016742706299, "percent_done": 53.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139424800872803, "wps": 5527.408799553815, "avg_wps": 4462.761600111927, "eta_in_seconds": 3436.3081370099144, "at": "2024-05-26T00:56:28.850617"}
{"lr": 2.9107381682073582e-05, "step": 267, "loss": 1.6225457191467285, "percent_done": 53.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5540.866995945731, "avg_wps": 4466.016161916648, "eta_in_seconds": 3419.1295880682014, "at": "2024-05-26T00:56:40.679565"}
{"lr": 2.8909074941324465e-05, "step": 268, "loss": 1.184424877166748, "percent_done": 53.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1387357711792, "wps": 5531.724726015742, "avg_wps": 4469.228902802474, "eta_in_seconds": 3402.0078923381975, "at": "2024-05-26T00:56:52.527961"}
{"lr": 2.8710815926420708e-05, "step": 269, "loss": 1.7449427843093872, "percent_done": 53.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5538.856629348349, "avg_wps": 4472.4396398281415, "eta_in_seconds": 3384.912311657654, "at": "2024-05-26T00:57:04.361113"}
{"lr": 2.851261330985389e-05, "step": 270, "loss": 1.6234735250473022, "percent_done": 54.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137887477874756, "wps": 5533.3855932514725, "avg_wps": 4475.617915511204, "eta_in_seconds": 3367.8656857102005, "at": "2024-05-26T00:57:16.205956"}
{"lr": 2.8314475761648556e-05, "step": 271, "loss": 1.1902457475662231, "percent_done": 54.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1397123336792, "wps": 5539.079410485766, "avg_wps": 4478.790956485106, "eta_in_seconds": 3350.8471696517563, "at": "2024-05-26T00:57:28.038572"}
{"lr": 2.811641194898294e-05, "step": 272, "loss": 1.4205036163330078, "percent_done": 54.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5536.018966326275, "avg_wps": 4481.937748267793, "eta_in_seconds": 3333.872275618946, "at": "2024-05-26T00:57:39.877881"}
{"lr": 2.7918430535809843e-05, "step": 273, "loss": 1.005091667175293, "percent_done": 54.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5538.130482796971, "avg_wps": 4485.070937758747, "eta_in_seconds": 3316.931260720278, "at": "2024-05-26T00:57:51.712595"}
{"lr": 2.772054018247765e-05, "step": 274, "loss": 1.2020037174224854, "percent_done": 54.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137707233428955, "wps": 5529.24002068975, "avg_wps": 4488.164248618584, "eta_in_seconds": 3300.043220245055, "at": "2024-05-26T00:58:03.590415"}
{"lr": 2.7522749545351488e-05, "step": 275, "loss": 1.2330303192138672, "percent_done": 55.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1370267868042, "wps": 5533.795869101056, "avg_wps": 4491.250207461964, "eta_in_seconds": 3283.183817169883, "at": "2024-05-26T00:58:15.434462"}
{"lr": 2.7325067276434586e-05, "step": 276, "loss": 1.5320179462432861, "percent_done": 55.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.140522956848145, "wps": 5539.285912012344, "avg_wps": 4494.331112267575, "eta_in_seconds": 3266.351239660512, "at": "2024-05-26T00:58:27.266703"}
{"lr": 2.7127502022989765e-05, "step": 277, "loss": 1.179079294204712, "percent_done": 55.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13890552520752, "wps": 5522.972760795532, "avg_wps": 4497.355020491515, "eta_in_seconds": 3249.5829067109726, "at": "2024-05-26T00:58:39.133893"}
{"lr": 2.693006242716126e-05, "step": 278, "loss": 1.4817994832992554, "percent_done": 55.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5538.101025821754, "avg_wps": 4500.39723569289, "eta_in_seconds": 3232.8239570967585, "at": "2024-05-26T00:58:50.968629"}
{"lr": 2.6732757125596597e-05, "step": 279, "loss": 1.6966520547866821, "percent_done": 55.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5532.905548609737, "avg_wps": 4503.409392151352, "eta_in_seconds": 3216.109116182532, "at": "2024-05-26T00:59:02.814541"}
{"lr": 2.653559474906885e-05, "step": 280, "loss": 1.6227508783340454, "percent_done": 56.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137199878692627, "wps": 5514.956945650416, "avg_wps": 4506.361363657148, "eta_in_seconds": 3199.45935012613, "at": "2024-05-26T00:59:14.698974"}
{"lr": 2.6338583922099093e-05, "step": 281, "loss": 1.2926881313323975, "percent_done": 56.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792896270752, "wps": 5534.2261504001835, "avg_wps": 4509.341841689588, "eta_in_seconds": 3182.811262457396, "at": "2024-05-26T00:59:26.542022"}
{"lr": 2.6141733262579107e-05, "step": 282, "loss": 1.2204015254974365, "percent_done": 56.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.14134693145752, "wps": 5538.880290622555, "avg_wps": 4512.316047333792, "eta_in_seconds": 3166.1895687563197, "at": "2024-05-26T00:59:38.375148"}
{"lr": 2.5945051381394456e-05, "step": 283, "loss": 1.5107355117797852, "percent_done": 56.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792896270752, "wps": 5552.843918788635, "avg_wps": 4515.305825641744, "eta_in_seconds": 3149.5789098579558, "at": "2024-05-26T00:59:50.178525"}
{"lr": 2.574854688204777e-05, "step": 284, "loss": 1.6739741563796997, "percent_done": 56.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817262649536, "wps": 5526.0876717026995, "avg_wps": 4518.215794168703, "eta_in_seconds": 3133.045574819538, "at": "2024-05-26T01:00:02.039040"}
{"lr": 2.555222836028246e-05, "step": 285, "loss": 1.445129156112671, "percent_done": 57.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5512.8998776916305, "avg_wps": 4521.078008843842, "eta_in_seconds": 3116.566441109306, "at": "2024-05-26T01:00:13.927902"}
{"lr": 2.5356104403706647e-05, "step": 286, "loss": 1.277710199356079, "percent_done": 57.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5534.471402795223, "avg_wps": 4523.974392085318, "eta_in_seconds": 3100.084745071985, "at": "2024-05-26T01:00:25.770419"}
{"lr": 2.5160183591417547e-05, "step": 287, "loss": 1.2438263893127441, "percent_done": 57.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137596607208252, "wps": 5525.886374342613, "avg_wps": 4526.834222718159, "eta_in_seconds": 3083.6490388680836, "at": "2024-05-26T01:00:37.631344"}
{"lr": 2.4964474493626167e-05, "step": 288, "loss": 1.4689997434616089, "percent_done": 57.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5535.8439247466695, "avg_wps": 4529.700964323227, "eta_in_seconds": 3067.2294064064818, "at": "2024-05-26T01:00:49.470961"}
{"lr": 2.4768985671282466e-05, "step": 289, "loss": 1.5166946649551392, "percent_done": 57.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5529.101775088918, "avg_wps": 4532.535804074292, "eta_in_seconds": 3050.85201700336, "at": "2024-05-26T01:01:01.324956"}
{"lr": 2.457372567570083e-05, "step": 290, "loss": 1.2938913106918335, "percent_done": 58.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13890552520752, "wps": 5528.222525844154, "avg_wps": 4535.3525667349295, "eta_in_seconds": 3034.507195965997, "at": "2024-05-26T01:01:13.180849"}
{"lr": 2.4378703048186006e-05, "step": 291, "loss": 1.318616271018982, "percent_done": 58.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13748550415039, "wps": 5535.9577562605255, "avg_wps": 4538.171325319706, "eta_in_seconds": 3018.1813373991713, "at": "2024-05-26T01:01:25.020198"}
{"lr": 2.4183926319659536e-05, "step": 292, "loss": 1.2825901508331299, "percent_done": 58.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.138924598693848, "wps": 5525.258913939859, "avg_wps": 4540.949546913198, "eta_in_seconds": 3001.90254464868, "at": "2024-05-26T01:01:36.882483"}
{"lr": 2.3989404010286496e-05, "step": 293, "loss": 1.2012560367584229, "percent_done": 58.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1387357711792, "wps": 5516.096857843715, "avg_wps": 4543.690991752467, "eta_in_seconds": 2985.6678248200396, "at": "2024-05-26T01:01:48.764522"}
{"lr": 2.379514462910286e-05, "step": 294, "loss": 1.5051480531692505, "percent_done": 58.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1372709274292, "wps": 5539.113231032796, "avg_wps": 4546.470027275156, "eta_in_seconds": 2969.42813193717, "at": "2024-05-26T01:02:00.597240"}
{"lr": 2.3601156673643287e-05, "step": 295, "loss": 1.293953537940979, "percent_done": 59.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1384916305542, "wps": 5534.530128425111, "avg_wps": 4549.223100903126, "eta_in_seconds": 2953.2251336130043, "at": "2024-05-26T01:02:12.439712"}
{"lr": 2.340744862956937e-05, "step": 296, "loss": 1.432934284210205, "percent_done": 59.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5527.644221957036, "avg_wps": 4551.945119217193, "eta_in_seconds": 2937.061772462484, "at": "2024-05-26T01:02:24.296933"}
{"lr": 2.3214028970298496e-05, "step": 297, "loss": 1.1521751880645752, "percent_done": 59.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792896270752, "wps": 5548.077378022608, "avg_wps": 4554.698572337183, "eta_in_seconds": 2920.8975717515655, "at": "2024-05-26T01:02:36.110557"}
{"lr": 2.3020906156633134e-05, "step": 298, "loss": 1.6014556884765625, "percent_done": 59.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137086868286133, "wps": 5535.5268712425395, "avg_wps": 4557.408362770301, "eta_in_seconds": 2904.7807319932335, "at": "2024-05-26T01:02:47.950911"}
{"lr": 2.2828088636390805e-05, "step": 299, "loss": 1.257323980331421, "percent_done": 59.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13995599746704, "wps": 5506.703782656311, "avg_wps": 4560.037461480972, "eta_in_seconds": 2888.7341631009026, "at": "2024-05-26T01:02:59.853252"}
{"lr": 2.2635584844034485e-05, "step": 300, "loss": 1.041149616241455, "percent_done": 60.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137259483337402, "wps": 5540.2576804593755, "avg_wps": 4562.728358336017, "eta_in_seconds": 2872.667178630829, "at": "2024-05-26T01:03:11.683548"}
{"lr": 2.244340320030367e-05, "step": 301, "loss": 1.1909679174423218, "percent_done": 60.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5601.087634520706, "avg_wps": 4565.540265389221, "eta_in_seconds": 2856.54341915834, "at": "2024-05-26T01:03:37.980724"}
{"lr": 2.225155211184604e-05, "step": 302, "loss": 1.3130428791046143, "percent_done": 60.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792896270752, "wps": 5559.977785486543, "avg_wps": 4568.245761802313, "eta_in_seconds": 2840.50567254957, "at": "2024-05-26T01:03:49.768929"}
{"lr": 2.2060039970849715e-05, "step": 303, "loss": 1.327286720275879, "percent_done": 60.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139549255371094, "wps": 5553.915384460738, "avg_wps": 4570.923039338312, "eta_in_seconds": 2824.5043482221786, "at": "2024-05-26T01:04:01.569963"}
{"lr": 2.186887515467616e-05, "step": 304, "loss": 1.2636806964874268, "percent_done": 60.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13875722885132, "wps": 5535.986744465381, "avg_wps": 4573.545689597156, "eta_in_seconds": 2808.5553029932476, "at": "2024-05-26T01:04:13.409240"}
{"lr": 2.167806602549372e-05, "step": 305, "loss": 1.4129942655563354, "percent_done": 61.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5540.104255930096, "avg_wps": 4576.1633416315635, "eta_in_seconds": 2792.627589085063, "at": "2024-05-26T01:04:25.239781"}
{"lr": 2.148762092991183e-05, "step": 306, "loss": 1.423150658607483, "percent_done": 61.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139676094055176, "wps": 5547.69342100268, "avg_wps": 4578.783771293298, "eta_in_seconds": 2776.7164022268034, "at": "2024-05-26T01:04:37.054010"}
{"lr": 2.129754819861595e-05, "step": 307, "loss": 1.5841243267059326, "percent_done": 61.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13897943496704, "wps": 5521.223982083363, "avg_wps": 4581.331022280492, "eta_in_seconds": 2760.867516118463, "at": "2024-05-26T01:04:48.924937"}
{"lr": 2.1107856146003084e-05, "step": 308, "loss": 1.2460328340530396, "percent_done": 61.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.138951301574707, "wps": 5536.44847829994, "avg_wps": 4583.8985184096855, "eta_in_seconds": 2745.024120727143, "at": "2024-05-26T01:05:00.763195"}
{"lr": 2.0918553069818132e-05, "step": 309, "loss": 1.5161986351013184, "percent_done": 61.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1387357711792, "wps": 5527.5794176616155, "avg_wps": 4586.432518945001, "eta_in_seconds": 2729.2183954075313, "at": "2024-05-26T01:05:12.620454"}
{"lr": 2.0729647250790905e-05, "step": 310, "loss": 1.587321400642395, "percent_done": 62.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137510776519775, "wps": 5536.1954685024975, "avg_wps": 4588.972073396198, "eta_in_seconds": 2713.4268417512217, "at": "2024-05-26T01:05:24.459360"}
{"lr": 2.0541146952273892e-05, "step": 311, "loss": 1.3615864515304565, "percent_done": 62.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5534.504832792271, "avg_wps": 4591.494342811603, "eta_in_seconds": 2697.662912161021, "at": "2024-05-26T01:05:36.301703"}
{"lr": 2.0353060419880816e-05, "step": 312, "loss": 1.683513879776001, "percent_done": 62.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5535.882276859177, "avg_wps": 4594.006232537883, "eta_in_seconds": 2681.9223519410843, "at": "2024-05-26T01:05:48.141183"}
{"lr": 2.01653958811259e-05, "step": 313, "loss": 1.048714518547058, "percent_done": 62.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1375150680542, "wps": 5512.02102059552, "avg_wps": 4596.452011498966, "eta_in_seconds": 2666.2373433554894, "at": "2024-05-26T01:06:00.031899"}
{"lr": 1.997816154506404e-05, "step": 314, "loss": 1.4360339641571045, "percent_done": 62.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1372709274292, "wps": 5529.866383223986, "avg_wps": 4598.924227720912, "eta_in_seconds": 2650.5537809308166, "at": "2024-05-26T01:06:11.884227"}
{"lr": 1.979136560193164e-05, "step": 315, "loss": 1.838736653327942, "percent_done": 63.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13912343978882, "wps": 5530.424455945281, "avg_wps": 4601.384609391944, "eta_in_seconds": 2634.8938480937295, "at": "2024-05-26T01:06:23.735460"}
{"lr": 1.9605016222788395e-05, "step": 316, "loss": 1.4693397283554077, "percent_done": 63.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5530.504682595344, "avg_wps": 4603.8322039696895, "eta_in_seconds": 2619.257928123957, "at": "2024-05-26T01:06:35.586409"}
{"lr": 1.9419121559159824e-05, "step": 317, "loss": 1.4064899682998657, "percent_done": 63.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792848587036, "wps": 5512.320132194016, "avg_wps": 4606.227012546687, "eta_in_seconds": 2603.6684617003434, "at": "2024-05-26T01:06:47.476488"}
{"lr": 1.9233689742680746e-05, "step": 318, "loss": 1.6543333530426025, "percent_done": 63.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13942050933838, "wps": 5526.7246545026865, "avg_wps": 4608.640808712972, "eta_in_seconds": 2588.084534045285, "at": "2024-05-26T01:06:59.335585"}
{"lr": 1.9048728884739516e-05, "step": 319, "loss": 1.408535122871399, "percent_done": 63.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5529.425767819157, "avg_wps": 4611.047869912337, "eta_in_seconds": 2572.520679605418, "at": "2024-05-26T01:07:11.188893"}
{"lr": 1.886424707612324e-05, "step": 320, "loss": 1.5866949558258057, "percent_done": 64.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.140464305877686, "wps": 5523.08539774153, "avg_wps": 4613.428570465795, "eta_in_seconds": 2556.9876762628555, "at": "2024-05-26T01:07:23.055887"}
{"lr": 1.86802523866639e-05, "step": 321, "loss": 1.4521435499191284, "percent_done": 64.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1387357711792, "wps": 5525.252361290496, "avg_wps": 4615.801587743876, "eta_in_seconds": 2541.4749262941964, "at": "2024-05-26T01:07:34.918107"}
{"lr": 1.8496752864885245e-05, "step": 322, "loss": 1.5227761268615723, "percent_done": 64.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.14044427871704, "wps": 5525.6104474875965, "avg_wps": 4618.163062401021, "eta_in_seconds": 2525.9844319864833, "at": "2024-05-26T01:07:46.779612"}
{"lr": 1.831375653765083e-05, "step": 323, "loss": 1.3907850980758667, "percent_done": 64.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5527.902231483192, "avg_wps": 4620.517269233944, "eta_in_seconds": 2510.513720452601, "at": "2024-05-26T01:07:58.636159"}
{"lr": 1.813127140981282e-05, "step": 324, "loss": 1.3556586503982544, "percent_done": 64.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.138609886169434, "wps": 5512.704515043262, "avg_wps": 4622.8264284218185, "eta_in_seconds": 2495.083079279205, "at": "2024-05-26T01:08:10.525544"}
{"lr": 1.794930546386188e-05, "step": 325, "loss": 1.193861722946167, "percent_done": 65.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817262649536, "wps": 5516.623036431604, "avg_wps": 4625.132146359272, "eta_in_seconds": 2479.669690957436, "at": "2024-05-26T01:08:22.406274"}
{"lr": 1.7767866659577976e-05, "step": 326, "loss": 1.2673518657684326, "percent_done": 65.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13727045059204, "wps": 5518.114328739708, "avg_wps": 4627.429216642468, "eta_in_seconds": 2464.2762679088337, "at": "2024-05-26T01:08:34.283865"}
{"lr": 1.758696293368218e-05, "step": 327, "loss": 1.4862715005874634, "percent_done": 65.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5520.588377414058, "avg_wps": 4629.719822922852, "eta_in_seconds": 2448.901539109169, "at": "2024-05-26T01:08:46.156176"}
{"lr": 1.740660219948953e-05, "step": 328, "loss": 1.3229244947433472, "percent_done": 65.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1380033493042, "wps": 5513.1451232983945, "avg_wps": 4631.9827131895145, "eta_in_seconds": 2433.5565778133346, "at": "2024-05-26T01:08:58.044457"}
{"lr": 1.7226792346562806e-05, "step": 329, "loss": 1.0695526599884033, "percent_done": 65.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137794017791748, "wps": 5520.521521019695, "avg_wps": 4634.249861029113, "eta_in_seconds": 2418.2243806576657, "at": "2024-05-26T01:09:09.917024"}
{"lr": 1.7047541240367497e-05, "step": 330, "loss": 1.2772799730300903, "percent_done": 66.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1380033493042, "wps": 5524.147518129011, "avg_wps": 4636.51321436569, "eta_in_seconds": 2402.909144199256, "at": "2024-05-26T01:09:21.781632"}
{"lr": 1.6868856721927658e-05, "step": 331, "loss": 1.3015071153640747, "percent_done": 66.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5530.707095541982, "avg_wps": 4638.779041259455, "eta_in_seconds": 2387.6075798154234, "at": "2024-05-26T01:09:33.632306"}
{"lr": 1.669074660748301e-05, "step": 332, "loss": 1.2681198120117188, "percent_done": 66.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5533.303389441862, "avg_wps": 4641.038918298698, "eta_in_seconds": 2372.3239976699097, "at": "2024-05-26T01:09:45.477350"}
{"lr": 1.6513218688146936e-05, "step": 333, "loss": 1.077351689338684, "percent_done": 66.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1380033493042, "wps": 5532.607539599817, "avg_wps": 4643.285933992912, "eta_in_seconds": 2357.0618212151453, "at": "2024-05-26T01:09:57.323944"}
{"lr": 1.6336280729565724e-05, "step": 334, "loss": 1.0104950666427612, "percent_done": 66.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.141358852386475, "wps": 5545.151396999249, "avg_wps": 4645.548070660843, "eta_in_seconds": 2341.8067867398977, "at": "2024-05-26T01:10:09.143782"}
{"lr": 1.6159940471578926e-05, "step": 335, "loss": 1.0948432683944702, "percent_done": 67.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5540.053562938807, "avg_wps": 4647.788186973401, "eta_in_seconds": 2326.577624666157, "at": "2024-05-26T01:10:20.974382"}
{"lr": 1.598420562788065e-05, "step": 336, "loss": 1.62564218044281, "percent_done": 67.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817262649536, "wps": 5530.313077173483, "avg_wps": 4649.996652415117, "eta_in_seconds": 2311.378868287518, "at": "2024-05-26T01:10:32.825821"}
{"lr": 1.5809083885682293e-05, "step": 337, "loss": 1.3993029594421387, "percent_done": 67.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13819980621338, "wps": 5540.200954825271, "avg_wps": 4652.214818345599, "eta_in_seconds": 2296.189754152156, "at": "2024-05-26T01:10:44.656133"}
{"lr": 1.5634582905376138e-05, "step": 338, "loss": 1.1360607147216797, "percent_done": 67.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792896270752, "wps": 5536.252892672875, "avg_wps": 4654.413707475299, "eta_in_seconds": 2281.0245644792294, "at": "2024-05-26T01:10:56.494858"}
{"lr": 1.546071032020041e-05, "step": 339, "loss": 1.3813202381134033, "percent_done": 67.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13995599746704, "wps": 5521.306049180372, "avg_wps": 4656.570407886061, "eta_in_seconds": 2265.8942259588775, "at": "2024-05-26T01:11:08.365761"}
{"lr": 1.5287473735905225e-05, "step": 340, "loss": 1.1545019149780273, "percent_done": 68.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13843536376953, "wps": 5539.6732834303475, "avg_wps": 4658.754737015351, "eta_in_seconds": 2250.764548021204, "at": "2024-05-26T01:11:20.197153"}
{"lr": 1.5114880730419973e-05, "step": 341, "loss": 1.9393445253372192, "percent_done": 68.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5535.765549843778, "avg_wps": 4660.920168987583, "eta_in_seconds": 2235.658115179308, "at": "2024-05-26T01:11:32.036940"}
{"lr": 1.4942938853521888e-05, "step": 342, "loss": 1.5955932140350342, "percent_done": 68.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137256622314453, "wps": 5529.3659269621685, "avg_wps": 4663.061641067549, "eta_in_seconds": 2220.577122293718, "at": "2024-05-26T01:11:43.890427"}
{"lr": 1.4771655626505637e-05, "step": 343, "loss": 1.489546298980713, "percent_done": 68.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963747024536, "wps": 5535.5605369446, "avg_wps": 4665.205419675395, "eta_in_seconds": 2205.508884261718, "at": "2024-05-26T01:11:55.730795"}
{"lr": 1.4601038541854481e-05, "step": 344, "loss": 1.368099570274353, "percent_done": 68.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13988208770752, "wps": 5541.010410055027, "avg_wps": 4667.3499410081895, "eta_in_seconds": 2190.4541397621465, "at": "2024-05-26T01:12:07.559306"}
{"lr": 1.4431095062912406e-05, "step": 345, "loss": 1.371695637702942, "percent_done": 69.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5539.930407399604, "avg_wps": 4669.481762154883, "eta_in_seconds": 2175.4191401557646, "at": "2024-05-26T01:12:19.390170"}
{"lr": 1.426183262355772e-05, "step": 346, "loss": 1.3988710641860962, "percent_done": 69.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.140594959259033, "wps": 5530.285483525829, "avg_wps": 4671.583335669962, "eta_in_seconds": 2160.411850718405, "at": "2024-05-26T01:12:31.241703"}
{"lr": 1.4093258627877864e-05, "step": 347, "loss": 1.3253638744354248, "percent_done": 69.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.14137363433838, "wps": 5546.714341652883, "avg_wps": 4673.708386916458, "eta_in_seconds": 2145.4072804519697, "at": "2024-05-26T01:12:43.058109"}
{"lr": 1.392538044984549e-05, "step": 348, "loss": 1.4922512769699097, "percent_done": 69.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1372709274292, "wps": 5538.872031475573, "avg_wps": 4675.80710581218, "eta_in_seconds": 2130.428346288615, "at": "2024-05-26T01:12:54.891399"}
{"lr": 1.3758205432995999e-05, "step": 349, "loss": 1.6032309532165527, "percent_done": 69.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 2799.847247287034, "avg_wps": 4666.847531236229, "eta_in_seconds": 2120.475531665507, "at": "2024-05-26T01:13:18.299547"}
{"lr": 1.3591740890106174e-05, "step": 350, "loss": 1.3721952438354492, "percent_done": 70.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1370267868042, "wps": 5549.921649644395, "avg_wps": 4668.970107745052, "eta_in_seconds": 2105.4750347818645, "at": "2024-05-26T01:13:30.109046"}
{"lr": 1.342599410287438e-05, "step": 351, "loss": 1.2236526012420654, "percent_done": 70.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1384916305542, "wps": 5549.655530169466, "avg_wps": 4671.081967881481, "eta_in_seconds": 2090.492966542556, "at": "2024-05-26T01:13:41.919144"}
{"lr": 1.3260972321602061e-05, "step": 352, "loss": 1.4053864479064941, "percent_done": 70.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5543.081359716434, "avg_wps": 4673.170465039946, "eta_in_seconds": 2075.5348157232456, "at": "2024-05-26T01:13:53.743310"}
{"lr": 1.3096682764876501e-05, "step": 353, "loss": 1.396177887916565, "percent_done": 70.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.141611099243164, "wps": 5543.549979543282, "avg_wps": 4675.249926233429, "eta_in_seconds": 2060.5940114438704, "at": "2024-05-26T01:14:05.566377"}
{"lr": 1.2933132619255162e-05, "step": 354, "loss": 1.6633139848709106, "percent_done": 70.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13971185684204, "wps": 5532.296980664749, "avg_wps": 4677.296799001518, "eta_in_seconds": 2045.6807449214202, "at": "2024-05-26T01:14:17.413596"}
{"lr": 1.2770329038951215e-05, "step": 355, "loss": 1.4951876401901245, "percent_done": 71.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139026641845703, "wps": 5536.351241300769, "avg_wps": 4679.342082409068, "eta_in_seconds": 2030.7812151035791, "at": "2024-05-26T01:14:29.252008"}
{"lr": 1.2608279145520686e-05, "step": 356, "loss": 1.7069875001907349, "percent_done": 71.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13854217529297, "wps": 5521.726625886975, "avg_wps": 4681.348200228023, "eta_in_seconds": 2015.9115699918082, "at": "2024-05-26T01:14:41.121917"}
{"lr": 1.2446990027550896e-05, "step": 357, "loss": 1.1795735359191895, "percent_done": 71.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5523.999313996375, "avg_wps": 4683.349363497956, "eta_in_seconds": 2001.0567806541753, "at": "2024-05-26T01:14:52.986808"}
{"lr": 1.2286468740350344e-05, "step": 358, "loss": 1.3241490125656128, "percent_done": 71.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1397123336792, "wps": 5535.469685077949, "avg_wps": 4685.364046674451, "eta_in_seconds": 1986.208949250216, "at": "2024-05-26T01:15:04.827224"}
{"lr": 1.2126722305640172e-05, "step": 359, "loss": 1.286388874053955, "percent_done": 71.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5531.542052526424, "avg_wps": 4687.361375192172, "eta_in_seconds": 1971.3811802319497, "at": "2024-05-26T01:15:16.676016"}
{"lr": 1.1967757711246922e-05, "step": 360, "loss": 1.0435327291488647, "percent_done": 72.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5527.839977949607, "avg_wps": 4689.341901413824, "eta_in_seconds": 1956.5730528699028, "at": "2024-05-26T01:15:28.532745"}
{"lr": 1.1809581910796943e-05, "step": 361, "loss": 1.5640085935592651, "percent_done": 72.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.14134693145752, "wps": 5527.675457503188, "avg_wps": 4691.312787399688, "eta_in_seconds": 1941.781418725064, "at": "2024-05-26T01:15:40.389878"}
{"lr": 1.1652201823412147e-05, "step": 362, "loss": 1.3622779846191406, "percent_done": 72.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1372709274292, "wps": 5525.521810167331, "avg_wps": 4693.2701377464045, "eta_in_seconds": 1927.007765281266, "at": "2024-05-26T01:15:52.251513"}
{"lr": 1.1495624333407409e-05, "step": 363, "loss": 1.2254904508590698, "percent_done": 72.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792896270752, "wps": 5529.940029910749, "avg_wps": 4695.227105628912, "eta_in_seconds": 1912.2465853113115, "at": "2024-05-26T01:16:04.103751"}
{"lr": 1.133985628998939e-05, "step": 364, "loss": 1.4732694625854492, "percent_done": 72.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5531.145132715192, "avg_wps": 4697.177328338779, "eta_in_seconds": 1897.5004299341979, "at": "2024-05-26T01:16:15.953430"}
{"lr": 1.1184904506956906e-05, "step": 365, "loss": 1.7372241020202637, "percent_done": 73.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137560844421387, "wps": 5518.700833643773, "avg_wps": 4699.09380878566, "eta_in_seconds": 1882.7800337713059, "at": "2024-05-26T01:16:27.829813"}
{"lr": 1.1030775762402946e-05, "step": 366, "loss": 1.1547083854675293, "percent_done": 73.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5529.9827503379865, "avg_wps": 4701.023689902065, "eta_in_seconds": 1868.0663147611044, "at": "2024-05-26T01:16:39.682168"}
{"lr": 1.0877476798418077e-05, "step": 367, "loss": 1.304084062576294, "percent_done": 73.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137547969818115, "wps": 5529.8643807734925, "avg_wps": 4702.944393558633, "eta_in_seconds": 1853.3682881596953, "at": "2024-05-26T01:16:51.534592"}
{"lr": 1.0725014320795634e-05, "step": 368, "loss": 1.2010260820388794, "percent_done": 73.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5526.495643780223, "avg_wps": 4704.849585446528, "eta_in_seconds": 1838.6883242259855, "at": "2024-05-26T01:17:03.394351"}
{"lr": 1.0573394998738269e-05, "step": 369, "loss": 1.5033233165740967, "percent_done": 73.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1399564743042, "wps": 5507.461435735282, "avg_wps": 4706.708438388072, "eta_in_seconds": 1824.0382025745826, "at": "2024-05-26T01:17:15.294947"}
{"lr": 1.0422625464566322e-05, "step": 370, "loss": 1.3334954977035522, "percent_done": 74.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13773012161255, "wps": 5522.791219683612, "avg_wps": 4708.588900724632, "eta_in_seconds": 1809.3913441219845, "at": "2024-05-26T01:17:27.162559"}
{"lr": 1.0272712313427651e-05, "step": 371, "loss": 1.3419601917266846, "percent_done": 74.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5529.395736000402, "avg_wps": 4710.47365162892, "eta_in_seconds": 1794.7545459842424, "at": "2024-05-26T01:17:39.016142"}
{"lr": 1.0123662103009122e-05, "step": 372, "loss": 1.3665707111358643, "percent_done": 74.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13747549057007, "wps": 5522.847256467364, "avg_wps": 4712.336966156755, "eta_in_seconds": 1780.1375538815735, "at": "2024-05-26T01:17:50.907777"}
{"lr": 9.97548135324981e-06, "step": 373, "loss": 1.5524204969406128, "percent_done": 74.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139872074127197, "wps": 5532.042791465737, "avg_wps": 4714.209684888793, "eta_in_seconds": 1765.5285946824274, "at": "2024-05-26T01:18:02.755547"}
{"lr": 9.828176546055728e-06, "step": 374, "loss": 1.3623601198196411, "percent_done": 74.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5514.188711466234, "avg_wps": 4716.039060005281, "eta_in_seconds": 1750.947329938093, "at": "2024-05-26T01:18:14.641646"}
{"lr": 9.681754125016368e-06, "step": 375, "loss": 1.293965458869934, "percent_done": 75.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792896270752, "wps": 5525.246475025507, "avg_wps": 4717.881629896226, "eta_in_seconds": 1736.3725168704987, "at": "2024-05-26T01:18:26.503964"}
{"lr": 9.536220495122747e-06, "step": 376, "loss": 1.1819424629211426, "percent_done": 75.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792896270752, "wps": 5532.530815271963, "avg_wps": 4719.729945333812, "eta_in_seconds": 1721.80698771426, "at": "2024-05-26T01:18:38.350780"}
{"lr": 9.391582022487311e-06, "step": 377, "loss": 1.5811065435409546, "percent_done": 75.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5533.474483046087, "avg_wps": 4721.571715420697, "eta_in_seconds": 1707.2552289469488, "at": "2024-05-26T01:18:50.195408"}
{"lr": 9.247845034065422e-06, "step": 378, "loss": 1.3237336874008179, "percent_done": 75.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841676712036, "wps": 5511.9933881242905, "avg_wps": 4723.3635987550615, "eta_in_seconds": 1692.7326962733393, "at": "2024-05-26T01:19:02.086237"}
{"lr": 9.105015817378586e-06, "step": 379, "loss": 1.3288097381591797, "percent_done": 75.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5528.435557153815, "avg_wps": 4725.1791625702135, "eta_in_seconds": 1678.2127676374994, "at": "2024-05-26T01:19:13.941709"}
{"lr": 8.963100620239454e-06, "step": 380, "loss": 1.3023933172225952, "percent_done": 76.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137242794036865, "wps": 5520.170523800052, "avg_wps": 4726.970631263569, "eta_in_seconds": 1663.7124732670031, "at": "2024-05-26T01:19:25.815220"}
{"lr": 8.82210565047849e-06, "step": 381, "loss": 1.1715354919433594, "percent_done": 76.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1399564743042, "wps": 5506.105486671179, "avg_wps": 4728.726885406522, "eta_in_seconds": 1649.235447297259, "at": "2024-05-26T01:19:37.718827"}
{"lr": 8.682037075672413e-06, "step": 382, "loss": 1.1838302612304688, "percent_done": 76.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5528.568988047758, "avg_wps": 4730.518468300828, "eta_in_seconds": 1634.756962015991, "at": "2024-05-26T01:19:49.574183"}
{"lr": 8.542901022874465e-06, "step": 383, "loss": 1.512841820716858, "percent_done": 76.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5525.2364795099165, "avg_wps": 4732.295664116231, "eta_in_seconds": 1620.294365405414, "at": "2024-05-26T01:20:01.436485"}
{"lr": 8.404703578346311e-06, "step": 384, "loss": 1.6261485815048218, "percent_done": 76.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1397123336792, "wps": 5530.608502228467, "avg_wps": 4734.075189238517, "eta_in_seconds": 1605.8418373415868, "at": "2024-05-26T01:20:13.287311"}
{"lr": 8.267450787291907e-06, "step": 385, "loss": 1.2234678268432617, "percent_done": 77.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792896270752, "wps": 5536.221114101282, "avg_wps": 4735.857477097785, "eta_in_seconds": 1591.3992421534156, "at": "2024-05-26T01:20:25.126278"}
{"lr": 8.13114865359295e-06, "step": 386, "loss": 1.6184728145599365, "percent_done": 77.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139348030090332, "wps": 5526.538199892597, "avg_wps": 4737.613460043199, "eta_in_seconds": 1576.9762693835046, "at": "2024-05-26T01:20:36.985919"}
{"lr": 7.995803139546319e-06, "step": 387, "loss": 1.0855679512023926, "percent_done": 77.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5536.265269688946, "avg_wps": 4739.380112679149, "eta_in_seconds": 1562.5604665445726, "at": "2024-05-26T01:20:48.824605"}
{"lr": 7.861420165603275e-06, "step": 388, "loss": 1.6422431468963623, "percent_done": 77.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.14134693145752, "wps": 5526.940126363365, "avg_wps": 4741.121311001862, "eta_in_seconds": 1548.1637187741467, "at": "2024-05-26T01:21:00.683489"}
{"lr": 7.728005610110419e-06, "step": 389, "loss": 1.691611886024475, "percent_done": 77.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5528.500603910024, "avg_wps": 4742.857780377795, "eta_in_seconds": 1533.7790709424446, "at": "2024-05-26T01:21:12.538764"}
{"lr": 7.59556530905263e-06, "step": 390, "loss": 1.298542857170105, "percent_done": 78.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.140429973602295, "wps": 5532.2326239417325, "avg_wps": 4744.59365064626, "eta_in_seconds": 1519.4051442146301, "at": "2024-05-26T01:21:24.386260"}
{"lr": 7.464105055797707e-06, "step": 391, "loss": 1.1656980514526367, "percent_done": 78.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5535.855631003735, "avg_wps": 4746.328719039921, "eta_in_seconds": 1505.0419856812948, "at": "2024-05-26T01:21:36.225912"}
{"lr": 7.333630600843008e-06, "step": 392, "loss": 1.1147528886795044, "percent_done": 78.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1370267868042, "wps": 5524.541213566124, "avg_wps": 4748.034918572801, "eta_in_seconds": 1490.6983881507601, "at": "2024-05-26T01:21:48.089824"}
{"lr": 7.204147651563878e-06, "step": 393, "loss": 1.438295841217041, "percent_done": 78.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5526.148330405151, "avg_wps": 4749.736674789495, "eta_in_seconds": 1476.366476739636, "at": "2024-05-26T01:21:59.950307"}
{"lr": 7.07566187196397e-06, "step": 394, "loss": 1.6418980360031128, "percent_done": 78.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139430046081543, "wps": 5526.016904899557, "avg_wps": 4751.430757068726, "eta_in_seconds": 1462.0471927671867, "at": "2024-05-26T01:22:11.811073"}
{"lr": 6.948178882427538e-06, "step": 395, "loss": 1.5248198509216309, "percent_done": 79.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5539.695165392135, "avg_wps": 4753.143017563693, "eta_in_seconds": 1447.732579173921, "at": "2024-05-26T01:22:23.642574"}
{"lr": 6.821704259473511e-06, "step": 396, "loss": 1.4680887460708618, "percent_done": 79.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1380033493042, "wps": 5518.337770856426, "avg_wps": 4754.807968729612, "eta_in_seconds": 1433.4425374955842, "at": "2024-05-26T01:22:35.519833"}
{"lr": 6.696243535511637e-06, "step": 397, "loss": 1.472925066947937, "percent_done": 79.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137734413146973, "wps": 5517.009791321851, "avg_wps": 4756.463204499338, "eta_in_seconds": 1419.165398696808, "at": "2024-05-26T01:22:47.399807"}
{"lr": 6.571802198600406e-06, "step": 398, "loss": 1.1985504627227783, "percent_done": 79.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5527.859543194786, "avg_wps": 4758.131503702449, "eta_in_seconds": 1404.8943361061902, "at": "2024-05-26T01:22:59.256654"}
{"lr": 6.4483856922070286e-06, "step": 399, "loss": 1.4447048902511597, "percent_done": 79.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1397123336792, "wps": 5535.095050174162, "avg_wps": 4759.806029795003, "eta_in_seconds": 1390.6314582077782, "at": "2024-05-26T01:23:11.097976"}
{"lr": 6.325999414969323e-06, "step": 400, "loss": 1.5511690378189087, "percent_done": 80.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13890552520752, "wps": 5517.873403748047, "avg_wps": 4761.441394141816, "eta_in_seconds": 1376.389932692051, "at": "2024-05-26T01:23:22.976216"}
{"lr": 6.2046487204595115e-06, "step": 401, "loss": 1.290692687034607, "percent_done": 80.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841962814331, "wps": 5598.55335408203, "avg_wps": 4763.2174792128435, "eta_in_seconds": 1362.1179440818225, "at": "2024-05-26T01:23:50.044411"}
{"lr": 6.084338916950114e-06, "step": 402, "loss": 1.6321139335632324, "percent_done": 80.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5559.21089959873, "avg_wps": 4764.914649424374, "eta_in_seconds": 1347.8789175742893, "at": "2024-05-26T01:24:01.834274"}
{"lr": 5.965075267181666e-06, "step": 403, "loss": 1.2665281295776367, "percent_done": 80.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13898754119873, "wps": 5541.611847253161, "avg_wps": 4766.572390819128, "eta_in_seconds": 1333.6610626630097, "at": "2024-05-26T01:24:13.661546"}
{"lr": 5.846862988132589e-06, "step": 404, "loss": 1.478092908859253, "percent_done": 80.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.14134693145752, "wps": 5536.284560103616, "avg_wps": 4768.213298916344, "eta_in_seconds": 1319.4577519067443, "at": "2024-05-26T01:24:25.500261"}
{"lr": 5.7297072507909045e-06, "step": 405, "loss": 1.8101279735565186, "percent_done": 81.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792848587036, "wps": 5522.525920368058, "avg_wps": 4769.821945925478, "eta_in_seconds": 1305.2730417575365, "at": "2024-05-26T01:24:37.368321"}
{"lr": 5.613613179928103e-06, "step": 406, "loss": 1.4218931198120117, "percent_done": 81.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137152671813965, "wps": 5537.558917220902, "avg_wps": 4771.451311582195, "eta_in_seconds": 1291.092289896434, "at": "2024-05-26T01:24:49.204305"}
{"lr": 5.498585853874947e-06, "step": 407, "loss": 1.4505722522735596, "percent_done": 81.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139375686645508, "wps": 5534.44844776445, "avg_wps": 4773.068094762466, "eta_in_seconds": 1276.9245858210018, "at": "2024-05-26T01:25:01.046787"}
{"lr": 5.384630304299297e-06, "step": 408, "loss": 1.7245798110961914, "percent_done": 81.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792848587036, "wps": 5529.601516113697, "avg_wps": 4774.669190890225, "eta_in_seconds": 1262.7706253458473, "at": "2024-05-26T01:25:12.899780"}
{"lr": 5.271751515986073e-06, "step": 409, "loss": 1.5155235528945923, "percent_done": 81.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13807201385498, "wps": 5527.431251628049, "avg_wps": 4776.2595638576395, "eta_in_seconds": 1248.6289575064968, "at": "2024-05-26T01:25:24.757450"}
{"lr": 5.159954426619136e-06, "step": 410, "loss": 1.1947604417800903, "percent_done": 82.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1372709274292, "wps": 5534.080078998145, "avg_wps": 4777.855332981898, "eta_in_seconds": 1234.495309911123, "at": "2024-05-26T01:25:36.600760"}
{"lr": 5.049243926565364e-06, "step": 411, "loss": 1.4178783893585205, "percent_done": 82.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13890552520752, "wps": 5524.907980357002, "avg_wps": 4779.427722849318, "eta_in_seconds": 1220.3770698561286, "at": "2024-05-26T01:25:48.463751"}
{"lr": 4.939624858660665e-06, "step": 412, "loss": 1.444692611694336, "percent_done": 82.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5532.407882614163, "avg_wps": 4781.007120603711, "eta_in_seconds": 1206.2663481814188, "at": "2024-05-26T01:26:00.310831"}
{"lr": 4.831102017998196e-06, "step": 413, "loss": 1.3638207912445068, "percent_done": 82.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139493942260742, "wps": 5535.21029990303, "avg_wps": 4782.584974826806, "eta_in_seconds": 1192.165331094086, "at": "2024-05-26T01:26:12.151762"}
{"lr": 4.7236801517185786e-06, "step": 414, "loss": 1.175404667854309, "percent_done": 82.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.14134693145752, "wps": 5531.479605673014, "avg_wps": 4784.149504495401, "eta_in_seconds": 1178.0768963645623, "at": "2024-05-26T01:26:24.000761"}
{"lr": 4.617363958802224e-06, "step": 415, "loss": 1.4109824895858765, "percent_done": 83.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5522.800096722068, "avg_wps": 4785.691831132305, "eta_in_seconds": 1164.0030734452857, "at": "2024-05-26T01:26:35.868225"}
{"lr": 4.512158089863847e-06, "step": 416, "loss": 1.238850474357605, "percent_done": 83.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5528.04275175627, "avg_wps": 4787.237190444588, "eta_in_seconds": 1149.937590514238, "at": "2024-05-26T01:26:47.724487"}
{"lr": 4.408067146948968e-06, "step": 417, "loss": 1.3194738626480103, "percent_done": 83.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13749408721924, "wps": 5522.282280213682, "avg_wps": 4788.7657519447175, "eta_in_seconds": 1135.8851699503205, "at": "2024-05-26T01:26:59.593137"}
{"lr": 4.305095683332627e-06, "step": 418, "loss": 1.1203041076660156, "percent_done": 83.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5534.156177782416, "avg_wps": 4790.309298286976, "eta_in_seconds": 1121.8382082179403, "at": "2024-05-26T01:27:11.436318"}
{"lr": 4.20324820332023e-06, "step": 419, "loss": 1.1515454053878784, "percent_done": 83.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792896270752, "wps": 5529.878175461868, "avg_wps": 4791.838804481042, "eta_in_seconds": 1107.8035419379896, "at": "2024-05-26T01:27:23.288760"}
{"lr": 4.102529162050497e-06, "step": 420, "loss": 1.3843259811401367, "percent_done": 84.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5531.054425724364, "avg_wps": 4793.364101187676, "eta_in_seconds": 1093.7787927900042, "at": "2024-05-26T01:27:35.138532"}
{"lr": 4.002942965300582e-06, "step": 421, "loss": 1.2896846532821655, "percent_done": 84.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13866138458252, "wps": 5533.5867689741135, "avg_wps": 4794.887634639773, "eta_in_seconds": 1079.7633635035038, "at": "2024-05-26T01:27:46.982964"}
{"lr": 3.90449396929334e-06, "step": 422, "loss": 1.2825158834457397, "percent_done": 84.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5528.319032774927, "avg_wps": 4796.395522130321, "eta_in_seconds": 1065.7603144724787, "at": "2024-05-26T01:27:58.838668"}
{"lr": 3.8071864805067762e-06, "step": 423, "loss": 1.3010966777801514, "percent_done": 84.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139546394348145, "wps": 5529.526098704965, "avg_wps": 4797.899370981466, "eta_in_seconds": 1051.7669525377576, "at": "2024-05-26T01:28:10.691912"}
{"lr": 3.711024755485704e-06, "step": 424, "loss": 1.4910497665405273, "percent_done": 84.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817262649536, "wps": 5536.696381195103, "avg_wps": 4799.409786353237, "eta_in_seconds": 1037.7809400985825, "at": "2024-05-26T01:28:22.529706"}
{"lr": 3.6160130006554755e-06, "step": 425, "loss": 1.4145011901855469, "percent_done": 85.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5539.8051360317895, "avg_wps": 4800.919535145401, "eta_in_seconds": 1023.8038700748892, "at": "2024-05-26T01:28:34.360845"}
{"lr": 3.522155372138053e-06, "step": 426, "loss": 1.562549352645874, "percent_done": 85.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1397123336792, "wps": 5533.877530500427, "avg_wps": 4802.412671329722, "eta_in_seconds": 1009.8390812918614, "at": "2024-05-26T01:28:46.204751"}
{"lr": 3.4294559755701608e-06, "step": 427, "loss": 1.6161084175109863, "percent_done": 85.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1399564743042, "wps": 5522.926153747918, "avg_wps": 4803.880370958066, "eta_in_seconds": 995.888246702087, "at": "2024-05-26T01:28:58.072083"}
{"lr": 3.337918865923721e-06, "step": 428, "loss": 1.4051026105880737, "percent_done": 85.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13795518875122, "wps": 5522.344741464484, "avg_wps": 4805.3410747971175, "eta_in_seconds": 981.9473636841105, "at": "2024-05-26T01:29:09.940752"}
{"lr": 3.2475480473284393e-06, "step": 429, "loss": 1.441631555557251, "percent_done": 85.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5521.300393126491, "avg_wps": 4806.794006461246, "eta_in_seconds": 968.0165186495213, "at": "2024-05-26T01:29:21.811505"}
{"lr": 3.158347472896674e-06, "step": 430, "loss": 1.296938180923462, "percent_done": 86.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13873529434204, "wps": 5530.113251980821, "avg_wps": 4808.256571451793, "eta_in_seconds": 954.0921811946603, "at": "2024-05-26T01:29:33.663367"}
{"lr": 3.0703210445505373e-06, "step": 431, "loss": 1.2587578296661377, "percent_done": 86.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1370267868042, "wps": 5529.654798974455, "avg_wps": 4809.71242902935, "eta_in_seconds": 940.1776232415175, "at": "2024-05-26T01:29:45.516228"}
{"lr": 2.9834726128511543e-06, "step": 432, "loss": 0.9100736379623413, "percent_done": 86.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5535.013352838121, "avg_wps": 4811.171803270384, "eta_in_seconds": 926.2708093214918, "at": "2024-05-26T01:29:57.357596"}
{"lr": 2.897805976830286e-06, "step": 433, "loss": 1.4476325511932373, "percent_done": 86.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137044429779053, "wps": 5540.317533962669, "avg_wps": 4812.634568642638, "eta_in_seconds": 912.3717866736802, "at": "2024-05-26T01:30:09.187761"}
{"lr": 2.8133248838241186e-06, "step": 434, "loss": 1.1574301719665527, "percent_done": 86.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1382474899292, "wps": 5536.409226256145, "avg_wps": 4814.084672754298, "eta_in_seconds": 898.4835735191398, "at": "2024-05-26T01:30:21.026124"}
{"lr": 2.7300330293093305e-06, "step": 435, "loss": 1.352285385131836, "percent_done": 87.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139604568481445, "wps": 5525.974467905801, "avg_wps": 4815.510795797779, "eta_in_seconds": 884.6081299864012, "at": "2024-05-26T01:30:32.886969"}
{"lr": 2.6479340567414757e-06, "step": 436, "loss": 1.0167021751403809, "percent_done": 87.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13966131210327, "wps": 5527.076819131005, "avg_wps": 4816.93313713064, "eta_in_seconds": 870.7415861077264, "at": "2024-05-26T01:30:44.745338"}
{"lr": 2.5670315573955692e-06, "step": 437, "loss": 1.5493172407150269, "percent_done": 87.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1399564743042, "wps": 5508.993597610047, "avg_wps": 4818.318252074068, "eta_in_seconds": 856.8898491133814, "at": "2024-05-26T01:30:56.642640"}
{"lr": 2.48732907020903e-06, "step": 438, "loss": 1.7014528512954712, "percent_done": 87.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1406888961792, "wps": 5533.007342301095, "avg_wps": 4819.739616271812, "eta_in_seconds": 843.0397331594877, "at": "2024-05-26T01:31:08.488447"}
{"lr": 2.4088300816268335e-06, "step": 439, "loss": 1.4381757974624634, "percent_done": 87.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5526.920789883583, "avg_wps": 4821.144799977807, "eta_in_seconds": 829.200566641019, "at": "2024-05-26T01:31:20.347121"}
{"lr": 2.3315380254490547e-06, "step": 440, "loss": 1.1990140676498413, "percent_done": 88.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1370267868042, "wps": 5531.856757145654, "avg_wps": 4822.5529438318035, "eta_in_seconds": 815.368964487856, "at": "2024-05-26T01:31:32.195255"}
{"lr": 2.2554562826806213e-06, "step": 441, "loss": 1.2472739219665527, "percent_done": 88.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.137741088867188, "wps": 5522.19951845925, "avg_wps": 4823.938837216493, "eta_in_seconds": 801.5491345307184, "at": "2024-05-26T01:31:44.064138"}
{"lr": 2.1805881813834265e-06, "step": 442, "loss": 1.6326481103897095, "percent_done": 88.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.14134645462036, "wps": 5529.34334794191, "avg_wps": 4825.331575668181, "eta_in_seconds": 787.736125568459, "at": "2024-05-26T01:31:55.917841"}
{"lr": 2.106936996530766e-06, "step": 443, "loss": 1.249131441116333, "percent_done": 88.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13866090774536, "wps": 5528.971321179561, "avg_wps": 4826.718185394002, "eta_in_seconds": 773.9320707192002, "at": "2024-05-26T01:32:07.772114"}
{"lr": 2.034505949864056e-06, "step": 444, "loss": 1.2009150981903076, "percent_done": 88.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139052867889404, "wps": 5528.53562972045, "avg_wps": 4828.098592562468, "eta_in_seconds": 760.1369213241715, "at": "2024-05-26T01:32:19.627373"}
{"lr": 1.9632982097519294e-06, "step": 445, "loss": 1.6638498306274414, "percent_done": 89.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5521.438470694523, "avg_wps": 4829.461394149607, "eta_in_seconds": 746.3523788318206, "at": "2024-05-26T01:32:31.497940"}
{"lr": 1.8933168910516103e-06, "step": 446, "loss": 1.8934630155563354, "percent_done": 89.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5530.25655499734, "avg_wps": 4830.83395961315, "eta_in_seconds": 732.5741330764754, "at": "2024-05-26T01:32:43.349501"}
{"lr": 1.8245650549726923e-06, "step": 447, "loss": 1.3426645994186401, "percent_done": 89.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792896270752, "wps": 5529.773715784365, "avg_wps": 4832.200334250932, "eta_in_seconds": 718.8046355156824, "at": "2024-05-26T01:32:55.202219"}
{"lr": 1.757045708943213e-06, "step": 448, "loss": 1.1059918403625488, "percent_done": 89.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1387357711792, "wps": 5530.425568642956, "avg_wps": 4833.562488571657, "eta_in_seconds": 705.0435383958476, "at": "2024-05-26T01:33:07.053394"}
{"lr": 1.6907618064780943e-06, "step": 449, "loss": 1.1673721075057983, "percent_done": 89.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5534.731944596605, "avg_wps": 4834.926663134462, "eta_in_seconds": 691.2899063153893, "at": "2024-05-26T01:33:18.895326"}
{"lr": 1.625716247049965e-06, "step": 450, "loss": 1.5422428846359253, "percent_done": 90.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.141543865203857, "wps": 5529.564252092678, "avg_wps": 4836.276763342187, "eta_in_seconds": 677.5460049841139, "at": "2024-05-26T01:33:30.748325"}
{"lr": 1.5619118759623072e-06, "step": 451, "loss": 1.575745701789856, "percent_done": 90.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1389799118042, "wps": 5526.203324335761, "avg_wps": 4837.615918344345, "eta_in_seconds": 663.8112769190329, "at": "2024-05-26T01:33:42.608553"}
{"lr": 1.4993514842250177e-06, "step": 452, "loss": 1.3347529172897339, "percent_done": 90.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5530.399420365948, "avg_wps": 4838.956997357865, "eta_in_seconds": 650.0838924002858, "at": "2024-05-26T01:33:54.459897"}
{"lr": 1.4380378084322957e-06, "step": 453, "loss": 1.3280354738235474, "percent_done": 90.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13995599746704, "wps": 5504.600614814582, "avg_wps": 4840.249065640305, "eta_in_seconds": 636.370558256082, "at": "2024-05-26T01:34:06.366570"}
{"lr": 1.37797353064294e-06, "step": 454, "loss": 1.8662519454956055, "percent_done": 90.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13873529434204, "wps": 5521.9309481375085, "avg_wps": 4841.565565280686, "eta_in_seconds": 622.661401431466, "at": "2024-05-26T01:34:18.235992"}
{"lr": 1.319161278263055e-06, "step": 455, "loss": 1.2935104370117188, "percent_done": 91.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1375150680542, "wps": 5524.135750319221, "avg_wps": 4842.880715456137, "eta_in_seconds": 608.9598677472753, "at": "2024-05-26T01:34:30.100636"}
{"lr": 1.261603623931077e-06, "step": 456, "loss": 1.1133410930633545, "percent_done": 91.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5543.254847133117, "avg_wps": 4844.2229380055915, "eta_in_seconds": 595.2624470225552, "at": "2024-05-26T01:34:41.924339"}
{"lr": 1.205303085405276e-06, "step": 457, "loss": 0.9698067307472229, "percent_done": 91.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1380033493042, "wps": 5522.029897897316, "avg_wps": 4845.524401093386, "eta_in_seconds": 581.5775067326276, "at": "2024-05-26T01:34:53.793598"}
{"lr": 1.1502621254535857e-06, "step": 458, "loss": 1.4360275268554688, "percent_done": 91.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792848587036, "wps": 5529.291294548543, "avg_wps": 4846.833074219196, "eta_in_seconds": 567.8990709708768, "at": "2024-05-26T01:35:05.647166"}
{"lr": 1.0964831517459112e-06, "step": 459, "loss": 1.423099160194397, "percent_done": 91.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1389799118042, "wps": 5525.477159361278, "avg_wps": 4848.130354698634, "eta_in_seconds": 554.229322112983, "at": "2024-05-26T01:35:17.508882"}
{"lr": 1.0439685167487763e-06, "step": 460, "loss": 1.366470217704773, "percent_done": 92.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5531.416937610161, "avg_wps": 4849.432620379425, "eta_in_seconds": 540.5663311999776, "at": "2024-05-26T01:35:29.357901"}
{"lr": 9.927205176224375e-07, "step": 461, "loss": 1.4344816207885742, "percent_done": 92.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5532.91033750688, "avg_wps": 4850.732422140273, "eta_in_seconds": 526.9109440739398, "at": "2024-05-26T01:35:41.203876"}
{"lr": 9.427413961204031e-07, "step": 462, "loss": 1.2644466161727905, "percent_done": 92.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5533.860373608077, "avg_wps": 4852.028870609693, "eta_in_seconds": 513.2632279014175, "at": "2024-05-26T01:35:53.047738"}
{"lr": 8.940333384913533e-07, "step": 463, "loss": 1.3797340393066406, "percent_done": 92.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13873529434204, "wps": 5514.641063086767, "avg_wps": 4853.288368017841, "eta_in_seconds": 499.62660697829904, "at": "2024-05-26T01:36:04.932824"}
{"lr": 8.465984753835264e-07, "step": 464, "loss": 1.3376905918121338, "percent_done": 92.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13866090774536, "wps": 5526.422311025146, "avg_wps": 4854.562720465085, "eta_in_seconds": 485.9955748545712, "at": "2024-05-26T01:36:16.792582"}
{"lr": 8.004388817514974e-07, "step": 465, "loss": 1.4441041946411133, "percent_done": 93.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5540.984049895522, "avg_wps": 4855.85637033613, "eta_in_seconds": 472.36982008205945, "at": "2024-05-26T01:36:28.621176"}
{"lr": 7.555565767654276e-07, "step": 466, "loss": 1.4485150575637817, "percent_done": 93.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792896270752, "wps": 5541.514875667664, "avg_wps": 4857.1460284894865, "eta_in_seconds": 458.75170046986426, "at": "2024-05-26T01:36:40.448714"}
{"lr": 7.119535237227388e-07, "step": 467, "loss": 1.4039851427078247, "percent_done": 93.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1380033493042, "wps": 5530.423009438971, "avg_wps": 4858.412551034939, "eta_in_seconds": 445.1429303876848, "at": "2024-05-26T01:36:52.299817"}
{"lr": 6.696316299622224e-07, "step": 468, "loss": 1.4579898118972778, "percent_done": 93.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817262649536, "wps": 5528.233421619218, "avg_wps": 4859.670703555737, "eta_in_seconds": 431.54199696402264, "at": "2024-05-26T01:37:04.155686"}
{"lr": 6.285927467806198e-07, "step": 469, "loss": 1.468167781829834, "percent_done": 93.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.141366481781006, "wps": 5534.032838638812, "avg_wps": 4860.933688865113, "eta_in_seconds": 417.9476886619128, "at": "2024-05-26T01:37:15.999114"}
{"lr": 5.888386693516242e-07, "step": 470, "loss": 1.7039626836776733, "percent_done": 94.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5533.433490906272, "avg_wps": 4862.190967746711, "eta_in_seconds": 404.3609173399337, "at": "2024-05-26T01:37:27.867758"}
{"lr": 5.503711366473705e-07, "step": 471, "loss": 1.2690417766571045, "percent_done": 94.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13718271255493, "wps": 2803.200888024254, "avg_wps": 4854.6202964176155, "eta_in_seconds": 391.4917921392275, "at": "2024-05-26T01:37:51.248014"}
{"lr": 5.131918313623563e-07, "step": 472, "loss": 1.1867066621780396, "percent_done": 94.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5554.745465491234, "avg_wps": 4855.917000218266, "eta_in_seconds": 377.8911377434003, "at": "2024-05-26T01:38:03.047413"}
{"lr": 4.773023798398375e-07, "step": 473, "loss": 1.2774744033813477, "percent_done": 94.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13819980621338, "wps": 5545.210685093927, "avg_wps": 4857.19346991733, "eta_in_seconds": 364.29926272426553, "at": "2024-05-26T01:38:14.867100"}
{"lr": 4.4270435200069295e-07, "step": 474, "loss": 1.5921688079833984, "percent_done": 94.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792896270752, "wps": 5548.378287872638, "avg_wps": 4858.470347732369, "eta_in_seconds": 350.7145002532106, "at": "2024-05-26T01:38:26.680054"}
{"lr": 4.0939926127473865e-07, "step": 475, "loss": 1.4718433618545532, "percent_done": 95.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13961887359619, "wps": 5533.022711914743, "avg_wps": 4859.717646931217, "eta_in_seconds": 337.1389284384878, "at": "2024-05-26T01:38:38.525792"}
{"lr": 3.7738856453453507e-07, "step": 476, "loss": 1.1018459796905518, "percent_done": 95.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1370267868042, "wps": 5536.424503263853, "avg_wps": 4860.965854501864, "eta_in_seconds": 323.5702630051044, "at": "2024-05-26T01:38:50.364255"}
{"lr": 3.4667366203166475e-07, "step": 477, "loss": 1.605708122253418, "percent_done": 95.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1397123336792, "wps": 5531.192991590281, "avg_wps": 4862.200998878406, "eta_in_seconds": 310.0093970503697, "at": "2024-05-26T01:39:02.213912"}
{"lr": 3.172558973354582e-07, "step": 478, "loss": 1.5464510917663574, "percent_done": 95.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13789701461792, "wps": 5523.193933056403, "avg_wps": 4863.4186427379045, "eta_in_seconds": 296.45648584106476, "at": "2024-05-26T01:39:14.080674"}
{"lr": 2.8913655727425123e-07, "step": 479, "loss": 1.4629555940628052, "percent_done": 95.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1370267868042, "wps": 5534.455913700166, "avg_wps": 4864.6500105502755, "eta_in_seconds": 282.9095612254173, "at": "2024-05-26T01:39:25.923283"}
{"lr": 2.623168718790634e-07, "step": 480, "loss": 1.308935523033142, "percent_done": 96.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5533.210829539052, "avg_wps": 4865.874861945717, "eta_in_seconds": 269.3698537647724, "at": "2024-05-26T01:39:37.768538"}
{"lr": 2.3679801432982478e-07, "step": 481, "loss": 1.2836899757385254, "percent_done": 96.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1387357711792, "wps": 5538.883527322008, "avg_wps": 4867.104349124798, "eta_in_seconds": 255.83671741574818, "at": "2024-05-26T01:39:49.601629"}
{"lr": 2.1258110090402713e-07, "step": 482, "loss": 1.5766515731811523, "percent_done": 96.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5526.650426726287, "avg_wps": 4868.309702273784, "eta_in_seconds": 242.3116178186108, "at": "2024-05-26T01:40:01.460946"}
{"lr": 1.896671909279231e-07, "step": 483, "loss": 1.0516997575759888, "percent_done": 96.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.139439582824707, "wps": 5530.952592586363, "avg_wps": 4869.517567317775, "eta_in_seconds": 228.79309594803962, "at": "2024-05-26T01:40:13.311042"}
{"lr": 1.6805728673016362e-07, "step": 484, "loss": 1.6656585931777954, "percent_done": 96.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817262649536, "wps": 5531.944595848905, "avg_wps": 4870.722626175347, "eta_in_seconds": 215.28140287951004, "at": "2024-05-26T01:40:25.159010"}
{"lr": 1.477523335979629e-07, "step": 485, "loss": 1.372025489807129, "percent_done": 97.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5521.838768312022, "avg_wps": 4871.907117821334, "eta_in_seconds": 201.77724579437492, "at": "2024-05-26T01:40:37.028650"}
{"lr": 1.2875321973575205e-07, "step": 486, "loss": 1.479919195175171, "percent_done": 97.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13792896270752, "wps": 5534.706424234692, "avg_wps": 4873.10788058636, "eta_in_seconds": 188.2790249021946, "at": "2024-05-26T01:40:48.870698"}
{"lr": 1.1106077622631656e-07, "step": 487, "loss": 1.4514286518096924, "percent_done": 97.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13841724395752, "wps": 5538.060746146945, "avg_wps": 4874.309639355246, "eta_in_seconds": 174.78741873950685, "at": "2024-05-26T01:41:00.705528"}
{"lr": 9.467577699445256e-08, "step": 488, "loss": 1.652998447418213, "percent_done": 97.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5533.492974264452, "avg_wps": 4875.4998016228965, "eta_in_seconds": 161.3028472974652, "at": "2024-05-26T01:41:12.550138"}
{"lr": 7.959893877311043e-08, "step": 489, "loss": 1.6865766048431396, "percent_done": 97.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13866090774536, "wps": 5527.329329568334, "avg_wps": 4876.67587310956, "eta_in_seconds": 147.82528483696998, "at": "2024-05-26T01:41:24.407965"}
{"lr": 6.58309210720302e-08, "step": 490, "loss": 1.6229629516601562, "percent_done": 98.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.138378620147705, "wps": 5530.420116428623, "avg_wps": 4877.852618073053, "eta_in_seconds": 134.35420282519596, "at": "2024-05-26T01:41:36.259189"}
{"lr": 5.337232614891126e-08, "step": 491, "loss": 1.1492687463760376, "percent_done": 98.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1370267868042, "wps": 5537.087628946555, "avg_wps": 4879.035690602307, "eta_in_seconds": 120.88946205826738, "at": "2024-05-26T01:41:48.096162"}
{"lr": 4.222369898305362e-08, "step": 492, "loss": 1.3562477827072144, "percent_done": 98.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13769817352295, "wps": 5529.093100213343, "avg_wps": 4880.2018837778005, "eta_in_seconds": 107.4316211677179, "at": "2024-05-26T01:41:59.950321"}
{"lr": 3.2385527251530405e-08, "step": 493, "loss": 1.3547463417053223, "percent_done": 98.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.138689517974854, "wps": 5528.314696561733, "avg_wps": 4881.362669363302, "eta_in_seconds": 93.98031473449954, "at": "2024-05-26T01:42:11.806184"}
{"lr": 2.385824130784165e-08, "step": 494, "loss": 1.603198528289795, "percent_done": 98.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1392240524292, "wps": 5534.3604181010805, "avg_wps": 4882.5288400314985, "eta_in_seconds": 80.5353153833011, "at": "2024-05-26T01:42:23.649073"}
{"lr": 1.6642214163099443e-08, "step": 495, "loss": 1.408722162246704, "percent_done": 99.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13817310333252, "wps": 5542.347735327411, "avg_wps": 4883.703399631958, "eta_in_seconds": 67.09662180235892, "at": "2024-05-26T01:42:35.474906"}
{"lr": 1.0737761469707708e-08, "step": 496, "loss": 1.444448471069336, "percent_done": 99.2, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.138458728790283, "wps": 5534.3021417759355, "avg_wps": 4884.861165927321, "eta_in_seconds": 53.66457532682726, "at": "2024-05-26T01:42:47.317871"}
{"lr": 6.145141507556636e-09, "step": 497, "loss": 1.5961229801177979, "percent_done": 99.4, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.1397123336792, "wps": 5531.425731089284, "avg_wps": 4886.010305561376, "eta_in_seconds": 40.23896547582308, "at": "2024-05-26T01:42:59.166964"}
{"lr": 2.864555172718443e-09, "step": 498, "loss": 1.2048214673995972, "percent_done": 99.6, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13988208770752, "wps": 5537.711866112709, "avg_wps": 4887.165210088157, "eta_in_seconds": 26.81963763562551, "at": "2024-05-26T01:43:11.002721"}
{"lr": 8.961459686677561e-10, "step": 499, "loss": 1.4899966716766357, "percent_done": 99.8, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.14134693145752, "wps": 5538.832075409613, "avg_wps": 4888.317777472936, "eta_in_seconds": 13.406657051227853, "at": "2024-05-26T01:43:22.835988"}
{"lr": 2.4e-10, "step": 500, "loss": 1.5752968788146973, "percent_done": 100.0, "peak_allocated_mem": 64.85457944869995, "allocated_mem": 24.13963794708252, "wps": 5520.256994018846, "avg_wps": 4889.437227938565, "eta_in_seconds": 0.0, "at": "2024-05-26T01:43:34.709027"}