CHEMISTral7Bv0.3 / runseed5 /metrics.train.jsonl
Clemspace's picture
Initial model upload
cb9e677
{"lr": 2.3999999999999974e-06, "step": 1, "loss": 2.262953042984009, "percent_done": 0.2, "peak_allocated_mem": 63.57235288619995, "allocated_mem": 24.13692855834961, "wps": 88.16643749820423, "avg_wps": 88.16643749820423, "eta_in_seconds": 370917.37999129295, "at": "2024-05-25T21:59:10.332723"}
{"lr": 2.646387992434257e-06, "step": 2, "loss": 2.1094534397125244, "percent_done": 0.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13880491256714, "wps": 5641.716752178008, "avg_wps": 173.61961874185505, "eta_in_seconds": 187979.49354171753, "at": "2024-05-25T21:59:21.950364"}
{"lr": 3.3813362028748325e-06, "step": 3, "loss": 1.950036644935608, "percent_done": 0.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1414213180542, "wps": 5581.752965709586, "avg_wps": 256.44114573749755, "eta_in_seconds": 127013.12773474057, "at": "2024-05-25T21:59:33.692711"}
{"lr": 4.592269463674938e-06, "step": 4, "loss": 2.1372272968292236, "percent_done": 0.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5568.708412525151, "avg_wps": 336.7523364839041, "eta_in_seconds": 96527.48467731476, "at": "2024-05-25T21:59:45.462542"}
{"lr": 6.258468371008163e-06, "step": 5, "loss": 2.4573512077331543, "percent_done": 1.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5556.700210769298, "avg_wps": 414.65804703405377, "eta_in_seconds": 78233.90919828415, "at": "2024-05-25T21:59:57.257808"}
{"lr": 8.351423799612423e-06, "step": 6, "loss": 2.1645777225494385, "percent_done": 1.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139694690704346, "wps": 5539.8033496717935, "avg_wps": 490.25053920820994, "eta_in_seconds": 66037.22262557347, "at": "2024-05-25T22:00:09.089028"}
{"lr": 1.0835324701827431e-05, "step": 7, "loss": 1.8717948198318481, "percent_done": 1.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.138723373413086, "wps": 5544.172879147123, "avg_wps": 563.6520212491118, "eta_in_seconds": 57321.2669909341, "at": "2024-05-25T22:00:20.910955"}
{"lr": 1.3667670844548846e-05, "step": 8, "loss": 2.1801249980926514, "percent_done": 1.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13971185684204, "wps": 5528.093002828564, "avg_wps": 634.9254699210051, "eta_in_seconds": 50783.45967757702, "at": "2024-05-25T22:00:32.767220"}
{"lr": 1.6799999999999995e-05, "step": 9, "loss": 2.0575146675109863, "percent_done": 1.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5534.476640134749, "avg_wps": 704.1928640175574, "eta_in_seconds": 45695.11797722181, "at": "2024-05-25T22:00:44.609869"}
{"lr": 2.017871714788541e-05, "step": 10, "loss": 1.8830426931381226, "percent_done": 2.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139169692993164, "wps": 5542.375561228271, "avg_wps": 771.5443544496028, "eta_in_seconds": 41621.24940037727, "at": "2024-05-25T22:00:56.435655"}
{"lr": 2.37460115010474e-05, "step": 11, "loss": 2.232516288757324, "percent_done": 2.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5536.732403121099, "avg_wps": 837.0347008453684, "eta_in_seconds": 38286.47004435279, "at": "2024-05-25T22:01:08.273425"}
{"lr": 2.7440845664062507e-05, "step": 12, "loss": 1.8419462442398071, "percent_done": 2.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5539.74138602249, "avg_wps": 900.7559521764189, "eta_in_seconds": 35505.25302966436, "at": "2024-05-25T22:01:20.104820"}
{"lr": 3.12e-05, "step": 13, "loss": 1.7451030015945435, "percent_done": 2.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1411771774292, "wps": 5539.755341678419, "avg_wps": 962.7734871603661, "eta_in_seconds": 33150.09441538957, "at": "2024-05-25T22:01:31.936253"}
{"lr": 3.495915433593748e-05, "step": 14, "loss": 1.5826107263565063, "percent_done": 2.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5539.311251368314, "avg_wps": 1023.153623997986, "eta_in_seconds": 31129.729937859942, "at": "2024-05-25T22:01:43.768550"}
{"lr": 3.86539884989526e-05, "step": 15, "loss": 1.8554575443267822, "percent_done": 3.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.140127182006836, "wps": 5528.257214583447, "avg_wps": 1081.933096932108, "eta_in_seconds": 29377.93481882413, "at": "2024-05-25T22:01:55.624507"}
{"lr": 4.222128285211459e-05, "step": 16, "loss": 1.8528378009796143, "percent_done": 3.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5531.100390981026, "avg_wps": 1139.2060386867545, "eta_in_seconds": 27843.447912693024, "at": "2024-05-25T22:02:07.474357"}
{"lr": 4.56e-05, "step": 17, "loss": 1.729903221130371, "percent_done": 3.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5536.814820374232, "avg_wps": 1195.0388768566274, "eta_in_seconds": 26487.747480869293, "at": "2024-05-25T22:02:19.312027"}
{"lr": 4.873232915545115e-05, "step": 18, "loss": 2.0164880752563477, "percent_done": 3.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5527.944920430914, "avg_wps": 1249.4466271322206, "eta_in_seconds": 25281.873842424815, "at": "2024-05-25T22:02:31.168654"}
{"lr": 5.156467529817257e-05, "step": 19, "loss": 1.915980339050293, "percent_done": 3.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5518.685654291463, "avg_wps": 1302.4778394687057, "eta_in_seconds": 24202.189891275608, "at": "2024-05-25T22:02:43.045117"}
{"lr": 5.404857620038757e-05, "step": 20, "loss": 1.928839087486267, "percent_done": 4.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14018678665161, "wps": 5525.959470694772, "avg_wps": 1354.2296114341582, "eta_in_seconds": 23228.911651611328, "at": "2024-05-25T22:02:54.905990"}
{"lr": 5.6141531628991836e-05, "step": 21, "loss": 1.9956589937210083, "percent_done": 4.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5530.314412356966, "avg_wps": 1404.741861693786, "eta_in_seconds": 22346.984065918696, "at": "2024-05-25T22:03:06.757515"}
{"lr": 5.780773053632506e-05, "step": 22, "loss": 1.6539652347564697, "percent_done": 4.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5546.238248460089, "avg_wps": 1454.0966576327437, "eta_in_seconds": 21543.415175026115, "at": "2024-05-25T22:03:18.575075"}
{"lr": 5.9018663797125166e-05, "step": 23, "loss": 1.766621470451355, "percent_done": 4.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5537.985655685933, "avg_wps": 1502.262606911442, "eta_in_seconds": 20809.059518741527, "at": "2024-05-25T22:03:30.410244"}
{"lr": 5.975361200756574e-05, "step": 24, "loss": 1.3346548080444336, "percent_done": 4.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5539.707781091524, "avg_wps": 1549.311262478215, "eta_in_seconds": 20134.841045498848, "at": "2024-05-25T22:03:42.241800"}
{"lr": 6e-05, "step": 25, "loss": 1.706301212310791, "percent_done": 5.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14044427871704, "wps": 5545.542833733442, "avg_wps": 1595.2953608999255, "eta_in_seconds": 19513.377123117447, "at": "2024-05-25T22:03:54.060805"}
{"lr": 5.9999343854031334e-05, "step": 26, "loss": 1.46425199508667, "percent_done": 5.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5543.427451060901, "avg_wps": 1640.226112090874, "eta_in_seconds": 18938.89127298502, "at": "2024-05-25T22:04:05.884316"}
{"lr": 5.999737544482728e-05, "step": 27, "loss": 2.186837911605835, "percent_done": 5.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139450550079346, "wps": 5539.600493658582, "avg_wps": 1684.132631983322, "eta_in_seconds": 18406.227283592576, "at": "2024-05-25T22:04:17.715992"}
{"lr": 5.999409485849245e-05, "step": 28, "loss": 1.7592682838439941, "percent_done": 5.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5540.458016107884, "avg_wps": 1727.0643725974264, "eta_in_seconds": 17910.73482309069, "at": "2024-05-25T22:04:29.545819"}
{"lr": 5.9989502238530296e-05, "step": 29, "loss": 2.010122537612915, "percent_done": 5.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139456272125244, "wps": 5536.871365159185, "avg_wps": 1769.0381189621935, "eta_in_seconds": 17448.722935438156, "at": "2024-05-25T22:04:41.383339"}
{"lr": 5.99835977858369e-05, "step": 30, "loss": 1.865985631942749, "percent_done": 6.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5533.739832727509, "avg_wps": 1810.0859077694442, "eta_in_seconds": 17016.827691872917, "at": "2024-05-25T22:04:53.227570"}
{"lr": 5.9976381758692166e-05, "step": 31, "loss": 1.4043118953704834, "percent_done": 6.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5532.196994566016, "avg_wps": 1850.242670335246, "eta_in_seconds": 16612.082562354302, "at": "2024-05-25T22:05:05.075097"}
{"lr": 5.9967854472748474e-05, "step": 32, "loss": 1.771388053894043, "percent_done": 6.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13995599746704, "wps": 5528.366398008164, "avg_wps": 1889.5282279310034, "eta_in_seconds": 16232.013656437397, "at": "2024-05-25T22:05:16.930835"}
{"lr": 5.9958016301016944e-05, "step": 33, "loss": 1.6079459190368652, "percent_done": 6.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1399564743042, "wps": 5530.096007165038, "avg_wps": 1927.9898190231859, "eta_in_seconds": 15874.208306507631, "at": "2024-05-25T22:05:28.782877"}
{"lr": 5.994686767385109e-05, "step": 34, "loss": 1.8389538526535034, "percent_done": 6.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5548.02575516183, "avg_wps": 1965.7136464029804, "eta_in_seconds": 15536.228308677673, "at": "2024-05-25T22:05:40.596542"}
{"lr": 5.993440907892797e-05, "step": 35, "loss": 1.840371012687683, "percent_done": 7.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139039993286133, "wps": 5546.35485799353, "avg_wps": 2002.6531319906146, "eta_in_seconds": 15216.933733156748, "at": "2024-05-25T22:05:52.413778"}
{"lr": 5.9920641061226885e-05, "step": 36, "loss": 1.7521817684173584, "percent_done": 7.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14044427871704, "wps": 5540.577621386599, "avg_wps": 2038.8165240629946, "eta_in_seconds": 14914.880098872714, "at": "2024-05-25T22:06:04.243314"}
{"lr": 5.9905564223005546e-05, "step": 37, "loss": 1.7343847751617432, "percent_done": 7.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5543.818420816132, "avg_wps": 2074.2603671670677, "eta_in_seconds": 14628.42779059668, "at": "2024-05-25T22:06:16.065952"}
{"lr": 5.988917922377368e-05, "step": 38, "loss": 1.3425891399383545, "percent_done": 7.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5548.527579044411, "avg_wps": 2109.012464386962, "eta_in_seconds": 14356.307756009855, "at": "2024-05-25T22:06:27.878578"}
{"lr": 5.9871486780264246e-05, "step": 39, "loss": 1.4163566827774048, "percent_done": 7.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5535.693754583073, "avg_wps": 2143.0270116881056, "eta_in_seconds": 14097.86056602307, "at": "2024-05-25T22:06:39.718619"}
{"lr": 5.985248766640204e-05, "step": 40, "loss": 1.7220834493637085, "percent_done": 8.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5536.443348739875, "avg_wps": 2176.3758096566335, "eta_in_seconds": 13851.725362062454, "at": "2024-05-25T22:06:51.557025"}
{"lr": 5.983218271326983e-05, "step": 41, "loss": 1.53286612033844, "percent_done": 8.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5537.267880265823, "avg_wps": 2209.078717214353, "eta_in_seconds": 13616.999596072406, "at": "2024-05-25T22:07:03.393696"}
{"lr": 5.981057280907208e-05, "step": 42, "loss": 1.1175395250320435, "percent_done": 8.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1409330368042, "wps": 5529.745793791417, "avg_wps": 2241.1219532407085, "eta_in_seconds": 13393.063218446006, "at": "2024-05-25T22:07:15.246432"}
{"lr": 5.978765889909597e-05, "step": 43, "loss": 1.2107163667678833, "percent_done": 8.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1384916305542, "wps": 5545.109448641502, "avg_wps": 2272.6128681348164, "eta_in_seconds": 13178.642266766969, "at": "2024-05-25T22:07:27.066384"}
{"lr": 5.976344198567018e-05, "step": 44, "loss": 1.7663185596466064, "percent_done": 8.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5540.493975321999, "avg_wps": 2303.4910422531702, "eta_in_seconds": 12973.532543355768, "at": "2024-05-25T22:07:38.896115"}
{"lr": 5.9737923128120935e-05, "step": 45, "loss": 1.2885420322418213, "percent_done": 9.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5531.567432399225, "avg_wps": 2333.7558908646724, "eta_in_seconds": 12777.20609800021, "at": "2024-05-25T22:07:50.744945"}
{"lr": 5.971110344272575e-05, "step": 46, "loss": 1.4329020977020264, "percent_done": 9.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13971185684204, "wps": 5526.3755346328535, "avg_wps": 2363.4378901504992, "eta_in_seconds": 12589.010324322659, "at": "2024-05-25T22:08:02.604890"}
{"lr": 5.968298410266454e-05, "step": 47, "loss": 1.9799071550369263, "percent_done": 9.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13873529434204, "wps": 5539.442863470415, "avg_wps": 2392.6250525446417, "eta_in_seconds": 12408.04862777223, "at": "2024-05-25T22:08:14.436901"}
{"lr": 5.9653566337968336e-05, "step": 48, "loss": 1.4268672466278076, "percent_done": 9.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13966703414917, "wps": 5538.246974814324, "avg_wps": 2421.2758848761755, "eta_in_seconds": 12234.158108552298, "at": "2024-05-25T22:08:26.271483"}
{"lr": 5.9622851435465466e-05, "step": 49, "loss": 1.9112210273742676, "percent_done": 9.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13922357559204, "wps": 5520.597025623152, "avg_wps": 2449.338834708171, "eta_in_seconds": 12067.230381182262, "at": "2024-05-25T22:08:38.143905"}
{"lr": 5.9590840738725265e-05, "step": 50, "loss": 1.664664387702942, "percent_done": 10.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13933753967285, "wps": 5540.159639641797, "avg_wps": 2476.976633654808, "eta_in_seconds": 11906.127655506134, "at": "2024-05-25T22:08:49.974438"}
{"lr": 5.955753564799931e-05, "step": 51, "loss": 1.698335886001587, "percent_done": 10.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13935899734497, "wps": 5542.056753488515, "avg_wps": 2504.1321414867934, "eta_in_seconds": 11750.843141420215, "at": "2024-05-25T22:09:01.800838"}
{"lr": 5.9522937620160167e-05, "step": 52, "loss": 1.842172384262085, "percent_done": 10.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13971185684204, "wps": 5536.226912269592, "avg_wps": 2530.7872951936006, "eta_in_seconds": 11601.183574676514, "at": "2024-05-25T22:09:13.639853"}
{"lr": 5.9487048168637646e-05, "step": 53, "loss": 1.6874887943267822, "percent_done": 10.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14142084121704, "wps": 5519.104502091987, "avg_wps": 2556.9087546851515, "eta_in_seconds": 11457.034572048007, "at": "2024-05-25T22:09:25.515428"}
{"lr": 5.944986886335264e-05, "step": 54, "loss": 1.5346497297286987, "percent_done": 10.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13853931427002, "wps": 5529.741010370717, "avg_wps": 2582.6205532103518, "eta_in_seconds": 11317.59598353174, "at": "2024-05-25T22:09:37.368175"}
{"lr": 5.941140133064838e-05, "step": 55, "loss": 1.6654815673828125, "percent_done": 11.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5533.699839270242, "avg_wps": 2607.9074046690016, "eta_in_seconds": 11182.72832378474, "at": "2024-05-25T22:09:49.212434"}
{"lr": 5.937164725321938e-05, "step": 56, "loss": 1.5459319353103638, "percent_done": 11.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5534.284759400332, "avg_wps": 2632.76695202972, "eta_in_seconds": 11052.244475177356, "at": "2024-05-25T22:10:01.055467"}
{"lr": 5.933060837003778e-05, "step": 57, "loss": 1.263810634613037, "percent_done": 11.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14113140106201, "wps": 5524.281408249896, "avg_wps": 2657.167163803352, "eta_in_seconds": 10926.09015928235, "at": "2024-05-25T22:10:12.919993"}
{"lr": 5.928828647627726e-05, "step": 58, "loss": 1.76726496219635, "percent_done": 11.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5539.613667125813, "avg_wps": 2681.221114413725, "eta_in_seconds": 10803.626692434837, "at": "2024-05-25T22:10:24.751609"}
{"lr": 5.924468342323457e-05, "step": 59, "loss": 1.5752986669540405, "percent_done": 11.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1384916305542, "wps": 5525.510591862112, "avg_wps": 2704.819793975247, "eta_in_seconds": 10685.139196472654, "at": "2024-05-25T22:10:36.613443"}
{"lr": 5.919980111824851e-05, "step": 60, "loss": 1.4939701557159424, "percent_done": 12.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1409330368042, "wps": 5526.555978097075, "avg_wps": 2728.0343519292246, "eta_in_seconds": 10570.189477125803, "at": "2024-05-25T22:10:48.473005"}
{"lr": 5.915364152461648e-05, "step": 61, "loss": 1.3114984035491943, "percent_done": 12.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5532.251886264102, "avg_wps": 2750.893163305559, "eta_in_seconds": 10458.531935652749, "at": "2024-05-25T22:11:00.320352"}
{"lr": 5.9106206661508645e-05, "step": 62, "loss": 1.5468474626541138, "percent_done": 12.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139453887939453, "wps": 5532.953660697286, "avg_wps": 2773.3851612342896, "eta_in_seconds": 10350.083501285122, "at": "2024-05-25T22:11:12.166197"}
{"lr": 5.90574986038796e-05, "step": 63, "loss": 1.3879033327102661, "percent_done": 12.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5537.726146236248, "avg_wps": 2795.535717326603, "eta_in_seconds": 10244.631046026472, "at": "2024-05-25T22:11:24.001887"}
{"lr": 5.9007519482377565e-05, "step": 64, "loss": 1.4439136981964111, "percent_done": 12.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5534.993736920034, "avg_wps": 2817.323056344394, "eta_in_seconds": 10142.143953159451, "at": "2024-05-25T22:11:35.843333"}
{"lr": 5.8956271483251227e-05, "step": 65, "loss": 1.567832112312317, "percent_done": 13.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5533.965544802702, "avg_wps": 2838.7624119314255, "eta_in_seconds": 10042.46071463365, "at": "2024-05-25T22:11:47.687056"}
{"lr": 5.8903756848254094e-05, "step": 66, "loss": 1.8967957496643066, "percent_done": 13.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5537.435314807347, "avg_wps": 2859.880056007073, "eta_in_seconds": 9945.390520926678, "at": "2024-05-25T22:11:59.523357"}
{"lr": 5.884997787454641e-05, "step": 67, "loss": 1.7465324401855469, "percent_done": 13.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1411771774292, "wps": 5538.385678118816, "avg_wps": 2880.6736048710677, "eta_in_seconds": 9850.85153417445, "at": "2024-05-25T22:12:11.357630"}
{"lr": 5.879493691459472e-05, "step": 68, "loss": 1.7675424814224243, "percent_done": 13.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5532.369133234906, "avg_wps": 2901.122491159192, "eta_in_seconds": 9758.82682867611, "at": "2024-05-25T22:12:23.204732"}
{"lr": 5.873863637606892e-05, "step": 69, "loss": 1.8643747568130493, "percent_done": 13.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139580726623535, "wps": 5531.476934181323, "avg_wps": 2921.2547968484523, "eta_in_seconds": 9669.138080824976, "at": "2024-05-25T22:12:35.053733"}
{"lr": 5.868107872173695e-05, "step": 70, "loss": 2.0621795654296875, "percent_done": 14.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13907241821289, "wps": 5528.966761520842, "avg_wps": 2941.0711223561316, "eta_in_seconds": 9581.706401382175, "at": "2024-05-25T22:12:46.908150"}
{"lr": 5.862226646935706e-05, "step": 71, "loss": 1.7251265048980713, "percent_done": 14.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.141066551208496, "wps": 5535.076659704005, "avg_wps": 2960.6131930519027, "eta_in_seconds": 9496.324635038913, "at": "2024-05-25T22:12:58.749481"}
{"lr": 5.856220219156771e-05, "step": 72, "loss": 1.6062341928482056, "percent_done": 14.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5538.399515354115, "avg_wps": 2979.8763909947434, "eta_in_seconds": 9412.943464623559, "at": "2024-05-25T22:13:10.583721"}
{"lr": 5.8500888515774985e-05, "step": 73, "loss": 1.569394826889038, "percent_done": 14.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1384916305542, "wps": 5535.043891532772, "avg_wps": 2998.840340494905, "eta_in_seconds": 9331.56447914855, "at": "2024-05-25T22:13:22.425119"}
{"lr": 5.84383281240377e-05, "step": 74, "loss": 1.465248703956604, "percent_done": 14.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5533.697054232073, "avg_wps": 3017.5194597715245, "eta_in_seconds": 9252.081510060543, "at": "2024-05-25T22:13:34.269418"}
{"lr": 5.8374523752950034e-05, "step": 75, "loss": 1.4536652565002441, "percent_done": 15.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5547.902132953314, "avg_wps": 3035.982166299971, "eta_in_seconds": 9174.230438232422, "at": "2024-05-25T22:13:46.083424"}
{"lr": 5.830947819352191e-05, "step": 76, "loss": 1.9199892282485962, "percent_done": 15.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5523.671294926767, "avg_wps": 3054.0803565473693, "eta_in_seconds": 9098.406314172244, "at": "2024-05-25T22:13:57.949194"}
{"lr": 5.8243194291056786e-05, "step": 77, "loss": 1.7800021171569824, "percent_done": 15.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13897943496704, "wps": 5538.398064672976, "avg_wps": 3071.976113690907, "eta_in_seconds": 9024.07016657854, "at": "2024-05-25T22:14:09.783429"}
{"lr": 5.817567494502731e-05, "step": 78, "loss": 1.5275590419769287, "percent_done": 15.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13873529434204, "wps": 5535.078220102789, "avg_wps": 3089.602637728104, "eta_in_seconds": 8951.37506107795, "at": "2024-05-25T22:14:21.638665"}
{"lr": 5.810692310894839e-05, "step": 79, "loss": 1.35567307472229, "percent_done": 15.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14020013809204, "wps": 5519.279262417243, "avg_wps": 3106.915483279532, "eta_in_seconds": 8880.401204501526, "at": "2024-05-25T22:14:33.513860"}
{"lr": 5.8036941790248074e-05, "step": 80, "loss": 1.568904995918274, "percent_done": 16.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14093255996704, "wps": 5518.295230159511, "avg_wps": 3123.9794050907803, "eta_in_seconds": 8810.91596031189, "at": "2024-05-25T22:14:45.391215"}
{"lr": 5.796573405013595e-05, "step": 81, "loss": 1.6607871055603027, "percent_done": 16.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1388578414917, "wps": 5535.235156131349, "avg_wps": 3140.8710634908134, "eta_in_seconds": 8742.665154003804, "at": "2024-05-25T22:14:57.232186"}
{"lr": 5.7893303003469235e-05, "step": 82, "loss": 1.8185405731201172, "percent_done": 16.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14020013809204, "wps": 5531.238180032508, "avg_wps": 3157.511832033713, "eta_in_seconds": 8675.833839189714, "at": "2024-05-25T22:15:09.081719"}
{"lr": 5.7819651818616575e-05, "step": 83, "loss": 1.7938737869262695, "percent_done": 16.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5538.24318093579, "avg_wps": 3173.9502642027755, "eta_in_seconds": 8610.252122795726, "at": "2024-05-25T22:15:20.916268"}
{"lr": 5.774478371731938e-05, "step": 84, "loss": 1.3827170133590698, "percent_done": 16.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5526.76199138343, "avg_wps": 3190.1178006375894, "eta_in_seconds": 8546.071870622181, "at": "2024-05-25T22:15:32.775405"}
{"lr": 5.766870197455095e-05, "step": 85, "loss": 1.6816377639770508, "percent_done": 17.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5531.788180325271, "avg_wps": 3206.084541058031, "eta_in_seconds": 8483.070128595127, "at": "2024-05-25T22:15:44.623825"}
{"lr": 5.759140991837317e-05, "step": 86, "loss": 1.3680201768875122, "percent_done": 17.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5525.592675365883, "avg_wps": 3221.81055226947, "eta_in_seconds": 8421.321974033533, "at": "2024-05-25T22:15:56.485525"}
{"lr": 5.751291092979098e-05, "step": 87, "loss": 1.7220127582550049, "percent_done": 17.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13897943496704, "wps": 5535.422086578825, "avg_wps": 3237.3634711881114, "eta_in_seconds": 8360.620684357895, "at": "2024-05-25T22:16:08.326192"}
{"lr": 5.743320844260443e-05, "step": 88, "loss": 1.316036343574524, "percent_done": 17.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5536.561107992587, "avg_wps": 3252.713150271047, "eta_in_seconds": 8301.018489057367, "at": "2024-05-25T22:16:20.164363"}
{"lr": 5.735230594325853e-05, "step": 89, "loss": 1.5626420974731445, "percent_done": 17.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5528.980774154521, "avg_wps": 3267.8295242257354, "eta_in_seconds": 8242.564613703931, "at": "2024-05-25T22:16:32.018795"}
{"lr": 5.727020697069067e-05, "step": 90, "loss": 1.6677188873291016, "percent_done": 18.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14020013809204, "wps": 5529.578712697917, "avg_wps": 3282.748793053368, "eta_in_seconds": 8185.140470345815, "at": "2024-05-25T22:16:43.871913"}
{"lr": 5.718691511617588e-05, "step": 91, "loss": 1.5478179454803467, "percent_done": 18.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13849115371704, "wps": 5531.183419749006, "avg_wps": 3297.4787956632053, "eta_in_seconds": 8128.702460574579, "at": "2024-05-25T22:16:55.721611"}
{"lr": 5.7102434023169716e-05, "step": 92, "loss": 1.4003026485443115, "percent_done": 18.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13897943496704, "wps": 5498.951573208651, "avg_wps": 3311.890707400976, "eta_in_seconds": 8073.541780907175, "at": "2024-05-25T22:17:07.640749"}
{"lr": 5.701676738714885e-05, "step": 93, "loss": 1.3452470302581787, "percent_done": 18.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5526.587645807131, "avg_wps": 3326.223331155903, "eta_in_seconds": 8019.050239398915, "at": "2024-05-25T22:17:19.500291"}
{"lr": 5.6929918955449466e-05, "step": 94, "loss": 1.50814950466156, "percent_done": 18.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5536.120651613291, "avg_wps": 3340.408623531156, "eta_in_seconds": 7965.377592599139, "at": "2024-05-25T22:17:31.339417"}
{"lr": 5.6841892527103325e-05, "step": 95, "loss": 1.449243187904358, "percent_done": 19.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5534.185815649729, "avg_wps": 3354.4054872665934, "eta_in_seconds": 7912.603321439342, "at": "2024-05-25T22:17:43.182648"}
{"lr": 5.675269195267157e-05, "step": 96, "loss": 1.5438588857650757, "percent_done": 19.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14142084121704, "wps": 5518.593693577431, "avg_wps": 3368.1645443526363, "eta_in_seconds": 7860.822608679533, "at": "2024-05-25T22:17:55.059376"}
{"lr": 5.6662321134076275e-05, "step": 97, "loss": 1.4851049184799194, "percent_done": 19.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14044427871704, "wps": 5531.843397891452, "avg_wps": 3381.800928535651, "eta_in_seconds": 7809.74651025251, "at": "2024-05-25T22:18:06.907604"}
{"lr": 5.657078402442983e-05, "step": 98, "loss": 1.485952377319336, "percent_done": 19.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5536.484273972819, "avg_wps": 3395.2843297455797, "eta_in_seconds": 7759.43026897372, "at": "2024-05-25T22:18:18.745900"}
{"lr": 5.6478084627861946e-05, "step": 99, "loss": 1.4768633842468262, "percent_done": 19.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5521.5026874343275, "avg_wps": 3408.5425154087948, "eta_in_seconds": 7710.021477273017, "at": "2024-05-25T22:18:30.616325"}
{"lr": 5.638422699934453e-05, "step": 100, "loss": 1.587773084640503, "percent_done": 20.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.138602256774902, "wps": 5527.2304120796, "avg_wps": 3421.6583539038124, "eta_in_seconds": 7661.314277648926, "at": "2024-05-25T22:18:42.474456"}
{"lr": 5.62892152445143e-05, "step": 101, "loss": 1.4422743320465088, "percent_done": 20.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1399564743042, "wps": 5599.027294895566, "avg_wps": 3434.8837934325293, "eta_in_seconds": 7612.736142630624, "at": "2024-05-25T22:19:08.929106"}
{"lr": 5.619305351949323e-05, "step": 102, "loss": 1.6620022058486938, "percent_done": 20.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5550.775309031288, "avg_wps": 3447.768593583235, "eta_in_seconds": 7565.278031868093, "at": "2024-05-25T22:19:20.736985"}
{"lr": 5.609574603070667e-05, "step": 103, "loss": 1.7876899242401123, "percent_done": 20.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5548.168756200814, "avg_wps": 3460.4875784576047, "eta_in_seconds": 7518.533562139401, "at": "2024-05-25T22:19:32.550395"}
{"lr": 5.599729703469942e-05, "step": 104, "loss": 1.6648534536361694, "percent_done": 20.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13893413543701, "wps": 5536.105487780869, "avg_wps": 3473.0079000580445, "eta_in_seconds": 7472.558873121555, "at": "2024-05-25T22:19:44.389502"}
{"lr": 5.589771083794951e-05, "step": 105, "loss": 1.4844549894332886, "percent_done": 21.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5532.074744759462, "avg_wps": 3485.3628532805133, "eta_in_seconds": 7427.266855625879, "at": "2024-05-25T22:19:56.237238"}
{"lr": 5.579699179667977e-05, "step": 106, "loss": 1.725979208946228, "percent_done": 21.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13897943496704, "wps": 5507.068846778387, "avg_wps": 3497.4757031259414, "eta_in_seconds": 7382.805826762938, "at": "2024-05-25T22:20:08.138792"}
{"lr": 5.569514431666738e-05, "step": 107, "loss": 1.2329559326171875, "percent_done": 21.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 3116.60980459032, "avg_wps": 3493.4857769672835, "eta_in_seconds": 7372.478276513448, "at": "2024-05-25T22:20:29.167841"}
{"lr": 5.559217285305104e-05, "step": 108, "loss": 1.6703511476516724, "percent_done": 21.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5559.812583536628, "avg_wps": 3505.5492170397974, "eta_in_seconds": 7328.4128704071045, "at": "2024-05-25T22:20:40.956426"}
{"lr": 5.548808191013616e-05, "step": 109, "loss": 1.4362456798553467, "percent_done": 21.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.141066074371338, "wps": 5537.786391318181, "avg_wps": 3517.391417086075, "eta_in_seconds": 7285.107899998306, "at": "2024-05-25T22:20:52.791888"}
{"lr": 5.538287604119777e-05, "step": 110, "loss": 1.3590904474258423, "percent_done": 22.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13897943496704, "wps": 5522.457796593279, "avg_wps": 3529.0396541955142, "eta_in_seconds": 7242.491585384715, "at": "2024-05-25T22:21:04.660314"}
{"lr": 5.5276559848281426e-05, "step": 111, "loss": 1.4913303852081299, "percent_done": 22.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13857650756836, "wps": 5542.21944924541, "avg_wps": 3540.6262525175707, "eta_in_seconds": 7200.281018611548, "at": "2024-05-25T22:21:16.486296"}
{"lr": 5.516913798200181e-05, "step": 112, "loss": 1.6864898204803467, "percent_done": 22.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5533.368550797568, "avg_wps": 3552.0477306393095, "eta_in_seconds": 7158.6785787429135, "at": "2024-05-25T22:21:28.331246"}
{"lr": 5.506061514133933e-05, "step": 113, "loss": 1.7275524139404297, "percent_done": 22.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139621257781982, "wps": 5526.840889427636, "avg_wps": 3563.3150454863935, "eta_in_seconds": 7117.650748318275, "at": "2024-05-25T22:21:40.190190"}
{"lr": 5.495099607343464e-05, "step": 114, "loss": 1.4053714275360107, "percent_done": 22.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5540.172704106169, "avg_wps": 3574.5033157661283, "eta_in_seconds": 7077.038056846251, "at": "2024-05-25T22:21:52.020570"}
{"lr": 5.4840285573380864e-05, "step": 115, "loss": 1.5559868812561035, "percent_done": 23.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5544.330666818346, "avg_wps": 3585.5807890519436, "eta_in_seconds": 7036.896247614985, "at": "2024-05-25T22:22:03.842237"}
{"lr": 5.4728488484013935e-05, "step": 116, "loss": 1.700688362121582, "percent_done": 23.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5527.996614961164, "avg_wps": 3596.4749425207824, "eta_in_seconds": 6997.35835844895, "at": "2024-05-25T22:22:15.698614"}
{"lr": 5.46156096957007e-05, "step": 117, "loss": 1.8308873176574707, "percent_done": 23.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5538.991233443881, "avg_wps": 3607.28751143355, "eta_in_seconds": 6958.216643514796, "at": "2024-05-25T22:22:27.531521"}
{"lr": 5.450165414612506e-05, "step": 118, "loss": 1.7806788682937622, "percent_done": 23.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5524.7541833277655, "avg_wps": 3617.92876689174, "eta_in_seconds": 6919.636513879745, "at": "2024-05-25T22:22:39.395007"}
{"lr": 5.43866268200719e-05, "step": 119, "loss": 1.4693626165390015, "percent_done": 23.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1409330368042, "wps": 5528.15726327424, "avg_wps": 3628.464891399468, "eta_in_seconds": 6881.482044702819, "at": "2024-05-25T22:22:51.251098"}
{"lr": 5.42705327492091e-05, "step": 120, "loss": 1.557875394821167, "percent_done": 24.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5535.1552380218445, "avg_wps": 3638.91066261737, "eta_in_seconds": 6843.718439102173, "at": "2024-05-25T22:23:03.092310"}
{"lr": 5.415337701186742e-05, "step": 121, "loss": 1.5516443252563477, "percent_done": 24.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.140570163726807, "wps": 5530.38495546787, "avg_wps": 3649.225452978279, "eta_in_seconds": 6806.415311974927, "at": "2024-05-25T22:23:14.943580"}
{"lr": 5.403516473281833e-05, "step": 122, "loss": 1.649458885192871, "percent_done": 24.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5534.151609567946, "avg_wps": 3659.441862890493, "eta_in_seconds": 6769.504456735048, "at": "2024-05-25T22:23:26.786920"}
{"lr": 5.391590108304989e-05, "step": 123, "loss": 1.552938461303711, "percent_done": 24.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.140043258666992, "wps": 5524.233557884312, "avg_wps": 3669.5126071461127, "eta_in_seconds": 6733.066389221486, "at": "2024-05-25T22:23:38.651487"}
{"lr": 5.3795591279540496e-05, "step": 124, "loss": 1.5583155155181885, "percent_done": 24.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139499187469482, "wps": 5528.478365530576, "avg_wps": 3679.490337371718, "eta_in_seconds": 6696.997067697587, "at": "2024-05-25T22:23:50.506940"}
{"lr": 5.3674240585030686e-05, "step": 125, "loss": 1.4841161966323853, "percent_done": 25.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5528.541856577655, "avg_wps": 3689.3617575612607, "eta_in_seconds": 6661.314778804778, "at": "2024-05-25T22:24:02.362356"}
{"lr": 5.3551854307792975e-05, "step": 126, "loss": 1.5494056940078735, "percent_done": 25.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5523.731345589434, "avg_wps": 3699.1112305221154, "eta_in_seconds": 6626.041357653481, "at": "2024-05-25T22:24:14.227903"}
{"lr": 5.3428437801399596e-05, "step": 127, "loss": 1.463014006614685, "percent_done": 25.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5531.165834359518, "avg_wps": 3708.7839713260078, "eta_in_seconds": 6591.089745046585, "at": "2024-05-25T22:24:26.077518"}
{"lr": 5.3303996464488364e-05, "step": 128, "loss": 1.713060975074768, "percent_done": 25.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5535.1767499219595, "avg_wps": 3718.369260831204, "eta_in_seconds": 6556.474166460335, "at": "2024-05-25T22:24:37.918589"}
{"lr": 5.317853574052649e-05, "step": 129, "loss": 1.561232089996338, "percent_done": 25.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14098072052002, "wps": 5528.585111383596, "avg_wps": 3727.8312598566954, "eta_in_seconds": 6522.252297689748, "at": "2024-05-25T22:24:49.773921"}
{"lr": 5.3052061117572476e-05, "step": 130, "loss": 1.5533205270767212, "percent_done": 26.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1409330368042, "wps": 5523.546868781365, "avg_wps": 3737.1771322003938, "eta_in_seconds": 6488.405323652121, "at": "2024-05-25T22:25:01.639827"}
{"lr": 5.292457812803603e-05, "step": 131, "loss": 1.6568609476089478, "percent_done": 26.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5528.329261817617, "avg_wps": 3746.4430065582296, "eta_in_seconds": 6454.865043367138, "at": "2024-05-25T22:25:13.495524"}
{"lr": 5.2796092348436136e-05, "step": 132, "loss": 1.3584004640579224, "percent_done": 26.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13897943496704, "wps": 5516.80550091994, "avg_wps": 3755.573133584753, "eta_in_seconds": 6421.722368905038, "at": "2024-05-25T22:25:25.375968"}
{"lr": 5.266660939915699e-05, "step": 133, "loss": 1.4305424690246582, "percent_done": 26.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5530.349572420729, "avg_wps": 3764.656876385959, "eta_in_seconds": 6388.819164600587, "at": "2024-05-25T22:25:37.227363"}
{"lr": 5.25361349442023e-05, "step": 134, "loss": 1.5304365158081055, "percent_done": 26.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5522.819848235018, "avg_wps": 3773.621908271301, "eta_in_seconds": 6356.274312332494, "at": "2024-05-25T22:25:49.095116"}
{"lr": 5.240467469094738e-05, "step": 135, "loss": 1.8120039701461792, "percent_done": 27.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139307498931885, "wps": 5535.127707492048, "avg_wps": 3782.538646915194, "eta_in_seconds": 6323.964467490161, "at": "2024-05-25T22:26:00.936199"}
{"lr": 5.227223438988959e-05, "step": 136, "loss": 1.4749547243118286, "percent_done": 27.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5489.787344893303, "avg_wps": 3791.2078655688274, "eta_in_seconds": 6292.217373953146, "at": "2024-05-25T22:26:12.875129"}
{"lr": 5.2138819834396735e-05, "step": 137, "loss": 1.613757610321045, "percent_done": 27.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5525.56635062068, "avg_wps": 3799.9137971247605, "eta_in_seconds": 6260.5546520556845, "at": "2024-05-25T22:26:24.736742"}
{"lr": 5.200443686045369e-05, "step": 138, "loss": 1.5715901851654053, "percent_done": 27.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5523.934040091993, "avg_wps": 3808.5271421746756, "eta_in_seconds": 6229.188112455866, "at": "2024-05-25T22:26:36.601900"}
{"lr": 5.1869091346407056e-05, "step": 139, "loss": 1.4897774457931519, "percent_done": 27.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5534.811850483233, "avg_wps": 3817.0921429157083, "eta_in_seconds": 6198.041628077734, "at": "2024-05-25T22:26:48.443835"}
{"lr": 5.1732789212708097e-05, "step": 140, "loss": 1.5047266483306885, "percent_done": 28.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1384916305542, "wps": 5532.469348260165, "avg_wps": 3825.5645754605275, "eta_in_seconds": 6167.183832509177, "at": "2024-05-25T22:27:00.290624"}
{"lr": 5.159553642165368e-05, "step": 141, "loss": 1.8195000886917114, "percent_done": 28.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5537.891488654509, "avg_wps": 3833.972176303514, "eta_in_seconds": 6136.566182043535, "at": "2024-05-25T22:27:12.125840"}
{"lr": 5.145733897712554e-05, "step": 142, "loss": 1.4714698791503906, "percent_done": 28.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13897943496704, "wps": 5524.16039616699, "avg_wps": 3842.250953086935, "eta_in_seconds": 6106.287248403254, "at": "2024-05-25T22:27:23.990534"}
{"lr": 5.131820292432759e-05, "step": 143, "loss": 1.49951171875, "percent_done": 28.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1384916305542, "wps": 5527.2720903651525, "avg_wps": 3850.459589909883, "eta_in_seconds": 6076.249199267034, "at": "2024-05-25T22:27:35.848480"}
{"lr": 5.117813434952152e-05, "step": 144, "loss": 1.6421213150024414, "percent_done": 28.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5532.893966195105, "avg_wps": 3858.6076442062945, "eta_in_seconds": 6046.433882706696, "at": "2024-05-25T22:27:47.694640"}
{"lr": 5.103713937976054e-05, "step": 145, "loss": 1.5833499431610107, "percent_done": 29.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14060688018799, "wps": 5534.089215198446, "avg_wps": 3866.681181611136, "eta_in_seconds": 6016.860172140187, "at": "2024-05-25T22:27:59.538005"}
{"lr": 5.0895224182621414e-05, "step": 146, "loss": 1.7415547370910645, "percent_done": 29.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5538.220864108457, "avg_wps": 3874.69114727732, "eta_in_seconds": 5987.507937581572, "at": "2024-05-25T22:28:11.372536"}
{"lr": 5.075239496593458e-05, "step": 147, "loss": 1.363211989402771, "percent_done": 29.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5525.6680965942705, "avg_wps": 3882.5826477907335, "eta_in_seconds": 5958.458608257528, "at": "2024-05-25T22:28:23.233990"}
{"lr": 5.0608657977512685e-05, "step": 148, "loss": 1.411226749420166, "percent_done": 29.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5536.754484904988, "avg_wps": 3890.4361239585437, "eta_in_seconds": 5929.585081203564, "at": "2024-05-25T22:28:35.071801"}
{"lr": 5.0464019504877256e-05, "step": 149, "loss": 1.9325288534164429, "percent_done": 29.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5533.476042541659, "avg_wps": 3898.2044675756474, "eta_in_seconds": 5900.956758767967, "at": "2024-05-25T22:28:46.916420"}
{"lr": 5.031848587498364e-05, "step": 150, "loss": 1.431246280670166, "percent_done": 30.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5529.682275088901, "avg_wps": 3905.8870887304815, "eta_in_seconds": 5872.571192900339, "at": "2024-05-25T22:28:58.769256"}
{"lr": 5.017206345394427e-05, "step": 151, "loss": 1.4973747730255127, "percent_done": 30.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1399564743042, "wps": 5526.7336553117175, "avg_wps": 3913.4879082228986, "eta_in_seconds": 5844.419233273197, "at": "2024-05-25T22:29:10.628409"}
{"lr": 5.00247586467502e-05, "step": 152, "loss": 1.4542311429977417, "percent_done": 30.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5532.066951239151, "avg_wps": 3921.035417625128, "eta_in_seconds": 5816.455494761467, "at": "2024-05-25T22:29:22.476201"}
{"lr": 4.987657789699088e-05, "step": 153, "loss": 1.8025246858596802, "percent_done": 30.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5539.373986806565, "avg_wps": 3928.5369174809694, "eta_in_seconds": 5788.666996817184, "at": "2024-05-25T22:29:34.308481"}
{"lr": 4.9727527686572356e-05, "step": 154, "loss": 1.5920372009277344, "percent_done": 30.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5535.196032751744, "avg_wps": 3935.9554873862685, "eta_in_seconds": 5761.105803322482, "at": "2024-05-25T22:29:46.149494"}
{"lr": 4.957761453543368e-05, "step": 155, "loss": 1.2139917612075806, "percent_done": 31.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5527.079264103846, "avg_wps": 3943.2792474493085, "eta_in_seconds": 5733.786166583338, "at": "2024-05-25T22:29:58.007926"}
{"lr": 4.942684500126173e-05, "step": 156, "loss": 1.8046396970748901, "percent_done": 31.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5534.837929054387, "avg_wps": 3950.5612688475035, "eta_in_seconds": 5706.628113269806, "at": "2024-05-25T22:30:09.849705"}
{"lr": 4.927522567920438e-05, "step": 157, "loss": 1.65402090549469, "percent_done": 31.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13886022567749, "wps": 5522.012592526507, "avg_wps": 3957.7350910627347, "eta_in_seconds": 5679.7252678081495, "at": "2024-05-25T22:30:21.718994"}
{"lr": 4.9122763201581924e-05, "step": 158, "loss": 1.6110213994979858, "percent_done": 31.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5525.584233648117, "avg_wps": 3964.855358902498, "eta_in_seconds": 5652.996130028858, "at": "2024-05-25T22:30:33.580731"}
{"lr": 4.8969464237597066e-05, "step": 159, "loss": 1.2890688180923462, "percent_done": 31.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5540.148585143146, "avg_wps": 3971.9584529639815, "eta_in_seconds": 5626.387149977234, "at": "2024-05-25T22:30:45.411148"}
{"lr": 4.8815335493043095e-05, "step": 160, "loss": 1.5860767364501953, "percent_done": 32.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1384916305542, "wps": 5525.745852593415, "avg_wps": 3978.951224212477, "eta_in_seconds": 5600.028435736895, "at": "2024-05-25T22:30:57.272398"}
{"lr": 4.866038371001062e-05, "step": 161, "loss": 1.0712507963180542, "percent_done": 32.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139376640319824, "wps": 5532.372807721712, "avg_wps": 3985.902727249423, "eta_in_seconds": 5573.819914900739, "at": "2024-05-25T22:31:09.119445"}
{"lr": 4.850461566659259e-05, "step": 162, "loss": 1.2214797735214233, "percent_done": 32.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5539.230099270619, "avg_wps": 3992.814312803984, "eta_in_seconds": 5547.758113610892, "at": "2024-05-25T22:31:20.951833"}
{"lr": 4.834803817658786e-05, "step": 163, "loss": 1.8359795808792114, "percent_done": 32.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13971185684204, "wps": 5536.410229852604, "avg_wps": 3999.655639904624, "eta_in_seconds": 5521.883379071768, "at": "2024-05-25T22:31:32.790385"}
{"lr": 4.819065808920307e-05, "step": 164, "loss": 1.3456029891967773, "percent_done": 32.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5539.916562513642, "avg_wps": 4006.447781202731, "eta_in_seconds": 5496.164483489059, "at": "2024-05-25T22:31:44.621283"}
{"lr": 4.803248228875308e-05, "step": 165, "loss": 1.512420892715454, "percent_done": 33.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5544.381661777678, "avg_wps": 4013.1944720073416, "eta_in_seconds": 5470.594598177708, "at": "2024-05-25T22:31:56.442753"}
{"lr": 4.7873517694359834e-05, "step": 166, "loss": 1.333431363105774, "percent_done": 33.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13935899734497, "wps": 5543.356127668449, "avg_wps": 4019.8789796635306, "eta_in_seconds": 5445.194770970977, "at": "2024-05-25T22:32:08.266379"}
{"lr": 4.7713771259649654e-05, "step": 167, "loss": 1.384599208831787, "percent_done": 33.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5543.143845234439, "avg_wps": 4026.504668133657, "eta_in_seconds": 5419.95844999616, "at": "2024-05-25T22:32:20.090524"}
{"lr": 4.755324997244911e-05, "step": 168, "loss": 1.3218507766723633, "percent_done": 33.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1384916305542, "wps": 5539.795311066067, "avg_wps": 4033.0624095732774, "eta_in_seconds": 5394.895935245923, "at": "2024-05-25T22:32:31.921649"}
{"lr": 4.739196085447931e-05, "step": 169, "loss": 1.4310145378112793, "percent_done": 33.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1392240524292, "wps": 5539.7708604503805, "avg_wps": 4039.563484265146, "eta_in_seconds": 5369.990120094909, "at": "2024-05-25T22:32:43.752867"}
{"lr": 4.722991096104879e-05, "step": 170, "loss": 1.3229132890701294, "percent_done": 34.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5522.456576150099, "avg_wps": 4045.9542010776304, "eta_in_seconds": 5345.3101357992955, "at": "2024-05-25T22:32:55.621230"}
{"lr": 4.706710738074485e-05, "step": 171, "loss": 1.4226155281066895, "percent_done": 34.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5533.96075407876, "avg_wps": 4052.3262200198014, "eta_in_seconds": 5320.732544551816, "at": "2024-05-25T22:33:07.464856"}
{"lr": 4.6903557235123503e-05, "step": 172, "loss": 1.5008213520050049, "percent_done": 34.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5538.737433173409, "avg_wps": 4058.6588234779615, "eta_in_seconds": 5296.283559399983, "at": "2024-05-25T22:33:19.298460"}
{"lr": 4.673926767839795e-05, "step": 173, "loss": 1.2238497734069824, "percent_done": 34.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13941717147827, "wps": 5536.440560939478, "avg_wps": 4064.9305437467933, "eta_in_seconds": 5271.989710369551, "at": "2024-05-25T22:33:31.136760"}
{"lr": 4.6574245897125624e-05, "step": 174, "loss": 1.0429325103759766, "percent_done": 34.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5528.988225345801, "avg_wps": 4071.1260646272876, "eta_in_seconds": 5247.868933765368, "at": "2024-05-25T22:33:42.991038"}
{"lr": 4.640849910989384e-05, "step": 175, "loss": 1.3254176378250122, "percent_done": 35.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5534.000528480136, "avg_wps": 4077.284932343515, "eta_in_seconds": 5223.868420634951, "at": "2024-05-25T22:33:54.834594"}
{"lr": 4.6242034567004e-05, "step": 176, "loss": 1.284037470817566, "percent_done": 35.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5522.944241627757, "avg_wps": 4083.3578875268263, "eta_in_seconds": 5200.049710279161, "at": "2024-05-25T22:34:06.725057"}
{"lr": 4.60748595501545e-05, "step": 177, "loss": 1.6696220636367798, "percent_done": 35.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5540.69600331122, "avg_wps": 4089.434842627239, "eta_in_seconds": 5176.296680252431, "at": "2024-05-25T22:34:18.554388"}
{"lr": 4.590698137212215e-05, "step": 178, "loss": 1.2060277462005615, "percent_done": 35.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5528.969653010865, "avg_wps": 4095.4252584140954, "eta_in_seconds": 5152.7230186033785, "at": "2024-05-25T22:34:30.408665"}
{"lr": 4.5738407376442294e-05, "step": 179, "loss": 1.4724308252334595, "percent_done": 35.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13897943496704, "wps": 5499.342895623346, "avg_wps": 4101.274460591106, "eta_in_seconds": 5129.394826448164, "at": "2024-05-25T22:34:42.326808"}
{"lr": 4.5569144937087604e-05, "step": 180, "loss": 1.3961241245269775, "percent_done": 36.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1399564743042, "wps": 5535.978828425462, "avg_wps": 4107.1878988471835, "eta_in_seconds": 5106.053220960829, "at": "2024-05-25T22:34:54.166070"}
{"lr": 4.5399201458145525e-05, "step": 181, "loss": 1.4968873262405396, "percent_done": 36.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5536.853408997794, "avg_wps": 4113.055457033859, "eta_in_seconds": 5082.835429376001, "at": "2024-05-25T22:35:06.003488"}
{"lr": 4.522858437349436e-05, "step": 182, "loss": 1.233327031135559, "percent_done": 36.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5539.635213694547, "avg_wps": 4118.883503565273, "eta_in_seconds": 5059.732323567946, "at": "2024-05-25T22:35:17.835049"}
{"lr": 4.505730114647811e-05, "step": 183, "loss": 1.6046642065048218, "percent_done": 36.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5521.777760493074, "avg_wps": 4124.609852381241, "eta_in_seconds": 5036.818691592399, "at": "2024-05-25T22:35:29.704688"}
{"lr": 4.488535926958002e-05, "step": 184, "loss": 1.260197401046753, "percent_done": 36.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5539.118030681845, "avg_wps": 4130.342207085291, "eta_in_seconds": 5013.961304338082, "at": "2024-05-25T22:35:41.537243"}
{"lr": 4.471276626409479e-05, "step": 185, "loss": 1.5981565713882446, "percent_done": 37.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5541.857642972014, "avg_wps": 4136.036540662585, "eta_in_seconds": 4991.213157099646, "at": "2024-05-25T22:35:53.363964"}
{"lr": 4.45395296797996e-05, "step": 186, "loss": 1.5876941680908203, "percent_done": 37.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5546.001351484951, "avg_wps": 4141.697548283214, "eta_in_seconds": 4968.56754026618, "at": "2024-05-25T22:36:05.181939"}
{"lr": 4.4365657094623857e-05, "step": 187, "loss": 1.6379966735839844, "percent_done": 37.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5537.327446090922, "avg_wps": 4147.287300719299, "eta_in_seconds": 4946.068722184329, "at": "2024-05-25T22:36:17.018276"}
{"lr": 4.419115611431772e-05, "step": 188, "loss": 1.8801261186599731, "percent_done": 37.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139856815338135, "wps": 5523.667742987618, "avg_wps": 4152.791488249696, "eta_in_seconds": 4923.731918121906, "at": "2024-05-25T22:36:28.884026"}
{"lr": 4.401603437211934e-05, "step": 189, "loss": 1.3729376792907715, "percent_done": 37.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.138864517211914, "wps": 5533.013356487571, "avg_wps": 4158.279804016645, "eta_in_seconds": 4901.472955310155, "at": "2024-05-25T22:36:40.729562"}
{"lr": 4.384029952842108e-05, "step": 190, "loss": 1.5538232326507568, "percent_done": 38.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5528.783936523735, "avg_wps": 4163.712029837937, "eta_in_seconds": 4879.338401505822, "at": "2024-05-25T22:36:52.584226"}
{"lr": 4.366395927043427e-05, "step": 191, "loss": 1.683979868888855, "percent_done": 38.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13849115371704, "wps": 5530.42723769031, "avg_wps": 4169.1062533859085, "eta_in_seconds": 4857.305803504914, "at": "2024-05-25T22:37:04.435571"}
{"lr": 4.348702131185308e-05, "step": 192, "loss": 1.6441792249679565, "percent_done": 38.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5537.756045483439, "avg_wps": 4174.479783032736, "eta_in_seconds": 4835.354115749399, "at": "2024-05-25T22:37:16.271069"}
{"lr": 4.3309493392517e-05, "step": 193, "loss": 1.573068380355835, "percent_done": 38.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13971185684204, "wps": 5541.468848867806, "avg_wps": 4179.82223526197, "eta_in_seconds": 4813.494657803076, "at": "2024-05-25T22:37:28.098659"}
{"lr": 4.313138327807234e-05, "step": 194, "loss": 1.5878041982650757, "percent_done": 38.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5536.753035085491, "avg_wps": 4185.109214607493, "eta_in_seconds": 4791.754521006162, "at": "2024-05-25T22:37:39.936367"}
{"lr": 4.2952698759632504e-05, "step": 195, "loss": 1.5733189582824707, "percent_done": 39.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14044427871704, "wps": 5534.239966858734, "avg_wps": 4190.347769654751, "eta_in_seconds": 4770.124366466815, "at": "2024-05-25T22:37:51.779418"}
{"lr": 4.277344765343719e-05, "step": 196, "loss": 1.3800745010375977, "percent_done": 39.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139386653900146, "wps": 5539.15542358136, "avg_wps": 4195.560201101285, "eta_in_seconds": 4748.577792965636, "at": "2024-05-25T22:38:03.612119"}
{"lr": 4.2593637800510475e-05, "step": 197, "loss": 1.6179745197296143, "percent_done": 39.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5539.640349170898, "avg_wps": 4200.733916607026, "eta_in_seconds": 4727.1282576352805, "at": "2024-05-25T22:38:15.443591"}
{"lr": 4.241327706631782e-05, "step": 198, "loss": 1.4495550394058228, "percent_done": 39.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5515.075784395491, "avg_wps": 4205.7961234189415, "eta_in_seconds": 4705.856256273058, "at": "2024-05-25T22:38:27.327769"}
{"lr": 4.223237334042203e-05, "step": 199, "loss": 1.693682074546814, "percent_done": 39.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13873529434204, "wps": 5534.125760301313, "avg_wps": 4210.8750989645405, "eta_in_seconds": 4684.6167450682005, "at": "2024-05-25T22:38:39.171042"}
{"lr": 4.205093453613813e-05, "step": 200, "loss": 1.4700599908828735, "percent_done": 40.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1384916305542, "wps": 5537.086290490554, "avg_wps": 4215.9239687641675, "eta_in_seconds": 4663.461709856987, "at": "2024-05-25T22:38:51.007986"}
{"lr": 4.186896859018719e-05, "step": 201, "loss": 1.369512915611267, "percent_done": 40.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.138686656951904, "wps": 5595.435397297564, "avg_wps": 4221.101481224286, "eta_in_seconds": 4642.215802477367, "at": "2024-05-25T22:39:17.079303"}
{"lr": 4.1686483462349175e-05, "step": 202, "loss": 1.2966172695159912, "percent_done": 40.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139472007751465, "wps": 5561.9329520145475, "avg_wps": 4226.145091015676, "eta_in_seconds": 4621.168364881289, "at": "2024-05-25T22:39:28.863491"}
{"lr": 4.1503487135114756e-05, "step": 203, "loss": 1.4266027212142944, "percent_done": 40.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5543.294308093675, "avg_wps": 4231.097586008466, "eta_in_seconds": 4600.2701673355, "at": "2024-05-25T22:39:40.687235"}
{"lr": 4.1319987613336105e-05, "step": 204, "loss": 1.4435640573501587, "percent_done": 40.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5536.516836170746, "avg_wps": 4235.993553334483, "eta_in_seconds": 4579.481945795172, "at": "2024-05-25T22:39:52.525354"}
{"lr": 4.113599292387675e-05, "step": 205, "loss": 1.3507176637649536, "percent_done": 41.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5534.672991802267, "avg_wps": 4240.847654335366, "eta_in_seconds": 4558.786727515662, "at": "2024-05-25T22:40:04.367607"}
{"lr": 4.095151111526049e-05, "step": 206, "loss": 1.550918698310852, "percent_done": 41.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5530.640105119984, "avg_wps": 4245.654075438708, "eta_in_seconds": 4538.189795410749, "at": "2024-05-25T22:40:16.218426"}
{"lr": 4.076655025731926e-05, "step": 207, "loss": 1.2539643049240112, "percent_done": 41.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13878059387207, "wps": 5525.05068056548, "avg_wps": 4250.408842975308, "eta_in_seconds": 4517.694346447497, "at": "2024-05-25T22:40:28.081219"}
{"lr": 4.058111844084018e-05, "step": 208, "loss": 1.5834758281707764, "percent_done": 41.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5535.966006718693, "avg_wps": 4255.159465059896, "eta_in_seconds": 4497.249082469023, "at": "2024-05-25T22:40:39.920649"}
{"lr": 4.0395223777211613e-05, "step": 209, "loss": 1.621875286102295, "percent_done": 41.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5529.24213391026, "avg_wps": 4259.856033280293, "eta_in_seconds": 4476.906226644105, "at": "2024-05-25T22:40:51.774459"}
{"lr": 4.020887439806836e-05, "step": 210, "loss": 1.5037541389465332, "percent_done": 42.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5535.651168833208, "avg_wps": 4264.536236824635, "eta_in_seconds": 4456.625279880705, "at": "2024-05-25T22:41:03.614549"}
{"lr": 4.0022078454935966e-05, "step": 211, "loss": 1.6204335689544678, "percent_done": 42.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1384916305542, "wps": 5533.3081790277165, "avg_wps": 4269.175620311635, "eta_in_seconds": 4436.431218685132, "at": "2024-05-25T22:41:15.459637"}
{"lr": 3.9834844118874095e-05, "step": 212, "loss": 1.549316167831421, "percent_done": 42.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5531.893272769696, "avg_wps": 4273.777216215136, "eta_in_seconds": 4416.3200478463805, "at": "2024-05-25T22:41:27.307751"}
{"lr": 3.964717958011919e-05, "step": 213, "loss": 1.008284568786621, "percent_done": 42.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5529.038716036724, "avg_wps": 4278.337375397288, "eta_in_seconds": 4396.294716765623, "at": "2024-05-25T22:41:39.161993"}
{"lr": 3.9459093047726116e-05, "step": 214, "loss": 1.1781988143920898, "percent_done": 42.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5528.792610429211, "avg_wps": 4282.863831812949, "eta_in_seconds": 4376.346467234264, "at": "2024-05-25T22:41:51.016714"}
{"lr": 3.92705927492091e-05, "step": 215, "loss": 1.2642954587936401, "percent_done": 43.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1409330368042, "wps": 5524.645253572456, "avg_wps": 4287.346027755422, "eta_in_seconds": 4356.485312611558, "at": "2024-05-25T22:42:02.880291"}
{"lr": 3.908168693018187e-05, "step": 216, "loss": 1.4156056642532349, "percent_done": 43.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5533.407871127302, "avg_wps": 4291.820426712731, "eta_in_seconds": 4336.673520670996, "at": "2024-05-25T22:42:14.725120"}
{"lr": 3.889238385399692e-05, "step": 217, "loss": 1.051167607307434, "percent_done": 43.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5537.368384395405, "avg_wps": 4296.273801586775, "eta_in_seconds": 4316.924119954834, "at": "2024-05-25T22:42:26.561508"}
{"lr": 3.870269180138406e-05, "step": 218, "loss": 1.093568205833435, "percent_done": 43.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5548.996224077958, "avg_wps": 4300.727551831314, "eta_in_seconds": 4297.21524492535, "at": "2024-05-25T22:42:38.373204"}
{"lr": 3.851261907008817e-05, "step": 219, "loss": 1.4760338068008423, "percent_done": 43.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.141066551208496, "wps": 5534.63198190342, "avg_wps": 4305.110162880705, "eta_in_seconds": 4277.617831660188, "at": "2024-05-25T22:42:50.215507"}
{"lr": 3.8322173974506286e-05, "step": 220, "loss": 1.2785446643829346, "percent_done": 44.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13966703414917, "wps": 5540.802216305511, "avg_wps": 4309.478736584486, "eta_in_seconds": 4258.074148091403, "at": "2024-05-25T22:43:02.044583"}
{"lr": 3.813136484532385e-05, "step": 221, "loss": 1.3685591220855713, "percent_done": 44.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5533.759885374925, "avg_wps": 4313.797190617208, "eta_in_seconds": 4238.619293408156, "at": "2024-05-25T22:43:13.888729"}
{"lr": 3.794020002915029e-05, "step": 222, "loss": 1.6812156438827515, "percent_done": 44.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14044427871704, "wps": 5533.822049505497, "avg_wps": 4318.085456935062, "eta_in_seconds": 4219.232847913965, "at": "2024-05-25T22:43:25.732736"}
{"lr": 3.774868788815397e-05, "step": 223, "loss": 1.6355894804000854, "percent_done": 44.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13873529434204, "wps": 5535.39332722666, "avg_wps": 4322.3479806554005, "eta_in_seconds": 4199.909882602135, "at": "2024-05-25T22:43:37.573393"}
{"lr": 3.755683679969634e-05, "step": 224, "loss": 1.2441591024398804, "percent_done": 44.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5538.676162978722, "avg_wps": 4326.5897054741245, "eta_in_seconds": 4180.645088004215, "at": "2024-05-25T22:43:49.407047"}
{"lr": 3.736465515596552e-05, "step": 225, "loss": 1.7374337911605835, "percent_done": 45.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5527.72203358173, "avg_wps": 4330.772123855132, "eta_in_seconds": 4161.475017521117, "at": "2024-05-25T22:44:01.264121"}
{"lr": 3.717215136360919e-05, "step": 226, "loss": 1.3517248630523682, "percent_done": 45.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5533.533076126499, "avg_wps": 4334.941312950405, "eta_in_seconds": 4142.354579600613, "at": "2024-05-25T22:44:13.108762"}
{"lr": 3.697933384336687e-05, "step": 227, "loss": 1.5427135229110718, "percent_done": 45.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13971185684204, "wps": 5532.932388814647, "avg_wps": 4339.080070889723, "eta_in_seconds": 4123.299802654115, "at": "2024-05-25T22:44:24.954749"}
{"lr": 3.6786211029701516e-05, "step": 228, "loss": 1.4166542291641235, "percent_done": 45.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 2669.9194216301294, "avg_wps": 4327.214910834508, "eta_in_seconds": 4119.460754160295, "at": "2024-05-25T22:44:49.501886"}
{"lr": 3.659279137043063e-05, "step": 229, "loss": 1.2034482955932617, "percent_done": 45.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1409330368042, "wps": 5547.563767731052, "avg_wps": 4331.375665085092, "eta_in_seconds": 4100.373039254975, "at": "2024-05-25T22:45:01.316589"}
{"lr": 3.639908332635672e-05, "step": 230, "loss": 1.5192251205444336, "percent_done": 46.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13909387588501, "wps": 5539.994608380083, "avg_wps": 4335.488016399378, "eta_in_seconds": 4081.367526116578, "at": "2024-05-25T22:45:13.147369"}
{"lr": 3.6205095370897137e-05, "step": 231, "loss": 1.5551331043243408, "percent_done": 46.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139253616333008, "wps": 5536.502116225615, "avg_wps": 4339.56319524393, "eta_in_seconds": 4062.4328317931204, "at": "2024-05-25T22:45:24.985583"}
{"lr": 3.601083598971351e-05, "step": 232, "loss": 1.3341258764266968, "percent_done": 46.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5530.741704186446, "avg_wps": 4343.595514073156, "eta_in_seconds": 4043.5735655159788, "at": "2024-05-25T22:45:36.836302"}
{"lr": 3.581631368034047e-05, "step": 233, "loss": 1.7266117334365845, "percent_done": 46.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5536.8398025431225, "avg_wps": 4347.616779511352, "eta_in_seconds": 4024.759514790236, "at": "2024-05-25T22:45:48.673797"}
{"lr": 3.5621536951813995e-05, "step": 234, "loss": 1.6123225688934326, "percent_done": 46.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5534.2751768553435, "avg_wps": 4351.604259377046, "eta_in_seconds": 4006.011337642996, "at": "2024-05-25T22:46:00.516802"}
{"lr": 3.542651432429918e-05, "step": 235, "loss": 1.3343654870986938, "percent_done": 47.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1411771774292, "wps": 5531.498640126004, "avg_wps": 4355.5577092161975, "eta_in_seconds": 3987.328640658805, "at": "2024-05-25T22:46:12.365791"}
{"lr": 3.523125432871754e-05, "step": 236, "loss": 1.1647117137908936, "percent_done": 47.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5534.28843643222, "avg_wps": 4359.492092862663, "eta_in_seconds": 3968.697185694161, "at": "2024-05-25T22:46:24.208726"}
{"lr": 3.503576550637384e-05, "step": 237, "loss": 1.777500867843628, "percent_done": 47.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5514.7734970101465, "avg_wps": 4363.348933563799, "eta_in_seconds": 3950.169528597015, "at": "2024-05-25T22:46:36.093776"}
{"lr": 3.484005640858246e-05, "step": 238, "loss": 1.4067996740341187, "percent_done": 47.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5525.385083236194, "avg_wps": 4367.208015584494, "eta_in_seconds": 3931.672578619308, "at": "2024-05-25T22:46:47.955734"}
{"lr": 3.464413559629336e-05, "step": 239, "loss": 1.2412711381912231, "percent_done": 47.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5534.256903256877, "avg_wps": 4371.064744126738, "eta_in_seconds": 3913.210396387587, "at": "2024-05-25T22:46:59.798816"}
{"lr": 3.444801163971754e-05, "step": 240, "loss": 1.4133297204971313, "percent_done": 48.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5530.940016732186, "avg_wps": 4374.887424455268, "eta_in_seconds": 3894.811076680819, "at": "2024-05-25T22:47:11.648940"}
{"lr": 3.4251693117952235e-05, "step": 241, "loss": 1.4693609476089478, "percent_done": 48.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1392240524292, "wps": 5522.709330349719, "avg_wps": 4378.663553752841, "eta_in_seconds": 3876.485094510668, "at": "2024-05-25T22:47:23.516714"}
{"lr": 3.4055188618605555e-05, "step": 242, "loss": 1.3353869915008545, "percent_done": 48.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.138741493225098, "wps": 5539.252870733412, "avg_wps": 4382.457837082424, "eta_in_seconds": 3858.1747112155945, "at": "2024-05-25T22:47:35.349209"}
{"lr": 3.3858506737420905e-05, "step": 243, "loss": 1.2679318189620972, "percent_done": 48.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13873529434204, "wps": 5519.522415991749, "avg_wps": 4386.1762998708455, "eta_in_seconds": 3839.9623837500444, "at": "2024-05-25T22:47:47.223794"}
{"lr": 3.366165607790091e-05, "step": 244, "loss": 1.3092782497406006, "percent_done": 48.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5533.8629359943325, "avg_wps": 4389.907602546346, "eta_in_seconds": 3821.7697316154104, "at": "2024-05-25T22:47:59.067713"}
{"lr": 3.3464645250931154e-05, "step": 245, "loss": 1.3463435173034668, "percent_done": 49.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5542.63763010593, "avg_wps": 4393.637262477201, "eta_in_seconds": 3803.6094018780454, "at": "2024-05-25T22:48:10.892919"}
{"lr": 3.3267482874403404e-05, "step": 246, "loss": 1.691806674003601, "percent_done": 49.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5529.3287773420025, "avg_wps": 4397.308731074106, "eta_in_seconds": 3785.529972541623, "at": "2024-05-25T22:48:22.746613"}
{"lr": 3.3070177572838744e-05, "step": 247, "loss": 1.520065426826477, "percent_done": 49.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5521.833222090956, "avg_wps": 4400.937287322642, "eta_in_seconds": 3767.5174440140668, "at": "2024-05-25T22:48:34.616243"}
{"lr": 3.287273797701024e-05, "step": 248, "loss": 1.6431244611740112, "percent_done": 49.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.140637397766113, "wps": 5534.171553779217, "avg_wps": 4404.574086490185, "eta_in_seconds": 3749.5275764926787, "at": "2024-05-25T22:48:46.459472"}
{"lr": 3.267517272356543e-05, "step": 249, "loss": 1.0544090270996094, "percent_done": 49.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5529.259818292591, "avg_wps": 4408.175091096154, "eta_in_seconds": 3731.597692937736, "at": "2024-05-25T22:48:58.313206"}
{"lr": 3.247749045464852e-05, "step": 250, "loss": 1.5963233709335327, "percent_done": 50.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13971185684204, "wps": 5534.015569369136, "avg_wps": 4411.765210272437, "eta_in_seconds": 3713.706242084503, "at": "2024-05-25T22:49:10.156712"}
{"lr": 3.227969981752235e-05, "step": 251, "loss": 1.6758294105529785, "percent_done": 50.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1384916305542, "wps": 5532.253890444075, "avg_wps": 4415.328036363264, "eta_in_seconds": 3695.8667318953935, "at": "2024-05-25T22:49:22.004135"}
{"lr": 3.208180946419016e-05, "step": 252, "loss": 1.1712573766708374, "percent_done": 50.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1399564743042, "wps": 5538.17723523053, "avg_wps": 4418.883257101735, "eta_in_seconds": 3678.0623189986695, "at": "2024-05-25T22:49:33.838737"}
{"lr": 3.188382805101706e-05, "step": 253, "loss": 1.2246155738830566, "percent_done": 50.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5540.9633863865265, "avg_wps": 4422.423054089256, "eta_in_seconds": 3660.2992979226847, "at": "2024-05-25T22:49:45.667391"}
{"lr": 3.168576423835144e-05, "step": 254, "loss": 1.5317556858062744, "percent_done": 50.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139402866363525, "wps": 5532.742953765316, "avg_wps": 4425.9199077964195, "eta_in_seconds": 3642.600032504149, "at": "2024-05-25T22:49:57.513821"}
{"lr": 3.148762669014611e-05, "step": 255, "loss": 1.5544838905334473, "percent_done": 51.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.141308784484863, "wps": 5527.811964316946, "avg_wps": 4429.382399854723, "eta_in_seconds": 3624.956833830067, "at": "2024-05-25T22:50:09.370538"}
{"lr": 3.12894240735793e-05, "step": 256, "loss": 1.4938002824783325, "percent_done": 51.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5518.587156727684, "avg_wps": 4432.799988547965, "eta_in_seconds": 3607.377738971263, "at": "2024-05-25T22:50:21.247309"}
{"lr": 3.109116505867555e-05, "step": 257, "loss": 1.6491687297821045, "percent_done": 51.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5539.9196887721655, "avg_wps": 4436.249630038278, "eta_in_seconds": 3589.7997921867595, "at": "2024-05-25T22:50:33.078155"}
{"lr": 3.089285831792642e-05, "step": 258, "loss": 1.2178406715393066, "percent_done": 51.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14020013809204, "wps": 5522.017029790733, "avg_wps": 4439.633132010343, "eta_in_seconds": 3572.302379142406, "at": "2024-05-25T22:50:44.947419"}
{"lr": 3.0694512525911205e-05, "step": 259, "loss": 1.3444440364837646, "percent_done": 51.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1399564743042, "wps": 5536.3724279705675, "avg_wps": 4443.031400791835, "eta_in_seconds": 3554.8198010000942, "at": "2024-05-25T22:50:56.785908"}
{"lr": 3.0496136358917387e-05, "step": 260, "loss": 1.1937881708145142, "percent_done": 52.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5539.539762552092, "avg_wps": 4446.416528515833, "eta_in_seconds": 3537.3744000654956, "at": "2024-05-25T22:51:08.617601"}
{"lr": 3.029773849456115e-05, "step": 261, "loss": 1.566652536392212, "percent_done": 52.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5530.235860158809, "avg_wps": 4449.757779523455, "eta_in_seconds": 3519.990250273226, "at": "2024-05-25T22:51:20.469390"}
{"lr": 3.009932761140782e-05, "step": 262, "loss": 1.2333173751831055, "percent_done": 52.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13897943496704, "wps": 5520.503892488975, "avg_wps": 4453.054366147088, "eta_in_seconds": 3502.6673194415694, "at": "2024-05-25T22:51:32.341856"}
{"lr": 2.9900912388592177e-05, "step": 263, "loss": 1.7521350383758545, "percent_done": 52.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5531.126768482994, "avg_wps": 4456.356985652556, "eta_in_seconds": 3485.365299504973, "at": "2024-05-25T22:51:44.191626"}
{"lr": 2.9702501505438846e-05, "step": 264, "loss": 1.538033366203308, "percent_done": 52.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13849115371704, "wps": 5525.8686004459205, "avg_wps": 4459.626471859686, "eta_in_seconds": 3468.1146722923627, "at": "2024-05-25T22:51:56.052683"}
{"lr": 2.9504103641082615e-05, "step": 265, "loss": 1.256603717803955, "percent_done": 53.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5532.640501648141, "avg_wps": 4462.89267745163, "eta_in_seconds": 3450.891857160712, "at": "2024-05-25T22:52:07.899351"}
{"lr": 2.93057274740888e-05, "step": 266, "loss": 1.1758630275726318, "percent_done": 53.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5506.620163418131, "avg_wps": 4466.075015979773, "eta_in_seconds": 3433.75871321671, "at": "2024-05-25T22:52:19.801851"}
{"lr": 2.9107381682073582e-05, "step": 267, "loss": 1.818198800086975, "percent_done": 53.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5527.10704803808, "avg_wps": 4469.288363781493, "eta_in_seconds": 3416.6262628621375, "at": "2024-05-25T22:52:31.660121"}
{"lr": 2.8909074941324465e-05, "step": 268, "loss": 1.5012140274047852, "percent_done": 53.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5508.707763393108, "avg_wps": 4472.437203406224, "eta_in_seconds": 3399.567463668425, "at": "2024-05-25T22:52:43.558114"}
{"lr": 2.8710815926420708e-05, "step": 269, "loss": 1.3686946630477905, "percent_done": 53.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1384916305542, "wps": 5518.555802222994, "avg_wps": 4475.591144741124, "eta_in_seconds": 3382.528812487329, "at": "2024-05-25T22:52:55.434835"}
{"lr": 2.851261330985389e-05, "step": 270, "loss": 1.3505845069885254, "percent_done": 54.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1414213180542, "wps": 5519.38221771944, "avg_wps": 4478.728141323957, "eta_in_seconds": 3365.5268916465616, "at": "2024-05-25T22:53:07.309876"}
{"lr": 2.8314475761648556e-05, "step": 271, "loss": 1.2980961799621582, "percent_done": 54.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13862705230713, "wps": 5517.019203439364, "avg_wps": 4481.840586670939, "eta_in_seconds": 3348.567114286317, "at": "2024-05-25T22:53:19.189873"}
{"lr": 2.811641194898294e-05, "step": 272, "loss": 1.1465059518814087, "percent_done": 54.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139700889587402, "wps": 5535.403025114344, "avg_wps": 4484.9789450574035, "eta_in_seconds": 3331.6116269546396, "at": "2024-05-25T22:53:31.030440"}
{"lr": 2.7918430535809843e-05, "step": 273, "loss": 1.430358648300171, "percent_done": 54.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5534.783320362093, "avg_wps": 4488.097169410093, "eta_in_seconds": 3314.6947221633714, "at": "2024-05-25T22:53:42.872491"}
{"lr": 2.772054018247765e-05, "step": 274, "loss": 1.3976505994796753, "percent_done": 54.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5531.3996846627415, "avg_wps": 4491.188788370687, "eta_in_seconds": 3297.820843860181, "at": "2024-05-25T22:53:54.746479"}
{"lr": 2.7522749545351488e-05, "step": 275, "loss": 1.4968034029006958, "percent_done": 55.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13971185684204, "wps": 5516.209767995939, "avg_wps": 4494.2255741311355, "eta_in_seconds": 3281.010211164301, "at": "2024-05-25T22:54:06.628320"}
{"lr": 2.7325067276434586e-05, "step": 276, "loss": 1.3039748668670654, "percent_done": 55.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5521.563467348104, "avg_wps": 4497.257299739244, "eta_in_seconds": 3264.225954083429, "at": "2024-05-25T22:54:18.498509"}
{"lr": 2.7127502022989765e-05, "step": 277, "loss": 1.4881929159164429, "percent_done": 55.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5527.085932222587, "avg_wps": 4500.284414865999, "eta_in_seconds": 3247.4676382059656, "at": "2024-05-25T22:54:30.356878"}
{"lr": 2.693006242716126e-05, "step": 278, "loss": 1.4972293376922607, "percent_done": 55.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5530.62141040813, "avg_wps": 4503.302223255821, "eta_in_seconds": 3230.738528910301, "at": "2024-05-25T22:54:42.207725"}
{"lr": 2.6732757125596597e-05, "step": 279, "loss": 1.898256540298462, "percent_done": 55.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13971185684204, "wps": 5531.435526390087, "avg_wps": 4506.304342153716, "eta_in_seconds": 3214.043016250843, "at": "2024-05-25T22:54:54.056755"}
{"lr": 2.653559474906885e-05, "step": 280, "loss": 1.4742891788482666, "percent_done": 56.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139620780944824, "wps": 5527.689352432536, "avg_wps": 4509.280082486838, "eta_in_seconds": 3197.388438122613, "at": "2024-05-25T22:55:05.913967"}
{"lr": 2.6338583922099093e-05, "step": 281, "loss": 1.401398777961731, "percent_done": 56.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13962173461914, "wps": 5526.032346794623, "avg_wps": 4512.2346034606035, "eta_in_seconds": 3180.7707846113794, "at": "2024-05-25T22:55:17.774548"}
{"lr": 2.6141733262579107e-05, "step": 282, "loss": 1.512309193611145, "percent_done": 56.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13897943496704, "wps": 5514.92718144086, "avg_wps": 4515.145660230392, "eta_in_seconds": 3164.2053380113966, "at": "2024-05-25T22:55:29.659065"}
{"lr": 2.5945051381394456e-05, "step": 283, "loss": 1.4032942056655884, "percent_done": 56.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5526.4626437996, "avg_wps": 4518.06716304446, "eta_in_seconds": 3147.6539605969674, "at": "2024-05-25T22:55:41.518790"}
{"lr": 2.574854688204777e-05, "step": 284, "loss": 1.499544620513916, "percent_done": 56.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1411771774292, "wps": 5533.669315404924, "avg_wps": 4520.988794962859, "eta_in_seconds": 3131.1238850606996, "at": "2024-05-25T22:55:53.363059"}
{"lr": 2.555222836028246e-05, "step": 285, "loss": 1.3525288105010986, "percent_done": 57.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5532.152347152449, "avg_wps": 4523.890107148779, "eta_in_seconds": 3114.629150194034, "at": "2024-05-25T22:56:05.210709"}
{"lr": 2.5356104403706647e-05, "step": 286, "loss": 1.1315374374389648, "percent_done": 57.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5544.867167346487, "avg_wps": 4526.804516454784, "eta_in_seconds": 3098.146595246308, "at": "2024-05-25T22:56:17.030982"}
{"lr": 2.5160183591417547e-05, "step": 287, "loss": 1.4872703552246094, "percent_done": 57.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14044427871704, "wps": 5532.0106158739645, "avg_wps": 4529.672370232537, "eta_in_seconds": 3081.7169232227243, "at": "2024-05-25T22:56:28.878790"}
{"lr": 2.4964474493626167e-05, "step": 288, "loss": 1.560407042503357, "percent_done": 57.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5526.816219656265, "avg_wps": 4532.51178767463, "eta_in_seconds": 3065.32727345162, "at": "2024-05-25T22:56:40.737731"}
{"lr": 2.4768985671282466e-05, "step": 289, "loss": 1.445494532585144, "percent_done": 57.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5533.251372845789, "avg_wps": 4535.350057298082, "eta_in_seconds": 3048.958917239133, "at": "2024-05-25T22:56:52.583051"}
{"lr": 2.457372567570083e-05, "step": 290, "loss": 1.3846065998077393, "percent_done": 58.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5537.491649158071, "avg_wps": 4538.18210082149, "eta_in_seconds": 3032.615195742969, "at": "2024-05-25T22:57:04.419083"}
{"lr": 2.4378703048186006e-05, "step": 291, "loss": 1.8785253763198853, "percent_done": 58.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5532.5514159347595, "avg_wps": 4540.986756178741, "eta_in_seconds": 3016.3100522949117, "at": "2024-05-25T22:57:16.265721"}
{"lr": 2.4183926319659536e-05, "step": 292, "loss": 1.461996078491211, "percent_done": 58.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14020013809204, "wps": 5512.864386334081, "avg_wps": 4543.7299970438635, "eta_in_seconds": 3000.065586834738, "at": "2024-05-25T22:57:28.154768"}
{"lr": 2.3989404010286496e-05, "step": 293, "loss": 1.5814299583435059, "percent_done": 58.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5528.897033042693, "avg_wps": 4546.494903598449, "eta_in_seconds": 2983.826505394926, "at": "2024-05-25T22:57:40.009228"}
{"lr": 2.379514462910286e-05, "step": 294, "loss": 1.5236884355545044, "percent_done": 58.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13971185684204, "wps": 5527.577194556655, "avg_wps": 4549.241293935507, "eta_in_seconds": 2967.6192419155927, "at": "2024-05-25T22:57:51.866663"}
{"lr": 2.3601156673643287e-05, "step": 295, "loss": 1.4485158920288086, "percent_done": 59.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5532.5411712616515, "avg_wps": 4551.983752141016, "eta_in_seconds": 2951.434084904396, "at": "2024-05-25T22:58:03.713288"}
{"lr": 2.340744862956937e-05, "step": 296, "loss": 1.3660223484039307, "percent_done": 59.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5534.305038849152, "avg_wps": 4554.714992730175, "eta_in_seconds": 2935.275647617675, "at": "2024-05-25T22:58:15.556179"}
{"lr": 2.3214028970298496e-05, "step": 297, "loss": 1.129741907119751, "percent_done": 59.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.140511512756348, "wps": 5518.5887078431715, "avg_wps": 4557.395101013946, "eta_in_seconds": 2919.169329216183, "at": "2024-05-25T22:58:27.432813"}
{"lr": 2.3020906156633134e-05, "step": 298, "loss": 1.5862302780151367, "percent_done": 59.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14044427871704, "wps": 5533.277436713865, "avg_wps": 4560.093912398799, "eta_in_seconds": 2903.07003634408, "at": "2024-05-25T22:58:39.277966"}
{"lr": 2.2828088636390805e-05, "step": 299, "loss": 1.3507128953933716, "percent_done": 59.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1414213180542, "wps": 5517.752007677699, "avg_wps": 4562.742431270372, "eta_in_seconds": 2887.02161001282, "at": "2024-05-25T22:58:51.156507"}
{"lr": 2.2635584844034485e-05, "step": 300, "loss": 1.279242753982544, "percent_done": 60.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5522.372588765262, "avg_wps": 4565.386876121166, "eta_in_seconds": 2870.9943660100303, "at": "2024-05-25T22:59:03.024962"}
{"lr": 2.244340320030367e-05, "step": 301, "loss": 1.6162009239196777, "percent_done": 60.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5596.0634045652, "avg_wps": 4568.182100476005, "eta_in_seconds": 2854.891445470411, "at": "2024-05-25T22:59:29.055705"}
{"lr": 2.225155211184604e-05, "step": 302, "loss": 1.3532904386520386, "percent_done": 60.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13971185684204, "wps": 5549.411170931847, "avg_wps": 4570.8582742782555, "eta_in_seconds": 2838.8821576510045, "at": "2024-05-25T22:59:40.866360"}
{"lr": 2.2060039970849715e-05, "step": 303, "loss": 1.305881142616272, "percent_done": 60.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1384916305542, "wps": 5544.700065993084, "avg_wps": 4573.509320437121, "eta_in_seconds": 2822.907114741826, "at": "2024-05-25T22:59:52.687165"}
{"lr": 2.186887515467616e-05, "step": 304, "loss": 1.4735749959945679, "percent_done": 60.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139169692993164, "wps": 5538.719688114189, "avg_wps": 4576.132557891767, "eta_in_seconds": 2806.9676386117935, "at": "2024-05-25T23:00:04.520603"}
{"lr": 2.167806602549372e-05, "step": 305, "loss": 1.7670332193374634, "percent_done": 61.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139360904693604, "wps": 5532.913010383309, "avg_wps": 4578.728550846804, "eta_in_seconds": 2791.063033784022, "at": "2024-05-25T23:00:16.366505"}
{"lr": 2.148762092991183e-05, "step": 306, "loss": 1.459661841392517, "percent_done": 61.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13961887359619, "wps": 5536.567799009618, "avg_wps": 4581.318677984091, "eta_in_seconds": 2775.1800068172756, "at": "2024-05-25T23:00:28.204548"}
{"lr": 2.129754819861595e-05, "step": 307, "loss": 1.5853192806243896, "percent_done": 61.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5528.797503413538, "avg_wps": 4583.877460962019, "eta_in_seconds": 2759.3337971441906, "at": "2024-05-25T23:00:40.059221"}
{"lr": 2.1107856146003084e-05, "step": 308, "loss": 1.692198634147644, "percent_done": 61.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13971185684204, "wps": 5531.496302554545, "avg_wps": 4586.428487465176, "eta_in_seconds": 2743.5099085027523, "at": "2024-05-25T23:00:51.908251"}
{"lr": 2.0918553069818132e-05, "step": 309, "loss": 1.3194557428359985, "percent_done": 61.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5528.914381590603, "avg_wps": 4588.96006243418, "eta_in_seconds": 2727.7151750499766, "at": "2024-05-25T23:01:03.762668"}
{"lr": 2.0729647250790905e-05, "step": 310, "loss": 1.5714393854141235, "percent_done": 62.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13873529434204, "wps": 5520.829983091125, "avg_wps": 4591.460062602073, "eta_in_seconds": 2711.9565084365104, "at": "2024-05-25T23:01:15.634504"}
{"lr": 2.0541146952273892e-05, "step": 311, "loss": 1.3738967180252075, "percent_done": 62.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139092445373535, "wps": 5538.4990562134735, "avg_wps": 4593.9858979910505, "eta_in_seconds": 2696.199830612569, "at": "2024-05-25T23:01:27.468432"}
{"lr": 2.0353060419880816e-05, "step": 312, "loss": 1.5305222272872925, "percent_done": 62.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5536.386701186902, "avg_wps": 4596.493631016975, "eta_in_seconds": 2680.471026188288, "at": "2024-05-25T23:01:39.306881"}
{"lr": 2.01653958811259e-05, "step": 313, "loss": 1.6897908449172974, "percent_done": 62.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13897943496704, "wps": 5529.008132358318, "avg_wps": 4598.971764930777, "eta_in_seconds": 2664.7765253641355, "at": "2024-05-25T23:01:51.161305"}
{"lr": 1.997816154506404e-05, "step": 314, "loss": 1.4919114112854004, "percent_done": 62.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5529.193085366338, "avg_wps": 4601.43717054892, "eta_in_seconds": 2649.1062570666054, "at": "2024-05-25T23:02:03.015069"}
{"lr": 1.979136560193164e-05, "step": 315, "loss": 1.362998127937317, "percent_done": 63.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5534.578825955238, "avg_wps": 4603.901384762293, "eta_in_seconds": 2633.4534532229104, "at": "2024-05-25T23:02:14.857367"}
{"lr": 1.9605016222788395e-05, "step": 316, "loss": 1.5362869501113892, "percent_done": 63.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5525.791396409157, "avg_wps": 4606.333325022306, "eta_in_seconds": 2617.8357381337805, "at": "2024-05-25T23:02:26.718549"}
{"lr": 1.9419121559159824e-05, "step": 317, "loss": 0.9179596900939941, "percent_done": 63.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5531.0191454039505, "avg_wps": 4608.763929184131, "eta_in_seconds": 2602.235259666052, "at": "2024-05-25T23:02:38.568435"}
{"lr": 1.9233689742680746e-05, "step": 318, "loss": 1.6024270057678223, "percent_done": 63.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13916778564453, "wps": 5538.60161382314, "avg_wps": 4611.198339043205, "eta_in_seconds": 2586.6490927117425, "at": "2024-05-25T23:02:50.402344"}
{"lr": 1.9048728884739516e-05, "step": 319, "loss": 1.501809000968933, "percent_done": 63.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5530.255776156526, "avg_wps": 4613.601854202438, "eta_in_seconds": 2571.09659109295, "at": "2024-05-25T23:03:02.253864"}
{"lr": 1.886424707612324e-05, "step": 320, "loss": 1.1742545366287231, "percent_done": 64.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1384916305542, "wps": 5541.663239100619, "avg_wps": 4616.017615678441, "eta_in_seconds": 2555.5535056740046, "at": "2024-05-25T23:03:14.081117"}
{"lr": 1.86802523866639e-05, "step": 321, "loss": 1.3116861581802368, "percent_done": 64.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139100551605225, "wps": 5535.098393909138, "avg_wps": 4618.4066119485515, "eta_in_seconds": 2540.0414007831587, "at": "2024-05-25T23:03:25.922345"}
{"lr": 1.8496752864885245e-05, "step": 322, "loss": 1.5555421113967896, "percent_done": 64.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5531.708918326537, "avg_wps": 4620.7758803812885, "eta_in_seconds": 2524.556113947993, "at": "2024-05-25T23:03:37.771006"}
{"lr": 1.831375653765083e-05, "step": 323, "loss": 1.3761317729949951, "percent_done": 64.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5539.595246617048, "avg_wps": 4623.149917805754, "eta_in_seconds": 2509.084110667462, "at": "2024-05-25T23:03:49.602566"}
{"lr": 1.813127140981282e-05, "step": 324, "loss": 1.3383431434631348, "percent_done": 64.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5531.276023138408, "avg_wps": 4625.493789967782, "eta_in_seconds": 2493.644251564403, "at": "2024-05-25T23:04:01.451921"}
{"lr": 1.794930546386188e-05, "step": 325, "loss": 1.469743013381958, "percent_done": 65.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.140552043914795, "wps": 5536.761287914303, "avg_wps": 4627.837397100857, "eta_in_seconds": 2478.2201741108524, "at": "2024-05-25T23:04:13.289520"}
{"lr": 1.7767866659577976e-05, "step": 326, "loss": 1.0628798007965088, "percent_done": 65.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.138704299926758, "wps": 5531.573888719816, "avg_wps": 4630.157842197907, "eta_in_seconds": 2462.8240307649953, "at": "2024-05-25T23:04:25.138260"}
{"lr": 1.758696293368218e-05, "step": 327, "loss": 1.1498101949691772, "percent_done": 65.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5545.600563860817, "avg_wps": 4632.496409804798, "eta_in_seconds": 2447.4337370242547, "at": "2024-05-25T23:04:36.957089"}
{"lr": 1.740660219948953e-05, "step": 328, "loss": 1.3323389291763306, "percent_done": 65.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5542.183691117202, "avg_wps": 4634.815778759825, "eta_in_seconds": 2432.0690482796695, "at": "2024-05-25T23:04:48.783043"}
{"lr": 1.7226792346562806e-05, "step": 329, "loss": 0.9280859231948853, "percent_done": 65.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1399564743042, "wps": 5529.7981894762115, "avg_wps": 4637.096937432788, "eta_in_seconds": 2416.739643619416, "at": "2024-05-25T23:05:00.635547"}
{"lr": 1.7047541240367497e-05, "step": 330, "loss": 1.5664188861846924, "percent_done": 66.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5541.807699985924, "avg_wps": 4639.392057656485, "eta_in_seconds": 2401.4180870128403, "at": "2024-05-25T23:05:12.462379"}
{"lr": 1.6868856721927658e-05, "step": 331, "loss": 1.3574612140655518, "percent_done": 66.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5522.906179539739, "avg_wps": 4641.6353654054765, "eta_in_seconds": 2386.1383172291644, "at": "2024-05-25T23:05:24.329689"}
{"lr": 1.669074660748301e-05, "step": 332, "loss": 1.5006729364395142, "percent_done": 66.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.140617847442627, "wps": 5521.832556545177, "avg_wps": 4643.865023388572, "eta_in_seconds": 2370.880278506911, "at": "2024-05-25T23:05:36.199372"}
{"lr": 1.6513218688146936e-05, "step": 333, "loss": 1.2552119493484497, "percent_done": 66.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5535.35431307931, "avg_wps": 4646.112091076746, "eta_in_seconds": 2355.6280574934617, "at": "2024-05-25T23:05:48.039929"}
{"lr": 1.6336280729565724e-05, "step": 334, "loss": 1.4726775884628296, "percent_done": 66.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5531.309525849591, "avg_wps": 4648.33931324541, "eta_in_seconds": 2340.4005746741495, "at": "2024-05-25T23:05:59.889218"}
{"lr": 1.6159940471578926e-05, "step": 335, "loss": 1.24460768699646, "percent_done": 67.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.138813495635986, "wps": 5530.559095614715, "avg_wps": 4650.553772113003, "eta_in_seconds": 2325.1940585748475, "at": "2024-05-25T23:06:11.740111"}
{"lr": 1.598420562788065e-05, "step": 336, "loss": 1.1442080736160278, "percent_done": 67.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5534.7047526034785, "avg_wps": 4652.76586773327, "eta_in_seconds": 2310.003190690563, "at": "2024-05-25T23:06:23.582104"}
{"lr": 1.5809083885682293e-05, "step": 337, "loss": 1.2265191078186035, "percent_done": 67.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5528.203625111734, "avg_wps": 4654.953259967956, "eta_in_seconds": 2294.838938957152, "at": "2024-05-25T23:06:35.438183"}
{"lr": 1.5634582905376138e-05, "step": 338, "loss": 1.097861409187317, "percent_done": 67.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.138688564300537, "wps": 5533.373674661561, "avg_wps": 4657.140593795531, "eta_in_seconds": 2279.688960677773, "at": "2024-05-25T23:06:47.283064"}
{"lr": 1.546071032020041e-05, "step": 339, "loss": 1.5978518724441528, "percent_done": 67.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14020013809204, "wps": 5522.545004202414, "avg_wps": 4659.294368598296, "eta_in_seconds": 2264.5695174598413, "at": "2024-05-25T23:06:59.151214"}
{"lr": 1.5287473735905225e-05, "step": 340, "loss": 1.364516258239746, "percent_done": 68.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5530.858108143184, "avg_wps": 4661.454843378572, "eta_in_seconds": 2249.460812624763, "at": "2024-05-25T23:07:11.001606"}
{"lr": 1.5114880730419973e-05, "step": 341, "loss": 1.7650222778320312, "percent_done": 68.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.140679836273193, "wps": 5537.121648253804, "avg_wps": 4663.6176783473375, "eta_in_seconds": 2234.364975581071, "at": "2024-05-25T23:07:22.838743"}
{"lr": 1.4942938853521888e-05, "step": 342, "loss": 1.610933542251587, "percent_done": 68.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139131546020508, "wps": 5538.157038975037, "avg_wps": 4665.772004735956, "eta_in_seconds": 2219.2871810901934, "at": "2024-05-25T23:07:34.673395"}
{"lr": 1.4771655626505637e-05, "step": 343, "loss": 1.2632454633712769, "percent_done": 68.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5533.930338745834, "avg_wps": 4667.906982341584, "eta_in_seconds": 2204.2324405613167, "at": "2024-05-25T23:07:46.517174"}
{"lr": 1.4601038541854481e-05, "step": 344, "loss": 1.2216689586639404, "percent_done": 68.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5536.899136097767, "avg_wps": 4670.037627758494, "eta_in_seconds": 2189.1934958363686, "at": "2024-05-25T23:07:58.354608"}
{"lr": 1.4431095062912406e-05, "step": 345, "loss": 1.3331900835037231, "percent_done": 69.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5540.763237562274, "avg_wps": 4672.165820111177, "eta_in_seconds": 2174.1694090297256, "at": "2024-05-25T23:08:10.183720"}
{"lr": 1.426183262355772e-05, "step": 346, "loss": 1.6556040048599243, "percent_done": 69.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13903045654297, "wps": 5530.2705741695045, "avg_wps": 4674.2620112551, "eta_in_seconds": 2159.173785230328, "at": "2024-05-25T23:08:22.035434"}
{"lr": 1.4093258627877864e-05, "step": 347, "loss": 1.0908232927322388, "percent_done": 69.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5531.034949151135, "avg_wps": 4676.349560986865, "eta_in_seconds": 2144.1955673399166, "at": "2024-05-25T23:08:33.885303"}
{"lr": 1.392538044984549e-05, "step": 348, "loss": 1.2147232294082642, "percent_done": 69.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1409330368042, "wps": 2773.92066582999, "avg_wps": 4667.151695151093, "eta_in_seconds": 2134.37930683706, "at": "2024-05-25T23:08:57.512262"}
{"lr": 1.3758205432995999e-05, "step": 349, "loss": 1.4657495021820068, "percent_done": 69.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5554.656676722703, "avg_wps": 4669.289356670141, "eta_in_seconds": 2119.3666196470617, "at": "2024-05-25T23:09:09.311908"}
{"lr": 1.3591740890106174e-05, "step": 350, "loss": 1.326554298400879, "percent_done": 70.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13971185684204, "wps": 5523.354524317463, "avg_wps": 4671.353133559756, "eta_in_seconds": 2104.400955983571, "at": "2024-05-25T23:09:21.178377"}
{"lr": 1.342599410287438e-05, "step": 351, "loss": 1.2489190101623535, "percent_done": 70.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5540.562209772346, "avg_wps": 4673.441949404009, "eta_in_seconds": 2089.437315305753, "at": "2024-05-25T23:09:33.007968"}
{"lr": 1.3260972321602061e-05, "step": 352, "loss": 1.0407387018203735, "percent_done": 70.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.141040325164795, "wps": 5523.735119611841, "avg_wps": 4675.486604219299, "eta_in_seconds": 2074.5066387843003, "at": "2024-05-25T23:09:44.873582"}
{"lr": 1.3096682764876501e-05, "step": 353, "loss": 1.242996096611023, "percent_done": 70.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1384916305542, "wps": 5532.060271096363, "avg_wps": 4677.538335435427, "eta_in_seconds": 2059.5858994928362, "at": "2024-05-25T23:09:56.721371"}
{"lr": 1.2933132619255162e-05, "step": 354, "loss": 1.3015520572662354, "percent_done": 70.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5528.803730860661, "avg_wps": 4679.573674806064, "eta_in_seconds": 2044.6854061757106, "at": "2024-05-25T23:10:08.576109"}
{"lr": 1.2770329038951215e-05, "step": 355, "loss": 1.1245949268341064, "percent_done": 71.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5540.074889612845, "avg_wps": 4681.622023299127, "eta_in_seconds": 2029.792228571126, "at": "2024-05-25T23:10:20.406772"}
{"lr": 1.2608279145520686e-05, "step": 356, "loss": 1.2131990194320679, "percent_done": 71.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5537.3947101643935, "avg_wps": 4683.655259638721, "eta_in_seconds": 2014.918578940831, "at": "2024-05-25T23:10:32.243198"}
{"lr": 1.2446990027550896e-05, "step": 357, "loss": 1.1643948554992676, "percent_done": 71.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5543.629134033885, "avg_wps": 4685.691347669286, "eta_in_seconds": 2000.0566201744293, "at": "2024-05-25T23:10:44.066282"}
{"lr": 1.2286468740350344e-05, "step": 358, "loss": 1.3531920909881592, "percent_done": 71.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14020013809204, "wps": 5526.955684548774, "avg_wps": 4687.684414382027, "eta_in_seconds": 1985.225791106677, "at": "2024-05-25T23:10:55.925040"}
{"lr": 1.2126722305640172e-05, "step": 359, "loss": 1.5578019618988037, "percent_done": 71.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5545.045912070976, "avg_wps": 4689.704221201127, "eta_in_seconds": 1970.3963329340422, "at": "2024-05-25T23:11:07.745087"}
{"lr": 1.1967757711246922e-05, "step": 360, "loss": 1.34718918800354, "percent_done": 72.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5539.455143120374, "avg_wps": 4691.703404629848, "eta_in_seconds": 1955.5882392194535, "at": "2024-05-25T23:11:19.577055"}
{"lr": 1.1809581910796943e-05, "step": 361, "loss": 1.3180506229400635, "percent_done": 72.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139734745025635, "wps": 5527.031031857379, "avg_wps": 4693.668438987415, "eta_in_seconds": 1940.8068802502016, "at": "2024-05-25T23:11:31.435613"}
{"lr": 1.1652201823412147e-05, "step": 362, "loss": 1.455444574356079, "percent_done": 72.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13906764984131, "wps": 5529.942922418844, "avg_wps": 4695.630052750505, "eta_in_seconds": 1926.0392957708455, "at": "2024-05-25T23:11:43.287896"}
{"lr": 1.1495624333407409e-05, "step": 363, "loss": 1.326683759689331, "percent_done": 72.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5538.070788116307, "avg_wps": 4697.598619463122, "eta_in_seconds": 1911.2812156407958, "at": "2024-05-25T23:11:55.122857"}
{"lr": 1.133985628998939e-05, "step": 364, "loss": 1.1185904741287231, "percent_done": 72.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13995599746704, "wps": 5531.728622291043, "avg_wps": 4699.545446399584, "eta_in_seconds": 1896.5442725590297, "at": "2024-05-25T23:12:06.971428"}
{"lr": 1.1184904506956906e-05, "step": 365, "loss": 1.4800939559936523, "percent_done": 73.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5534.16809974351, "avg_wps": 4701.488032567433, "eta_in_seconds": 1881.8212316428146, "at": "2024-05-25T23:12:18.814623"}
{"lr": 1.1030775762402946e-05, "step": 366, "loss": 1.575332522392273, "percent_done": 73.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139241695404053, "wps": 5538.445602773564, "avg_wps": 4703.4300322287345, "eta_in_seconds": 1867.110585216616, "at": "2024-05-25T23:12:30.648620"}
{"lr": 1.0877476798418077e-05, "step": 367, "loss": 1.0277793407440186, "percent_done": 73.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14020013809204, "wps": 5535.981169787024, "avg_wps": 4705.358191652899, "eta_in_seconds": 1852.4175301812977, "at": "2024-05-25T23:12:42.488063"}
{"lr": 1.0725014320795634e-05, "step": 368, "loss": 1.2328702211380005, "percent_done": 73.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5536.696492717369, "avg_wps": 4707.278845847564, "eta_in_seconds": 1837.7394421048787, "at": "2024-05-25T23:12:54.325961"}
{"lr": 1.0573394998738269e-05, "step": 369, "loss": 1.4363727569580078, "percent_done": 73.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5543.91592029221, "avg_wps": 4709.2047810923605, "eta_in_seconds": 1823.071282537972, "at": "2024-05-25T23:13:06.148393"}
{"lr": 1.0422625464566322e-05, "step": 370, "loss": 1.3193644285202026, "percent_done": 74.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5538.419267011386, "avg_wps": 4711.111131255367, "eta_in_seconds": 1808.4226337767936, "at": "2024-05-25T23:13:17.982601"}
{"lr": 1.0272712313427651e-05, "step": 371, "loss": 1.3883593082427979, "percent_done": 74.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5545.943724907959, "avg_wps": 4713.02340307365, "eta_in_seconds": 1793.7835815724015, "at": "2024-05-25T23:13:29.800728"}
{"lr": 1.0123662103009122e-05, "step": 372, "loss": 1.3066599369049072, "percent_done": 74.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5540.765806345092, "avg_wps": 4714.916864705352, "eta_in_seconds": 1779.1635018625568, "at": "2024-05-25T23:13:41.654050"}
{"lr": 9.97548135324981e-06, "step": 373, "loss": 1.5044260025024414, "percent_done": 74.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5537.0922020094395, "avg_wps": 4716.794541405861, "eta_in_seconds": 1764.561065133711, "at": "2024-05-25T23:13:53.491167"}
{"lr": 9.828176546055728e-06, "step": 374, "loss": 1.1372315883636475, "percent_done": 74.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5532.241976728904, "avg_wps": 4718.654234834191, "eta_in_seconds": 1749.9769190632724, "at": "2024-05-25T23:14:05.338589"}
{"lr": 9.681754125016368e-06, "step": 375, "loss": 1.3641146421432495, "percent_done": 75.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13897943496704, "wps": 5536.0754948569775, "avg_wps": 4720.512902938775, "eta_in_seconds": 1735.4046410719554, "at": "2024-05-25T23:14:17.177809"}
{"lr": 9.536220495122747e-06, "step": 376, "loss": 1.6401150226593018, "percent_done": 75.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14116334915161, "wps": 5530.04416210854, "avg_wps": 4722.351453104716, "eta_in_seconds": 1720.8511650815924, "at": "2024-05-25T23:14:29.029913"}
{"lr": 9.391582022487311e-06, "step": 377, "loss": 1.5790910720825195, "percent_done": 75.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1399564743042, "wps": 5525.936141861639, "avg_wps": 4724.17371292723, "eta_in_seconds": 1706.3149007290049, "at": "2024-05-25T23:14:40.890834"}
{"lr": 9.247845034065422e-06, "step": 378, "loss": 1.289422869682312, "percent_done": 75.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5535.396894261858, "avg_wps": 4726.006002270691, "eta_in_seconds": 1691.7862559121752, "at": "2024-05-25T23:14:52.731475"}
{"lr": 9.105015817378586e-06, "step": 379, "loss": 1.0527746677398682, "percent_done": 75.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1411771774292, "wps": 5541.28396736375, "avg_wps": 4727.841352638085, "eta_in_seconds": 1677.2677864021866, "at": "2024-05-25T23:15:04.559570"}
{"lr": 8.963100620239454e-06, "step": 380, "loss": 1.3100308179855347, "percent_done": 76.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1399564743042, "wps": 5539.69002981415, "avg_wps": 4729.665401399196, "eta_in_seconds": 1662.7645578635365, "at": "2024-05-25T23:15:16.391059"}
{"lr": 8.82210565047849e-06, "step": 381, "loss": 0.956969141960144, "percent_done": 76.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13971185684204, "wps": 5503.388318396743, "avg_wps": 4731.41130809534, "eta_in_seconds": 1648.2997338778077, "at": "2024-05-25T23:15:28.300572"}
{"lr": 8.682037075672413e-06, "step": 382, "loss": 1.262111783027649, "percent_done": 76.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139315605163574, "wps": 5537.823543105449, "avg_wps": 4733.2156171182, "eta_in_seconds": 1633.8254213545335, "at": "2024-05-25T23:15:40.136043"}
{"lr": 8.542901022874465e-06, "step": 383, "loss": 1.507392406463623, "percent_done": 76.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13897943496704, "wps": 5533.710422440849, "avg_wps": 4735.004013022269, "eta_in_seconds": 1619.367582141886, "at": "2024-05-25T23:15:51.980308"}
{"lr": 8.404703578346311e-06, "step": 384, "loss": 1.2510004043579102, "percent_done": 76.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13886070251465, "wps": 5541.021244600094, "avg_wps": 4736.7983672624005, "eta_in_seconds": 1604.918641363581, "at": "2024-05-25T23:16:03.808950"}
{"lr": 8.267450787291907e-06, "step": 385, "loss": 1.2303383350372314, "percent_done": 77.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13960361480713, "wps": 5543.237296688104, "avg_wps": 4738.588957954422, "eta_in_seconds": 1590.4819065069223, "at": "2024-05-25T23:16:15.632869"}
{"lr": 8.13114865359295e-06, "step": 386, "loss": 1.358881950378418, "percent_done": 77.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5532.4391720205385, "avg_wps": 4740.3511170865595, "eta_in_seconds": 1576.0655308992752, "at": "2024-05-25T23:16:27.479870"}
{"lr": 7.995803139546319e-06, "step": 387, "loss": 1.0685631036758423, "percent_done": 77.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13971185684204, "wps": 5527.543292427566, "avg_wps": 4742.096167620122, "eta_in_seconds": 1561.6655036577574, "at": "2024-05-25T23:16:39.337358"}
{"lr": 7.861420165603275e-06, "step": 388, "loss": 1.5114823579788208, "percent_done": 77.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5533.721451261711, "avg_wps": 4743.845213277877, "eta_in_seconds": 1547.2747676200474, "at": "2024-05-25T23:16:51.181609"}
{"lr": 7.728005610110419e-06, "step": 389, "loss": 1.5361900329589844, "percent_done": 77.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.138672351837158, "wps": 5526.620313930428, "avg_wps": 4745.573104667124, "eta_in_seconds": 1532.901472499867, "at": "2024-05-25T23:17:03.041078"}
{"lr": 7.59556530905263e-06, "step": 390, "loss": 1.2640721797943115, "percent_done": 78.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5539.087447013987, "avg_wps": 4747.316918736619, "eta_in_seconds": 1518.5335471385565, "at": "2024-05-25T23:17:14.873840"}
{"lr": 7.464105055797707e-06, "step": 391, "loss": 1.4845365285873413, "percent_done": 78.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5536.607276339293, "avg_wps": 4749.048420420794, "eta_in_seconds": 1504.1800730612576, "at": "2024-05-25T23:17:26.711932"}
{"lr": 7.333630600843008e-06, "step": 392, "loss": 1.7893493175506592, "percent_done": 78.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1409330368042, "wps": 5532.606871454251, "avg_wps": 4750.76482258026, "eta_in_seconds": 1489.8417969163584, "at": "2024-05-25T23:17:38.558612"}
{"lr": 7.204147651563878e-06, "step": 393, "loss": 1.3601292371749878, "percent_done": 78.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5540.7104105133685, "avg_wps": 4752.488913989457, "eta_in_seconds": 1475.5114902758417, "at": "2024-05-25T23:17:50.387926"}
{"lr": 7.07566187196397e-06, "step": 394, "loss": 1.21010422706604, "percent_done": 78.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139430046081543, "wps": 5538.579628901459, "avg_wps": 4754.201512754854, "eta_in_seconds": 1461.195109496867, "at": "2024-05-25T23:18:02.221782"}
{"lr": 6.948178882427538e-06, "step": 395, "loss": 1.1674048900604248, "percent_done": 79.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.138875007629395, "wps": 5536.00870880737, "avg_wps": 4755.901864172482, "eta_in_seconds": 1446.8927653529977, "at": "2024-05-25T23:18:14.061123"}
{"lr": 6.821704259473511e-06, "step": 396, "loss": 1.3634860515594482, "percent_done": 79.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1392240524292, "wps": 5536.0610002518715, "avg_wps": 4757.594932981414, "eta_in_seconds": 1432.6028373602664, "at": "2024-05-25T23:18:25.900347"}
{"lr": 6.696243535511637e-06, "step": 397, "loss": 1.4827200174331665, "percent_done": 79.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.141201972961426, "wps": 5531.078354273538, "avg_wps": 4759.271385130908, "eta_in_seconds": 1418.328028338382, "at": "2024-05-25T23:18:37.750253"}
{"lr": 6.571802198600406e-06, "step": 398, "loss": 1.3379186391830444, "percent_done": 79.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139405250549316, "wps": 5542.215649922379, "avg_wps": 4760.96127734087, "eta_in_seconds": 1404.0593087397629, "at": "2024-05-25T23:18:49.576350"}
{"lr": 6.4483856922070286e-06, "step": 399, "loss": 1.2363020181655884, "percent_done": 79.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5530.771861911462, "avg_wps": 4762.622666653308, "eta_in_seconds": 1389.809032394175, "at": "2024-05-25T23:19:01.426902"}
{"lr": 6.325999414969323e-06, "step": 400, "loss": 1.4237030744552612, "percent_done": 80.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13873529434204, "wps": 5538.081053278184, "avg_wps": 4764.290441530409, "eta_in_seconds": 1375.5668510198593, "at": "2024-05-25T23:19:13.261812"}
{"lr": 6.2046487204595115e-06, "step": 401, "loss": 1.076772689819336, "percent_done": 80.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1411771774292, "wps": 5606.843480023397, "avg_wps": 4766.076499097849, "eta_in_seconds": 1361.3008522267949, "at": "2024-05-25T23:19:40.077284"}
{"lr": 6.084338916950114e-06, "step": 402, "loss": 1.377065896987915, "percent_done": 80.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5566.783654342226, "avg_wps": 4767.782423341762, "eta_in_seconds": 1347.0681817519724, "at": "2024-05-25T23:19:51.851186"}
{"lr": 5.965075267181666e-06, "step": 403, "loss": 1.2331016063690186, "percent_done": 80.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5548.671726005925, "avg_wps": 4769.447995733995, "eta_in_seconds": 1332.8569691264008, "at": "2024-05-25T23:20:03.663507"}
{"lr": 5.846862988132589e-06, "step": 404, "loss": 1.0951265096664429, "percent_done": 80.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5539.480818928031, "avg_wps": 4771.089629910645, "eta_in_seconds": 1318.6622947843948, "at": "2024-05-25T23:20:15.495393"}
{"lr": 5.7297072507909045e-06, "step": 405, "loss": 1.4920803308486938, "percent_done": 81.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5534.403541143231, "avg_wps": 4772.714964694794, "eta_in_seconds": 1304.48184022197, "at": "2024-05-25T23:20:27.338186"}
{"lr": 5.613613179928103e-06, "step": 406, "loss": 1.2911174297332764, "percent_done": 81.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5526.695652095237, "avg_wps": 4774.319244419228, "eta_in_seconds": 1290.3167309561386, "at": "2024-05-25T23:20:39.197486"}
{"lr": 5.498585853874947e-06, "step": 407, "loss": 1.5607460737228394, "percent_done": 81.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5534.129437121922, "avg_wps": 4775.9303328406495, "eta_in_seconds": 1276.1593187593417, "at": "2024-05-25T23:20:51.040820"}
{"lr": 5.384630304299297e-06, "step": 408, "loss": 1.230184555053711, "percent_done": 81.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5538.970584795458, "avg_wps": 4777.543438708813, "eta_in_seconds": 1262.0109220041948, "at": "2024-05-25T23:21:02.873847"}
{"lr": 5.271751515986073e-06, "step": 409, "loss": 1.7306795120239258, "percent_done": 81.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5534.589301050829, "avg_wps": 4779.141757463665, "eta_in_seconds": 1247.8759372823104, "at": "2024-05-25T23:21:14.716222"}
{"lr": 5.159954426619136e-06, "step": 410, "loss": 1.4807617664337158, "percent_done": 82.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5531.105844536752, "avg_wps": 4780.726998177519, "eta_in_seconds": 1233.7537789228486, "at": "2024-05-25T23:21:26.566047"}
{"lr": 5.049243926565364e-06, "step": 411, "loss": 1.6338636875152588, "percent_done": 82.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5538.592351119124, "avg_wps": 4782.319167994876, "eta_in_seconds": 1219.639215850482, "at": "2024-05-25T23:21:38.399897"}
{"lr": 4.939624858660665e-06, "step": 412, "loss": 1.3516926765441895, "percent_done": 82.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5534.434407402588, "avg_wps": 4783.897127158401, "eta_in_seconds": 1205.5376289886178, "at": "2024-05-25T23:21:50.242641"}
{"lr": 4.831102017998196e-06, "step": 413, "loss": 1.4513237476348877, "percent_done": 82.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5544.145147018787, "avg_wps": 4785.486027677265, "eta_in_seconds": 1191.442617745434, "at": "2024-05-25T23:22:02.064578"}
{"lr": 4.7236801517185786e-06, "step": 414, "loss": 1.3798224925994873, "percent_done": 82.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5538.539677054013, "avg_wps": 4787.058195894252, "eta_in_seconds": 1177.3610784247303, "at": "2024-05-25T23:22:13.898504"}
{"lr": 4.617363958802224e-06, "step": 415, "loss": 1.5379360914230347, "percent_done": 83.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14020013809204, "wps": 5529.878842948535, "avg_wps": 4788.608188254338, "eta_in_seconds": 1163.2941725455134, "at": "2024-05-25T23:22:25.750962"}
{"lr": 4.512158089863847e-06, "step": 416, "loss": 1.8933963775634766, "percent_done": 83.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13971185684204, "wps": 5532.745626480025, "avg_wps": 4790.156893819346, "eta_in_seconds": 1149.2366788868721, "at": "2024-05-25T23:22:37.597286"}
{"lr": 4.408067146948968e-06, "step": 417, "loss": 1.4693549871444702, "percent_done": 83.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14060878753662, "wps": 5542.810195597881, "avg_wps": 4791.717236870136, "eta_in_seconds": 1135.1855151521788, "at": "2024-05-25T23:22:49.422074"}
{"lr": 4.305095683332627e-06, "step": 418, "loss": 1.3827508687973022, "percent_done": 83.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14126491546631, "wps": 5529.436112187818, "avg_wps": 4793.247138794414, "eta_in_seconds": 1121.1506196927796, "at": "2024-05-25T23:23:01.275508"}
{"lr": 4.20324820332023e-06, "step": 419, "loss": 1.205785870552063, "percent_done": 83.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5548.4698999574275, "avg_wps": 4794.804748841511, "eta_in_seconds": 1107.1182828211272, "at": "2024-05-25T23:23:13.088229"}
{"lr": 4.102529162050497e-06, "step": 420, "loss": 1.5002938508987427, "percent_done": 84.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5545.813482066426, "avg_wps": 4796.351218540547, "eta_in_seconds": 1093.0975988024757, "at": "2024-05-25T23:23:24.906675"}
{"lr": 4.002942965300582e-06, "step": 421, "loss": 1.6744729280471802, "percent_done": 84.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5543.668488520225, "avg_wps": 4797.887517488994, "eta_in_seconds": 1079.0882406325352, "at": "2024-05-25T23:23:36.729630"}
{"lr": 3.90449396929334e-06, "step": 422, "loss": 1.101501226425171, "percent_done": 84.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5538.243404104972, "avg_wps": 4799.407867925258, "eta_in_seconds": 1065.0913905781028, "at": "2024-05-25T23:23:48.564191"}
{"lr": 3.8071864805067762e-06, "step": 423, "loss": 1.3566513061523438, "percent_done": 84.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5540.094318244161, "avg_wps": 4800.925274007002, "eta_in_seconds": 1051.1040501549453, "at": "2024-05-25T23:24:00.394820"}
{"lr": 3.711024755485704e-06, "step": 424, "loss": 1.2551512718200684, "percent_done": 84.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5542.924313784657, "avg_wps": 4802.4414884189255, "eta_in_seconds": 1037.1258061157082, "at": "2024-05-25T23:24:12.219363"}
{"lr": 3.6160130006554755e-06, "step": 425, "loss": 1.2069180011749268, "percent_done": 85.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139016151428223, "wps": 5534.400978256311, "avg_wps": 4803.936431805445, "eta_in_seconds": 1023.1609160058639, "at": "2024-05-25T23:24:24.062128"}
{"lr": 3.522155372138053e-06, "step": 426, "loss": 1.1142200231552124, "percent_done": 85.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13873529434204, "wps": 5537.163029679565, "avg_wps": 4805.430166854468, "eta_in_seconds": 1009.2049684647662, "at": "2024-05-25T23:24:35.899037"}
{"lr": 3.4294559755701608e-06, "step": 427, "loss": 1.5559438467025757, "percent_done": 85.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5536.620547093497, "avg_wps": 4806.916870634178, "eta_in_seconds": 995.2591502521301, "at": "2024-05-25T23:24:47.737045"}
{"lr": 3.337918865923721e-06, "step": 428, "loss": 1.4638431072235107, "percent_done": 85.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5542.063457795287, "avg_wps": 4808.407123322748, "eta_in_seconds": 981.3212315390043, "at": "2024-05-25T23:24:59.563431"}
{"lr": 3.2475480473284393e-06, "step": 429, "loss": 1.223836898803711, "percent_done": 85.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1414213180542, "wps": 5529.045500098511, "avg_wps": 4809.868435917796, "eta_in_seconds": 967.3977702286415, "at": "2024-05-25T23:25:11.417679"}
{"lr": 3.158347472896674e-06, "step": 430, "loss": 1.508067011833191, "percent_done": 86.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5552.6900207191175, "avg_wps": 4811.36529515232, "eta_in_seconds": 953.4757222907488, "at": "2024-05-25T23:25:23.221448"}
{"lr": 3.0703210445505373e-06, "step": 431, "loss": 1.4822466373443604, "percent_done": 86.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5541.777533517647, "avg_wps": 4812.837074971461, "eta_in_seconds": 939.5672302135458, "at": "2024-05-25T23:25:35.048424"}
{"lr": 2.9834726128511543e-06, "step": 432, "loss": 1.2388511896133423, "percent_done": 86.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14012050628662, "wps": 5537.369053691516, "avg_wps": 4814.295227857319, "eta_in_seconds": 925.6698621665989, "at": "2024-05-25T23:25:46.884836"}
{"lr": 2.897805976830286e-06, "step": 433, "loss": 1.2354152202606201, "percent_done": 86.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.138790130615234, "wps": 5534.54405783707, "avg_wps": 4815.742586240146, "eta_in_seconds": 911.7829537953296, "at": "2024-05-25T23:25:58.727314"}
{"lr": 2.8133248838241186e-06, "step": 434, "loss": 1.3420536518096924, "percent_done": 86.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14108180999756, "wps": 5521.232854084343, "avg_wps": 4817.160847962765, "eta_in_seconds": 897.9098137919254, "at": "2024-05-25T23:26:10.598317"}
{"lr": 2.7300330293093305e-06, "step": 435, "loss": 1.7331186532974243, "percent_done": 87.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5534.876044331215, "avg_wps": 4818.597248682247, "eta_in_seconds": 884.0415125304255, "at": "2024-05-25T23:26:22.440061"}
{"lr": 2.6479340567414757e-06, "step": 436, "loss": 1.6415690183639526, "percent_done": 87.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139389991760254, "wps": 5547.253878420293, "avg_wps": 4820.049393327249, "eta_in_seconds": 870.1786346435547, "at": "2024-05-25T23:26:34.255378"}
{"lr": 2.5670315573955692e-06, "step": 437, "loss": 1.2258780002593994, "percent_done": 87.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5546.94100147263, "avg_wps": 4821.4952205979325, "eta_in_seconds": 856.325229227952, "at": "2024-05-25T23:26:46.071406"}
{"lr": 2.48732907020903e-06, "step": 438, "loss": 1.1916077136993408, "percent_done": 87.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139499187469482, "wps": 5545.094906692296, "avg_wps": 4822.93212020207, "eta_in_seconds": 842.481689298534, "at": "2024-05-25T23:26:57.891361"}
{"lr": 2.4088300816268335e-06, "step": 439, "loss": 1.5336813926696777, "percent_done": 87.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.138530731201172, "wps": 5540.11441697168, "avg_wps": 4824.354729162702, "eta_in_seconds": 828.6488503497391, "at": "2024-05-25T23:27:09.721966"}
{"lr": 2.3315380254490547e-06, "step": 440, "loss": 1.52827787399292, "percent_done": 88.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5529.080087951019, "avg_wps": 4825.752639766269, "eta_in_seconds": 814.8283373659307, "at": "2024-05-25T23:27:21.576167"}
{"lr": 2.2554562826806213e-06, "step": 441, "loss": 1.4440735578536987, "percent_done": 88.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5542.894023386682, "avg_wps": 4827.168831674929, "eta_in_seconds": 801.0127954564127, "at": "2024-05-25T23:27:33.400790"}
{"lr": 2.1805881813834265e-06, "step": 442, "loss": 1.4471334218978882, "percent_done": 88.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139073848724365, "wps": 5537.265314725364, "avg_wps": 4828.5697675933225, "eta_in_seconds": 787.2078447557682, "at": "2024-05-25T23:27:45.237424"}
{"lr": 2.106936996530766e-06, "step": 443, "loss": 1.413780689239502, "percent_done": 88.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5540.2174810711995, "avg_wps": 4829.970254248535, "eta_in_seconds": 773.4109742630685, "at": "2024-05-25T23:27:57.067804"}
{"lr": 2.034505949864056e-06, "step": 444, "loss": 1.568229079246521, "percent_done": 88.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5539.475907015981, "avg_wps": 4831.363969229035, "eta_in_seconds": 759.6231671582472, "at": "2024-05-25T23:28:08.899756"}
{"lr": 1.9632982097519294e-06, "step": 445, "loss": 1.2987884283065796, "percent_done": 89.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5531.397235866023, "avg_wps": 4832.738381756317, "eta_in_seconds": 745.8462915366955, "at": "2024-05-25T23:28:20.748962"}
{"lr": 1.8933168910516103e-06, "step": 446, "loss": 1.2623353004455566, "percent_done": 89.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13873529434204, "wps": 5533.95674324649, "avg_wps": 4834.111789051965, "eta_in_seconds": 732.0774021020385, "at": "2024-05-25T23:28:32.592677"}
{"lr": 1.8245650549726923e-06, "step": 447, "loss": 1.3227944374084473, "percent_done": 89.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5544.433440514158, "avg_wps": 4835.49768790479, "eta_in_seconds": 718.3144785051112, "at": "2024-05-25T23:28:44.414020"}
{"lr": 1.757045708943213e-06, "step": 448, "loss": 1.8180917501449585, "percent_done": 89.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1396541595459, "wps": 5538.572375031584, "avg_wps": 4836.868222076985, "eta_in_seconds": 704.5616798996925, "at": "2024-05-25T23:28:56.247919"}
{"lr": 1.6907618064780943e-06, "step": 449, "loss": 1.5383700132369995, "percent_done": 89.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139648914337158, "wps": 5537.020595403856, "avg_wps": 4838.230785310016, "eta_in_seconds": 690.8178109543892, "at": "2024-05-25T23:29:08.085102"}
{"lr": 1.625716247049965e-06, "step": 450, "loss": 1.5726405382156372, "percent_done": 90.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13873529434204, "wps": 5534.567793716583, "avg_wps": 4839.58388961061, "eta_in_seconds": 677.083004395167, "at": "2024-05-25T23:29:19.927528"}
{"lr": 1.5619118759623072e-06, "step": 451, "loss": 1.229055404663086, "percent_done": 90.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1384916305542, "wps": 5537.345851520766, "avg_wps": 4840.936455656658, "eta_in_seconds": 663.35594970424, "at": "2024-05-25T23:29:31.763999"}
{"lr": 1.4993514842250177e-06, "step": 452, "loss": 1.3133533000946045, "percent_done": 90.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5536.939398876936, "avg_wps": 4842.2831004232, "eta_in_seconds": 649.6373579902987, "at": "2024-05-25T23:29:43.601340"}
{"lr": 1.4380378084322957e-06, "step": 453, "loss": 1.1959723234176636, "percent_done": 90.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14009380340576, "wps": 5533.535638209661, "avg_wps": 4843.618790749949, "eta_in_seconds": 635.9278326945063, "at": "2024-05-25T23:29:55.445992"}
{"lr": 1.37797353064294e-06, "step": 454, "loss": 1.4957315921783447, "percent_done": 90.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1392240524292, "wps": 5527.092155814596, "avg_wps": 4844.938436304245, "eta_in_seconds": 622.2279270693069, "at": "2024-05-25T23:30:07.304292"}
{"lr": 1.319161278263055e-06, "step": 455, "loss": 1.2987531423568726, "percent_done": 91.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1384916305542, "wps": 5533.508569363958, "avg_wps": 4846.263824964534, "eta_in_seconds": 608.5347613161737, "at": "2024-05-25T23:30:19.148845"}
{"lr": 1.261603623931077e-06, "step": 456, "loss": 1.779760718345642, "percent_done": 91.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139268398284912, "wps": 5537.596065956076, "avg_wps": 4847.590995297616, "eta_in_seconds": 594.8488646829337, "at": "2024-05-25T23:30:30.984704"}
{"lr": 1.205303085405276e-06, "step": 457, "loss": 1.1598193645477295, "percent_done": 91.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1399564743042, "wps": 5529.567366678185, "avg_wps": 4848.899590022369, "eta_in_seconds": 581.1726862314754, "at": "2024-05-25T23:30:42.837739"}
{"lr": 1.1502621254535857e-06, "step": 458, "loss": 1.7242182493209839, "percent_done": 91.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5535.512602459266, "avg_wps": 4850.213148865603, "eta_in_seconds": 567.503306662672, "at": "2024-05-25T23:30:54.678085"}
{"lr": 1.0964831517459112e-06, "step": 459, "loss": 1.4536421298980713, "percent_done": 91.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5538.07558595897, "avg_wps": 4851.525978558798, "eta_in_seconds": 553.8414123463475, "at": "2024-05-25T23:31:06.512881"}
{"lr": 1.0439685167487763e-06, "step": 460, "loss": 1.2507259845733643, "percent_done": 92.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1411771774292, "wps": 5541.388527230523, "avg_wps": 4852.839333307466, "eta_in_seconds": 540.1868514392687, "at": "2024-05-25T23:31:18.340633"}
{"lr": 9.927205176224375e-07, "step": 461, "loss": 1.3502042293548584, "percent_done": 92.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5539.462957471421, "avg_wps": 4854.144490597286, "eta_in_seconds": 526.5405685699943, "at": "2024-05-25T23:31:30.172495"}
{"lr": 9.427413961204031e-07, "step": 462, "loss": 1.4290932416915894, "percent_done": 92.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13957977294922, "wps": 5534.486557677176, "avg_wps": 4855.4364125667935, "eta_in_seconds": 512.9030201187381, "at": "2024-05-25T23:31:42.014967"}
{"lr": 8.940333384913533e-07, "step": 463, "loss": 1.162807822227478, "percent_done": 92.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1411771774292, "wps": 5541.743568701974, "avg_wps": 4856.735491565326, "eta_in_seconds": 499.271991281221, "at": "2024-05-25T23:31:53.841921"}
{"lr": 8.465984753835264e-07, "step": 464, "loss": 1.526496410369873, "percent_done": 92.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5534.90713876165, "avg_wps": 4858.018325554442, "eta_in_seconds": 485.6498765328835, "at": "2024-05-25T23:32:05.683498"}
{"lr": 8.004388817514974e-07, "step": 465, "loss": 1.6751914024353027, "percent_done": 93.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5541.382718245516, "avg_wps": 4859.307036709747, "eta_in_seconds": 472.0343832303119, "at": "2024-05-25T23:32:17.511332"}
{"lr": 7.555565767654276e-07, "step": 466, "loss": 1.8657950162887573, "percent_done": 93.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.140678882598877, "wps": 5540.418260501413, "avg_wps": 4860.589303797008, "eta_in_seconds": 458.42671757092296, "at": "2024-05-25T23:32:29.341241"}
{"lr": 7.119535237227388e-07, "step": 467, "loss": 1.3259780406951904, "percent_done": 93.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5541.7370886199615, "avg_wps": 4861.868926085916, "eta_in_seconds": 444.82647164679696, "at": "2024-05-25T23:32:41.168314"}
{"lr": 6.696316299622224e-07, "step": 468, "loss": 1.1357439756393433, "percent_done": 93.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5528.122019903643, "avg_wps": 4863.121290926681, "eta_in_seconds": 431.2357999198457, "at": "2024-05-25T23:32:53.024499"}
{"lr": 6.285927467806198e-07, "step": 469, "loss": 1.483215570449829, "percent_done": 93.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5536.983565923128, "avg_wps": 4864.383562723774, "eta_in_seconds": 417.6512756042643, "at": "2024-05-25T23:33:04.861725"}
{"lr": 5.888386693516242e-07, "step": 470, "loss": 1.3447225093841553, "percent_done": 94.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 2818.414741643536, "avg_wps": 4856.881964494165, "eta_in_seconds": 404.80291972769066, "at": "2024-05-25T23:33:28.140354"}
{"lr": 5.503711366473705e-07, "step": 471, "loss": 1.2989805936813354, "percent_done": 94.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5565.773708553193, "avg_wps": 4858.195701616006, "eta_in_seconds": 391.20367245967725, "at": "2024-05-25T23:33:39.916395"}
{"lr": 5.131918313623563e-07, "step": 472, "loss": 1.4937809705734253, "percent_done": 94.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5541.998091496166, "avg_wps": 4859.466014763509, "eta_in_seconds": 377.61515245195164, "at": "2024-05-25T23:33:51.742938"}
{"lr": 4.773023798398375e-07, "step": 473, "loss": 1.5734940767288208, "percent_done": 94.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13873529434204, "wps": 5539.568676644442, "avg_wps": 4860.727664124924, "eta_in_seconds": 364.03438379396596, "at": "2024-05-25T23:34:03.574673"}
{"lr": 4.4270435200069295e-07, "step": 474, "loss": 1.2783210277557373, "percent_done": 94.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5540.620618010061, "avg_wps": 4861.986350468246, "eta_in_seconds": 350.46087692860306, "at": "2024-05-25T23:34:15.404144"}
{"lr": 4.0939926127473865e-07, "step": 475, "loss": 1.5040833950042725, "percent_done": 95.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5534.530239860128, "avg_wps": 4863.230495788966, "eta_in_seconds": 336.8954034604524, "at": "2024-05-25T23:34:27.246698"}
{"lr": 3.7738856453453507e-07, "step": 476, "loss": 1.4859583377838135, "percent_done": 95.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139155387878418, "wps": 5531.467583980725, "avg_wps": 4864.46507324175, "eta_in_seconds": 323.3375050119993, "at": "2024-05-25T23:34:39.095749"}
{"lr": 3.4667366203166475e-07, "step": 477, "loss": 1.377013087272644, "percent_done": 95.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5527.310990665434, "avg_wps": 4865.688349634892, "eta_in_seconds": 309.787206184939, "at": "2024-05-25T23:34:50.953697"}
{"lr": 3.172558973354582e-07, "step": 478, "loss": 1.727473258972168, "percent_done": 95.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5528.57488139409, "avg_wps": 4866.909168814225, "eta_in_seconds": 296.24386853952285, "at": "2024-05-25T23:35:02.808942"}
{"lr": 2.8913655727425123e-07, "step": 479, "loss": 1.2657310962677002, "percent_done": 95.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13897943496704, "wps": 5522.30968311067, "avg_wps": 4868.115346713984, "eta_in_seconds": 282.7081738991628, "at": "2024-05-25T23:35:14.677633"}
{"lr": 2.623168718790634e-07, "step": 480, "loss": 1.3324154615402222, "percent_done": 96.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5539.5219007153655, "avg_wps": 4869.344886513437, "eta_in_seconds": 269.17789364854497, "at": "2024-05-25T23:35:26.509479"}
{"lr": 2.3679801432982478e-07, "step": 481, "loss": 1.4634283781051636, "percent_done": 96.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5533.054787905231, "avg_wps": 4870.559525187848, "eta_in_seconds": 255.65522678874882, "at": "2024-05-25T23:35:38.355185"}
{"lr": 2.1258110090402713e-07, "step": 482, "loss": 1.1581710577011108, "percent_done": 96.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5533.8807613556955, "avg_wps": 4871.771054529839, "eta_in_seconds": 242.1394574572931, "at": "2024-05-25T23:35:50.199074"}
{"lr": 1.896671909279231e-07, "step": 483, "loss": 1.384340763092041, "percent_done": 96.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5536.405769426682, "avg_wps": 4872.982218114612, "eta_in_seconds": 228.63042591422732, "at": "2024-05-25T23:36:02.037548"}
{"lr": 1.6805728673016362e-07, "step": 484, "loss": 1.2824896574020386, "percent_done": 96.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1389799118042, "wps": 5534.988832962237, "avg_wps": 4874.186705841601, "eta_in_seconds": 215.12840259961845, "at": "2024-05-25T23:36:13.879042"}
{"lr": 1.477523335979629e-07, "step": 485, "loss": 1.3915427923202515, "percent_done": 97.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13929796218872, "wps": 5530.157866487155, "avg_wps": 4875.379083605387, "eta_in_seconds": 201.6335515951373, "at": "2024-05-25T23:36:25.730955"}
{"lr": 1.2875321973575205e-07, "step": 486, "loss": 1.7751845121383667, "percent_done": 97.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.13979434967041, "wps": 5517.335469256387, "avg_wps": 4876.546571104314, "eta_in_seconds": 188.14626019089312, "at": "2024-05-25T23:36:37.610398"}
{"lr": 1.1106077622631656e-07, "step": 487, "loss": 1.3046096563339233, "percent_done": 97.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5530.925437716181, "avg_wps": 4877.731576689974, "eta_in_seconds": 174.66479788913375, "at": "2024-05-25T23:36:49.460632"}
{"lr": 9.467577699445256e-08, "step": 488, "loss": 1.3110491037368774, "percent_done": 97.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5537.196603743627, "avg_wps": 4878.922286422781, "eta_in_seconds": 161.18969596800258, "at": "2024-05-25T23:37:01.297432"}
{"lr": 7.959893877311043e-08, "step": 489, "loss": 1.4425559043884277, "percent_done": 97.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5533.1076918270655, "avg_wps": 4880.10220431381, "eta_in_seconds": 147.72149635775202, "at": "2024-05-25T23:37:13.143006"}
{"lr": 6.58309210720302e-08, "step": 490, "loss": 1.190127968788147, "percent_done": 98.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5536.834003090966, "avg_wps": 4881.283788090012, "eta_in_seconds": 134.25976207304973, "at": "2024-05-25T23:37:24.980578"}
{"lr": 5.337232614891126e-08, "step": 491, "loss": 1.4984546899795532, "percent_done": 98.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139284133911133, "wps": 5540.317422294481, "avg_wps": 4882.466640951081, "eta_in_seconds": 120.8045120171277, "at": "2024-05-25T23:37:36.810755"}
{"lr": 4.222369898305362e-08, "step": 492, "loss": 1.3258860111236572, "percent_done": 98.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5531.842284623181, "avg_wps": 4883.6318504608325, "eta_in_seconds": 107.35616771573943, "at": "2024-05-25T23:37:48.659041"}
{"lr": 3.2385527251530405e-08, "step": 493, "loss": 1.438199758529663, "percent_done": 98.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1397123336792, "wps": 5535.22545883186, "avg_wps": 4884.798233541129, "eta_in_seconds": 93.9142167326403, "at": "2024-05-25T23:38:00.500070"}
{"lr": 2.385824130784165e-08, "step": 494, "loss": 1.260614275932312, "percent_done": 98.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1387357711792, "wps": 5536.991373302559, "avg_wps": 4885.963232735457, "eta_in_seconds": 80.47870630001732, "at": "2024-05-25T23:38:12.337279"}
{"lr": 1.6642214163099443e-08, "step": 495, "loss": 1.3144422769546509, "percent_done": 99.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1409330368042, "wps": 5527.284538401669, "avg_wps": 4887.108773774314, "eta_in_seconds": 67.04986837175157, "at": "2024-05-25T23:38:24.195333"}
{"lr": 1.0737761469707708e-08, "step": 496, "loss": 1.1841107606887817, "percent_done": 99.2, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1402006149292, "wps": 5524.8966534966985, "avg_wps": 4888.246462675485, "eta_in_seconds": 53.62741056565316, "at": "2024-05-25T23:38:36.058509"}
{"lr": 6.145141507556636e-09, "step": 497, "loss": 1.244451642036438, "percent_done": 99.4, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5528.994675647007, "avg_wps": 4889.38655288693, "eta_in_seconds": 40.21117943393393, "at": "2024-05-25T23:38:47.912875"}
{"lr": 2.864555172718443e-09, "step": 498, "loss": 1.3902086019515991, "percent_done": 99.6, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.1404447555542, "wps": 5532.748076470777, "avg_wps": 4890.52848592629, "eta_in_seconds": 26.80119344508313, "at": "2024-05-25T23:38:59.759170"}
{"lr": 8.961459686677561e-10, "step": 499, "loss": 1.4591144323349, "percent_done": 99.8, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.139838218688965, "wps": 5530.526158362615, "avg_wps": 4891.662890367311, "eta_in_seconds": 13.397489047958283, "at": "2024-05-25T23:39:11.610269"}
{"lr": 2.4e-10, "step": 500, "loss": 1.562139868736267, "percent_done": 100.0, "peak_allocated_mem": 64.85545778274536, "allocated_mem": 24.14044427871704, "wps": 5528.798504252308, "avg_wps": 4892.790575206737, "eta_in_seconds": 0.0, "at": "2024-05-25T23:39:23.465087"}