{ "best_metric": 1.509622573852539, "best_model_checkpoint": "ai-light-dance_singing_ft_pretrain_wav2vec2-large-lv60/checkpoint-2208", "epoch": 29.99864314789688, "global_step": 5520, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.05, "learning_rate": 3.5000000000000004e-06, "loss": 24.452, "step": 10 }, { "epoch": 0.11, "learning_rate": 8.500000000000002e-06, "loss": 4.8937, "step": 20 }, { "epoch": 0.16, "learning_rate": 1.3500000000000001e-05, "loss": 3.1628, "step": 30 }, { "epoch": 0.22, "learning_rate": 1.85e-05, "loss": 2.7289, "step": 40 }, { "epoch": 0.27, "learning_rate": 2.35e-05, "loss": 2.6206, "step": 50 }, { "epoch": 0.33, "learning_rate": 2.8499999999999998e-05, "loss": 2.5345, "step": 60 }, { "epoch": 0.38, "learning_rate": 3.35e-05, "loss": 2.3627, "step": 70 }, { "epoch": 0.43, "learning_rate": 3.85e-05, "loss": 2.4229, "step": 80 }, { "epoch": 0.49, "learning_rate": 4.35e-05, "loss": 2.2473, "step": 90 }, { "epoch": 0.54, "learning_rate": 4.85e-05, "loss": 2.1727, "step": 100 }, { "epoch": 0.6, "learning_rate": 4.9935424354243546e-05, "loss": 2.068, "step": 110 }, { "epoch": 0.65, "learning_rate": 4.9843173431734316e-05, "loss": 1.942, "step": 120 }, { "epoch": 0.71, "learning_rate": 4.975092250922509e-05, "loss": 1.9866, "step": 130 }, { "epoch": 0.76, "learning_rate": 4.965867158671587e-05, "loss": 1.901, "step": 140 }, { "epoch": 0.81, "learning_rate": 4.956642066420664e-05, "loss": 1.9123, "step": 150 }, { "epoch": 0.87, "learning_rate": 4.947416974169742e-05, "loss": 1.9567, "step": 160 }, { "epoch": 0.92, "learning_rate": 4.9381918819188194e-05, "loss": 1.9209, "step": 170 }, { "epoch": 0.98, "learning_rate": 4.928966789667897e-05, "loss": 1.8237, "step": 180 }, { "epoch": 1.0, "eval_loss": 1.9361721277236938, "eval_runtime": 222.0007, "eval_samples_per_second": 8.851, "eval_steps_per_second": 0.739, "eval_wer": 1.0743022611052924, "step": 184 }, { "epoch": 1.03, "learning_rate": 4.919741697416975e-05, "loss": 1.8381, "step": 190 }, { "epoch": 1.09, "learning_rate": 4.910516605166052e-05, "loss": 1.7931, "step": 200 }, { "epoch": 1.14, "learning_rate": 4.9012915129151295e-05, "loss": 1.6989, "step": 210 }, { "epoch": 1.2, "learning_rate": 4.892066420664207e-05, "loss": 1.772, "step": 220 }, { "epoch": 1.25, "learning_rate": 4.882841328413285e-05, "loss": 1.851, "step": 230 }, { "epoch": 1.3, "learning_rate": 4.873616236162362e-05, "loss": 1.7447, "step": 240 }, { "epoch": 1.36, "learning_rate": 4.864391143911439e-05, "loss": 1.6539, "step": 250 }, { "epoch": 1.41, "learning_rate": 4.8551660516605166e-05, "loss": 1.6666, "step": 260 }, { "epoch": 1.47, "learning_rate": 4.845940959409594e-05, "loss": 1.6747, "step": 270 }, { "epoch": 1.52, "learning_rate": 4.836715867158672e-05, "loss": 1.9576, "step": 280 }, { "epoch": 1.58, "learning_rate": 4.827490774907749e-05, "loss": 1.7807, "step": 290 }, { "epoch": 1.63, "learning_rate": 4.818265682656827e-05, "loss": 1.7131, "step": 300 }, { "epoch": 1.68, "learning_rate": 4.8090405904059044e-05, "loss": 1.6683, "step": 310 }, { "epoch": 1.74, "learning_rate": 4.799815498154982e-05, "loss": 1.652, "step": 320 }, { "epoch": 1.79, "learning_rate": 4.790590405904059e-05, "loss": 1.6841, "step": 330 }, { "epoch": 1.85, "learning_rate": 4.781365313653137e-05, "loss": 1.6687, "step": 340 }, { "epoch": 1.9, "learning_rate": 4.7721402214022145e-05, "loss": 1.7193, "step": 350 }, { "epoch": 1.96, "learning_rate": 4.762915129151292e-05, "loss": 1.6396, "step": 360 }, { "epoch": 2.0, "eval_loss": 1.7375205755233765, "eval_runtime": 221.4077, "eval_samples_per_second": 8.875, "eval_steps_per_second": 0.741, "eval_wer": 1.0047132031298134, "step": 368 }, { "epoch": 2.01, "learning_rate": 4.753690036900369e-05, "loss": 1.7377, "step": 370 }, { "epoch": 2.07, "learning_rate": 4.744464944649447e-05, "loss": 1.6228, "step": 380 }, { "epoch": 2.12, "learning_rate": 4.735239852398524e-05, "loss": 1.5957, "step": 390 }, { "epoch": 2.17, "learning_rate": 4.7260147601476016e-05, "loss": 1.5835, "step": 400 }, { "epoch": 2.23, "learning_rate": 4.716789667896679e-05, "loss": 1.6163, "step": 410 }, { "epoch": 2.28, "learning_rate": 4.707564575645756e-05, "loss": 1.6906, "step": 420 }, { "epoch": 2.34, "learning_rate": 4.698339483394834e-05, "loss": 1.5954, "step": 430 }, { "epoch": 2.39, "learning_rate": 4.689114391143912e-05, "loss": 1.6243, "step": 440 }, { "epoch": 2.45, "learning_rate": 4.6798892988929894e-05, "loss": 1.6176, "step": 450 }, { "epoch": 2.5, "learning_rate": 4.6706642066420664e-05, "loss": 1.6545, "step": 460 }, { "epoch": 2.55, "learning_rate": 4.661439114391144e-05, "loss": 1.6033, "step": 470 }, { "epoch": 2.61, "learning_rate": 4.652214022140222e-05, "loss": 1.5814, "step": 480 }, { "epoch": 2.66, "learning_rate": 4.6429889298892995e-05, "loss": 1.6126, "step": 490 }, { "epoch": 2.72, "learning_rate": 4.633763837638377e-05, "loss": 1.6164, "step": 500 }, { "epoch": 2.77, "learning_rate": 4.624538745387454e-05, "loss": 1.6162, "step": 510 }, { "epoch": 2.82, "learning_rate": 4.615313653136532e-05, "loss": 1.5878, "step": 520 }, { "epoch": 2.88, "learning_rate": 4.606088560885609e-05, "loss": 1.5904, "step": 530 }, { "epoch": 2.93, "learning_rate": 4.5968634686346866e-05, "loss": 1.5893, "step": 540 }, { "epoch": 2.99, "learning_rate": 4.5876383763837636e-05, "loss": 1.593, "step": 550 }, { "epoch": 3.0, "eval_loss": 1.5942492485046387, "eval_runtime": 220.0723, "eval_samples_per_second": 8.929, "eval_steps_per_second": 0.745, "eval_wer": 0.9464296716160434, "step": 552 }, { "epoch": 3.04, "learning_rate": 4.578413284132841e-05, "loss": 1.627, "step": 560 }, { "epoch": 3.1, "learning_rate": 4.569188191881919e-05, "loss": 1.5336, "step": 570 }, { "epoch": 3.15, "learning_rate": 4.5599630996309966e-05, "loss": 1.5652, "step": 580 }, { "epoch": 3.21, "learning_rate": 4.550738007380074e-05, "loss": 1.552, "step": 590 }, { "epoch": 3.26, "learning_rate": 4.5415129151291513e-05, "loss": 1.5808, "step": 600 }, { "epoch": 3.31, "learning_rate": 4.532287822878229e-05, "loss": 1.562, "step": 610 }, { "epoch": 3.37, "learning_rate": 4.523062730627307e-05, "loss": 1.6355, "step": 620 }, { "epoch": 3.42, "learning_rate": 4.5138376383763844e-05, "loss": 1.4959, "step": 630 }, { "epoch": 3.48, "learning_rate": 4.5046125461254614e-05, "loss": 1.5578, "step": 640 }, { "epoch": 3.53, "learning_rate": 4.495387453874539e-05, "loss": 1.5428, "step": 650 }, { "epoch": 3.59, "learning_rate": 4.486162361623616e-05, "loss": 1.5499, "step": 660 }, { "epoch": 3.64, "learning_rate": 4.476937269372694e-05, "loss": 1.5335, "step": 670 }, { "epoch": 3.69, "learning_rate": 4.4677121771217715e-05, "loss": 1.5617, "step": 680 }, { "epoch": 3.75, "learning_rate": 4.4584870848708485e-05, "loss": 1.5798, "step": 690 }, { "epoch": 3.8, "learning_rate": 4.449261992619926e-05, "loss": 1.6642, "step": 700 }, { "epoch": 3.86, "learning_rate": 4.440036900369004e-05, "loss": 1.5389, "step": 710 }, { "epoch": 3.91, "learning_rate": 4.4308118081180816e-05, "loss": 1.5419, "step": 720 }, { "epoch": 3.97, "learning_rate": 4.4215867158671586e-05, "loss": 1.5281, "step": 730 }, { "epoch": 4.0, "eval_loss": 1.603651762008667, "eval_runtime": 220.139, "eval_samples_per_second": 8.926, "eval_steps_per_second": 0.745, "eval_wer": 0.9525599162097221, "step": 736 }, { "epoch": 4.02, "learning_rate": 4.412361623616236e-05, "loss": 1.6156, "step": 740 }, { "epoch": 4.08, "learning_rate": 4.403136531365314e-05, "loss": 1.5245, "step": 750 }, { "epoch": 4.13, "learning_rate": 4.393911439114392e-05, "loss": 1.5406, "step": 760 }, { "epoch": 4.18, "learning_rate": 4.384686346863469e-05, "loss": 1.5113, "step": 770 }, { "epoch": 4.24, "learning_rate": 4.3754612546125464e-05, "loss": 1.4826, "step": 780 }, { "epoch": 4.29, "learning_rate": 4.366236162361624e-05, "loss": 1.5617, "step": 790 }, { "epoch": 4.35, "learning_rate": 4.357011070110701e-05, "loss": 1.4855, "step": 800 }, { "epoch": 4.4, "learning_rate": 4.347785977859779e-05, "loss": 1.4794, "step": 810 }, { "epoch": 4.46, "learning_rate": 4.338560885608856e-05, "loss": 1.5432, "step": 820 }, { "epoch": 4.51, "learning_rate": 4.3293357933579335e-05, "loss": 1.5393, "step": 830 }, { "epoch": 4.56, "learning_rate": 4.320110701107011e-05, "loss": 1.4692, "step": 840 }, { "epoch": 4.62, "learning_rate": 4.310885608856089e-05, "loss": 1.4912, "step": 850 }, { "epoch": 4.67, "learning_rate": 4.301660516605166e-05, "loss": 1.525, "step": 860 }, { "epoch": 4.73, "learning_rate": 4.2924354243542436e-05, "loss": 1.537, "step": 870 }, { "epoch": 4.78, "learning_rate": 4.283210332103321e-05, "loss": 1.6147, "step": 880 }, { "epoch": 4.84, "learning_rate": 4.273985239852399e-05, "loss": 1.4958, "step": 890 }, { "epoch": 4.89, "learning_rate": 4.264760147601477e-05, "loss": 1.4511, "step": 900 }, { "epoch": 4.94, "learning_rate": 4.255535055350554e-05, "loss": 1.4764, "step": 910 }, { "epoch": 5.0, "learning_rate": 4.2463099630996314e-05, "loss": 1.5243, "step": 920 }, { "epoch": 5.0, "eval_loss": 1.5291955471038818, "eval_runtime": 219.2797, "eval_samples_per_second": 8.961, "eval_steps_per_second": 0.748, "eval_wer": 0.9407307005113671, "step": 920 }, { "epoch": 5.05, "learning_rate": 4.237084870848709e-05, "loss": 1.4853, "step": 930 }, { "epoch": 5.11, "learning_rate": 4.227859778597786e-05, "loss": 1.5161, "step": 940 }, { "epoch": 5.16, "learning_rate": 4.218634686346863e-05, "loss": 1.4618, "step": 950 }, { "epoch": 5.22, "learning_rate": 4.209409594095941e-05, "loss": 1.5156, "step": 960 }, { "epoch": 5.27, "learning_rate": 4.2001845018450185e-05, "loss": 1.4883, "step": 970 }, { "epoch": 5.33, "learning_rate": 4.190959409594096e-05, "loss": 1.4644, "step": 980 }, { "epoch": 5.38, "learning_rate": 4.181734317343174e-05, "loss": 1.5241, "step": 990 }, { "epoch": 5.43, "learning_rate": 4.172509225092251e-05, "loss": 1.4509, "step": 1000 }, { "epoch": 5.49, "learning_rate": 4.1632841328413286e-05, "loss": 1.4532, "step": 1010 }, { "epoch": 5.54, "learning_rate": 4.154059040590406e-05, "loss": 1.5239, "step": 1020 }, { "epoch": 5.6, "learning_rate": 4.144833948339484e-05, "loss": 1.498, "step": 1030 }, { "epoch": 5.65, "learning_rate": 4.135608856088561e-05, "loss": 1.4488, "step": 1040 }, { "epoch": 5.71, "learning_rate": 4.126383763837639e-05, "loss": 1.4744, "step": 1050 }, { "epoch": 5.76, "learning_rate": 4.1171586715867164e-05, "loss": 1.4506, "step": 1060 }, { "epoch": 5.81, "learning_rate": 4.1079335793357934e-05, "loss": 1.4844, "step": 1070 }, { "epoch": 5.87, "learning_rate": 4.098708487084871e-05, "loss": 1.5083, "step": 1080 }, { "epoch": 5.92, "learning_rate": 4.089483394833948e-05, "loss": 1.4772, "step": 1090 }, { "epoch": 5.98, "learning_rate": 4.080258302583026e-05, "loss": 1.4443, "step": 1100 }, { "epoch": 6.0, "eval_loss": 1.5464590787887573, "eval_runtime": 219.9723, "eval_samples_per_second": 8.933, "eval_steps_per_second": 0.746, "eval_wer": 0.9456595403856817, "step": 1104 }, { "epoch": 6.03, "learning_rate": 4.0710332103321035e-05, "loss": 1.5313, "step": 1110 }, { "epoch": 6.09, "learning_rate": 4.061808118081181e-05, "loss": 1.4464, "step": 1120 }, { "epoch": 6.14, "learning_rate": 4.052583025830258e-05, "loss": 1.4509, "step": 1130 }, { "epoch": 6.2, "learning_rate": 4.043357933579336e-05, "loss": 1.4327, "step": 1140 }, { "epoch": 6.25, "learning_rate": 4.0341328413284135e-05, "loss": 1.5132, "step": 1150 }, { "epoch": 6.3, "learning_rate": 4.024907749077491e-05, "loss": 1.4134, "step": 1160 }, { "epoch": 6.36, "learning_rate": 4.015682656826568e-05, "loss": 1.4729, "step": 1170 }, { "epoch": 6.41, "learning_rate": 4.006457564575646e-05, "loss": 1.4597, "step": 1180 }, { "epoch": 6.47, "learning_rate": 3.9972324723247236e-05, "loss": 1.4235, "step": 1190 }, { "epoch": 6.52, "learning_rate": 3.988007380073801e-05, "loss": 1.5225, "step": 1200 }, { "epoch": 6.58, "learning_rate": 3.9787822878228783e-05, "loss": 1.468, "step": 1210 }, { "epoch": 6.63, "learning_rate": 3.969557195571956e-05, "loss": 1.4392, "step": 1220 }, { "epoch": 6.68, "learning_rate": 3.960332103321033e-05, "loss": 1.438, "step": 1230 }, { "epoch": 6.74, "learning_rate": 3.951107011070111e-05, "loss": 1.4487, "step": 1240 }, { "epoch": 6.79, "learning_rate": 3.9418819188191884e-05, "loss": 1.5486, "step": 1250 }, { "epoch": 6.85, "learning_rate": 3.9326568265682654e-05, "loss": 1.4567, "step": 1260 }, { "epoch": 6.9, "learning_rate": 3.923431734317343e-05, "loss": 1.4321, "step": 1270 }, { "epoch": 6.96, "learning_rate": 3.914206642066421e-05, "loss": 1.4801, "step": 1280 }, { "epoch": 7.0, "eval_loss": 1.5965466499328613, "eval_runtime": 220.319, "eval_samples_per_second": 8.919, "eval_steps_per_second": 0.744, "eval_wer": 0.9207072885219642, "step": 1288 }, { "epoch": 7.01, "learning_rate": 3.9049815498154985e-05, "loss": 1.4991, "step": 1290 }, { "epoch": 7.07, "learning_rate": 3.895756457564576e-05, "loss": 1.4496, "step": 1300 }, { "epoch": 7.12, "learning_rate": 3.886531365313653e-05, "loss": 1.4205, "step": 1310 }, { "epoch": 7.17, "learning_rate": 3.877306273062731e-05, "loss": 1.457, "step": 1320 }, { "epoch": 7.23, "learning_rate": 3.8680811808118086e-05, "loss": 1.4199, "step": 1330 }, { "epoch": 7.28, "learning_rate": 3.858856088560886e-05, "loss": 1.438, "step": 1340 }, { "epoch": 7.34, "learning_rate": 3.849630996309963e-05, "loss": 1.4591, "step": 1350 }, { "epoch": 7.39, "learning_rate": 3.84040590405904e-05, "loss": 1.4435, "step": 1360 }, { "epoch": 7.45, "learning_rate": 3.831180811808118e-05, "loss": 1.4468, "step": 1370 }, { "epoch": 7.5, "learning_rate": 3.821955719557196e-05, "loss": 1.4338, "step": 1380 }, { "epoch": 7.55, "learning_rate": 3.8127306273062734e-05, "loss": 1.4408, "step": 1390 }, { "epoch": 7.61, "learning_rate": 3.8035055350553504e-05, "loss": 1.408, "step": 1400 }, { "epoch": 7.66, "learning_rate": 3.794280442804428e-05, "loss": 1.404, "step": 1410 }, { "epoch": 7.72, "learning_rate": 3.785055350553506e-05, "loss": 1.4455, "step": 1420 }, { "epoch": 7.77, "learning_rate": 3.7758302583025835e-05, "loss": 1.4329, "step": 1430 }, { "epoch": 7.82, "learning_rate": 3.7666051660516605e-05, "loss": 1.4411, "step": 1440 }, { "epoch": 7.88, "learning_rate": 3.757380073800738e-05, "loss": 1.47, "step": 1450 }, { "epoch": 7.93, "learning_rate": 3.748154981549816e-05, "loss": 1.3934, "step": 1460 }, { "epoch": 7.99, "learning_rate": 3.7389298892988936e-05, "loss": 1.4104, "step": 1470 }, { "epoch": 8.0, "eval_loss": 1.5224082469940186, "eval_runtime": 219.345, "eval_samples_per_second": 8.958, "eval_steps_per_second": 0.748, "eval_wer": 0.9210769515125378, "step": 1472 }, { "epoch": 8.04, "learning_rate": 3.729704797047971e-05, "loss": 1.4428, "step": 1480 }, { "epoch": 8.1, "learning_rate": 3.720479704797048e-05, "loss": 1.384, "step": 1490 }, { "epoch": 8.15, "learning_rate": 3.711254612546125e-05, "loss": 1.3734, "step": 1500 }, { "epoch": 8.21, "learning_rate": 3.702029520295203e-05, "loss": 1.411, "step": 1510 }, { "epoch": 8.26, "learning_rate": 3.692804428044281e-05, "loss": 1.4471, "step": 1520 }, { "epoch": 8.31, "learning_rate": 3.683579335793358e-05, "loss": 1.3742, "step": 1530 }, { "epoch": 8.37, "learning_rate": 3.6743542435424354e-05, "loss": 1.3913, "step": 1540 }, { "epoch": 8.42, "learning_rate": 3.665129151291513e-05, "loss": 1.4212, "step": 1550 }, { "epoch": 8.48, "learning_rate": 3.655904059040591e-05, "loss": 1.3764, "step": 1560 }, { "epoch": 8.53, "learning_rate": 3.646678966789668e-05, "loss": 1.4378, "step": 1570 }, { "epoch": 8.59, "learning_rate": 3.6374538745387455e-05, "loss": 1.4019, "step": 1580 }, { "epoch": 8.64, "learning_rate": 3.628228782287823e-05, "loss": 1.3696, "step": 1590 }, { "epoch": 8.69, "learning_rate": 3.619003690036901e-05, "loss": 1.4489, "step": 1600 }, { "epoch": 8.75, "learning_rate": 3.6097785977859786e-05, "loss": 1.4202, "step": 1610 }, { "epoch": 8.8, "learning_rate": 3.6005535055350556e-05, "loss": 1.3961, "step": 1620 }, { "epoch": 8.86, "learning_rate": 3.591328413284133e-05, "loss": 1.388, "step": 1630 }, { "epoch": 8.91, "learning_rate": 3.58210332103321e-05, "loss": 1.4252, "step": 1640 }, { "epoch": 8.97, "learning_rate": 3.572878228782288e-05, "loss": 1.3828, "step": 1650 }, { "epoch": 9.0, "eval_loss": 1.5400218963623047, "eval_runtime": 218.8536, "eval_samples_per_second": 8.979, "eval_steps_per_second": 0.749, "eval_wer": 0.9106955825272627, "step": 1656 }, { "epoch": 9.02, "learning_rate": 3.563653136531365e-05, "loss": 1.4439, "step": 1660 }, { "epoch": 9.08, "learning_rate": 3.554428044280443e-05, "loss": 1.3608, "step": 1670 }, { "epoch": 9.13, "learning_rate": 3.5452029520295204e-05, "loss": 1.3713, "step": 1680 }, { "epoch": 9.18, "learning_rate": 3.535977859778598e-05, "loss": 1.3797, "step": 1690 }, { "epoch": 9.24, "learning_rate": 3.526752767527676e-05, "loss": 1.3647, "step": 1700 }, { "epoch": 9.29, "learning_rate": 3.517527675276753e-05, "loss": 1.4327, "step": 1710 }, { "epoch": 9.35, "learning_rate": 3.5083025830258304e-05, "loss": 1.379, "step": 1720 }, { "epoch": 9.4, "learning_rate": 3.499077490774908e-05, "loss": 1.3915, "step": 1730 }, { "epoch": 9.46, "learning_rate": 3.489852398523986e-05, "loss": 1.3589, "step": 1740 }, { "epoch": 9.51, "learning_rate": 3.480627306273063e-05, "loss": 1.3815, "step": 1750 }, { "epoch": 9.56, "learning_rate": 3.4714022140221405e-05, "loss": 1.4257, "step": 1760 }, { "epoch": 9.62, "learning_rate": 3.462177121771218e-05, "loss": 1.3687, "step": 1770 }, { "epoch": 9.67, "learning_rate": 3.452952029520295e-05, "loss": 1.3827, "step": 1780 }, { "epoch": 9.73, "learning_rate": 3.443726937269373e-05, "loss": 1.3821, "step": 1790 }, { "epoch": 9.78, "learning_rate": 3.43450184501845e-05, "loss": 1.4062, "step": 1800 }, { "epoch": 9.84, "learning_rate": 3.4252767527675276e-05, "loss": 1.3866, "step": 1810 }, { "epoch": 9.89, "learning_rate": 3.416051660516605e-05, "loss": 1.3911, "step": 1820 }, { "epoch": 9.94, "learning_rate": 3.406826568265683e-05, "loss": 1.3684, "step": 1830 }, { "epoch": 10.0, "learning_rate": 3.39760147601476e-05, "loss": 1.3966, "step": 1840 }, { "epoch": 10.0, "eval_loss": 1.5545392036437988, "eval_runtime": 220.6411, "eval_samples_per_second": 8.906, "eval_steps_per_second": 0.743, "eval_wer": 0.9288706795637977, "step": 1840 }, { "epoch": 10.05, "learning_rate": 3.388376383763838e-05, "loss": 1.402, "step": 1850 }, { "epoch": 10.11, "learning_rate": 3.3791512915129154e-05, "loss": 1.377, "step": 1860 }, { "epoch": 10.16, "learning_rate": 3.369926199261993e-05, "loss": 1.3761, "step": 1870 }, { "epoch": 10.22, "learning_rate": 3.360701107011071e-05, "loss": 1.3519, "step": 1880 }, { "epoch": 10.27, "learning_rate": 3.351476014760148e-05, "loss": 1.3709, "step": 1890 }, { "epoch": 10.33, "learning_rate": 3.3422509225092255e-05, "loss": 1.3538, "step": 1900 }, { "epoch": 10.38, "learning_rate": 3.3330258302583025e-05, "loss": 1.3532, "step": 1910 }, { "epoch": 10.43, "learning_rate": 3.32380073800738e-05, "loss": 1.3535, "step": 1920 }, { "epoch": 10.49, "learning_rate": 3.314575645756457e-05, "loss": 1.3521, "step": 1930 }, { "epoch": 10.54, "learning_rate": 3.305350553505535e-05, "loss": 1.3746, "step": 1940 }, { "epoch": 10.6, "learning_rate": 3.2961254612546126e-05, "loss": 1.3443, "step": 1950 }, { "epoch": 10.65, "learning_rate": 3.28690036900369e-05, "loss": 1.3662, "step": 1960 }, { "epoch": 10.71, "learning_rate": 3.277675276752767e-05, "loss": 1.3685, "step": 1970 }, { "epoch": 10.76, "learning_rate": 3.268450184501845e-05, "loss": 1.3618, "step": 1980 }, { "epoch": 10.81, "learning_rate": 3.259225092250923e-05, "loss": 1.3612, "step": 1990 }, { "epoch": 10.87, "learning_rate": 3.2500000000000004e-05, "loss": 1.3651, "step": 2000 }, { "epoch": 10.92, "learning_rate": 3.240774907749078e-05, "loss": 1.3502, "step": 2010 }, { "epoch": 10.98, "learning_rate": 3.231549815498155e-05, "loss": 1.3481, "step": 2020 }, { "epoch": 11.0, "eval_loss": 1.737160086631775, "eval_runtime": 221.0608, "eval_samples_per_second": 8.889, "eval_steps_per_second": 0.742, "eval_wer": 0.9772349208305096, "step": 2024 }, { "epoch": 11.03, "learning_rate": 3.222324723247233e-05, "loss": 1.41, "step": 2030 }, { "epoch": 11.09, "learning_rate": 3.2130996309963105e-05, "loss": 1.3683, "step": 2040 }, { "epoch": 11.14, "learning_rate": 3.2038745387453875e-05, "loss": 1.3357, "step": 2050 }, { "epoch": 11.2, "learning_rate": 3.1946494464944645e-05, "loss": 1.3276, "step": 2060 }, { "epoch": 11.25, "learning_rate": 3.185424354243542e-05, "loss": 1.3485, "step": 2070 }, { "epoch": 11.3, "learning_rate": 3.17619926199262e-05, "loss": 1.3791, "step": 2080 }, { "epoch": 11.36, "learning_rate": 3.1669741697416976e-05, "loss": 1.3541, "step": 2090 }, { "epoch": 11.41, "learning_rate": 3.157749077490775e-05, "loss": 1.3506, "step": 2100 }, { "epoch": 11.47, "learning_rate": 3.148523985239852e-05, "loss": 1.3192, "step": 2110 }, { "epoch": 11.52, "learning_rate": 3.13929889298893e-05, "loss": 1.3409, "step": 2120 }, { "epoch": 11.58, "learning_rate": 3.130073800738008e-05, "loss": 1.3269, "step": 2130 }, { "epoch": 11.63, "learning_rate": 3.1208487084870854e-05, "loss": 1.3429, "step": 2140 }, { "epoch": 11.68, "learning_rate": 3.1116236162361624e-05, "loss": 1.36, "step": 2150 }, { "epoch": 11.74, "learning_rate": 3.10239852398524e-05, "loss": 1.3443, "step": 2160 }, { "epoch": 11.79, "learning_rate": 3.093173431734318e-05, "loss": 1.3399, "step": 2170 }, { "epoch": 11.85, "learning_rate": 3.0839483394833955e-05, "loss": 1.3504, "step": 2180 }, { "epoch": 11.9, "learning_rate": 3.0747232472324725e-05, "loss": 1.3432, "step": 2190 }, { "epoch": 11.96, "learning_rate": 3.0654981549815495e-05, "loss": 1.3437, "step": 2200 }, { "epoch": 12.0, "eval_loss": 1.509622573852539, "eval_runtime": 220.9076, "eval_samples_per_second": 8.895, "eval_steps_per_second": 0.742, "eval_wer": 0.9207072885219642, "step": 2208 }, { "epoch": 12.01, "learning_rate": 3.056273062730627e-05, "loss": 1.4016, "step": 2210 }, { "epoch": 12.07, "learning_rate": 3.047047970479705e-05, "loss": 1.3043, "step": 2220 }, { "epoch": 12.12, "learning_rate": 3.0378228782287826e-05, "loss": 1.3303, "step": 2230 }, { "epoch": 12.17, "learning_rate": 3.0285977859778596e-05, "loss": 1.3502, "step": 2240 }, { "epoch": 12.23, "learning_rate": 3.0193726937269373e-05, "loss": 1.3281, "step": 2250 }, { "epoch": 12.28, "learning_rate": 3.010147601476015e-05, "loss": 1.3209, "step": 2260 }, { "epoch": 12.34, "learning_rate": 3.0009225092250926e-05, "loss": 1.3475, "step": 2270 }, { "epoch": 12.39, "learning_rate": 2.9916974169741697e-05, "loss": 1.3149, "step": 2280 }, { "epoch": 12.45, "learning_rate": 2.9824723247232474e-05, "loss": 1.3076, "step": 2290 }, { "epoch": 12.5, "learning_rate": 2.9732472324723247e-05, "loss": 1.3312, "step": 2300 }, { "epoch": 12.55, "learning_rate": 2.9640221402214024e-05, "loss": 1.3493, "step": 2310 }, { "epoch": 12.61, "learning_rate": 2.95479704797048e-05, "loss": 1.3236, "step": 2320 }, { "epoch": 12.66, "learning_rate": 2.945571955719557e-05, "loss": 1.3417, "step": 2330 }, { "epoch": 12.72, "learning_rate": 2.9363468634686348e-05, "loss": 1.3362, "step": 2340 }, { "epoch": 12.77, "learning_rate": 2.9271217712177125e-05, "loss": 1.3405, "step": 2350 }, { "epoch": 12.82, "learning_rate": 2.91789667896679e-05, "loss": 1.3312, "step": 2360 }, { "epoch": 12.88, "learning_rate": 2.9086715867158672e-05, "loss": 1.3392, "step": 2370 }, { "epoch": 12.93, "learning_rate": 2.8994464944649445e-05, "loss": 1.2999, "step": 2380 }, { "epoch": 12.99, "learning_rate": 2.8902214022140222e-05, "loss": 1.3207, "step": 2390 }, { "epoch": 13.0, "eval_loss": 1.5559078454971313, "eval_runtime": 221.3456, "eval_samples_per_second": 8.878, "eval_steps_per_second": 0.741, "eval_wer": 0.9220627194874007, "step": 2392 }, { "epoch": 13.04, "learning_rate": 2.8809963099631e-05, "loss": 1.3472, "step": 2400 }, { "epoch": 13.1, "learning_rate": 2.8717712177121776e-05, "loss": 1.2897, "step": 2410 }, { "epoch": 13.15, "learning_rate": 2.8625461254612546e-05, "loss": 1.3077, "step": 2420 }, { "epoch": 13.21, "learning_rate": 2.8533210332103323e-05, "loss": 1.3125, "step": 2430 }, { "epoch": 13.26, "learning_rate": 2.8440959409594097e-05, "loss": 1.3425, "step": 2440 }, { "epoch": 13.31, "learning_rate": 2.8348708487084874e-05, "loss": 1.3392, "step": 2450 }, { "epoch": 13.37, "learning_rate": 2.8256457564575644e-05, "loss": 1.2951, "step": 2460 }, { "epoch": 13.42, "learning_rate": 2.816420664206642e-05, "loss": 1.2996, "step": 2470 }, { "epoch": 13.48, "learning_rate": 2.8071955719557198e-05, "loss": 1.2869, "step": 2480 }, { "epoch": 13.53, "learning_rate": 2.7979704797047975e-05, "loss": 1.3016, "step": 2490 }, { "epoch": 13.59, "learning_rate": 2.7887453874538748e-05, "loss": 1.2765, "step": 2500 }, { "epoch": 13.64, "learning_rate": 2.7795202952029518e-05, "loss": 1.3083, "step": 2510 }, { "epoch": 13.69, "learning_rate": 2.7702952029520295e-05, "loss": 1.3109, "step": 2520 }, { "epoch": 13.75, "learning_rate": 2.7610701107011072e-05, "loss": 1.3079, "step": 2530 }, { "epoch": 13.8, "learning_rate": 2.751845018450185e-05, "loss": 1.2955, "step": 2540 }, { "epoch": 13.86, "learning_rate": 2.742619926199262e-05, "loss": 1.3101, "step": 2550 }, { "epoch": 13.91, "learning_rate": 2.7333948339483396e-05, "loss": 1.3213, "step": 2560 }, { "epoch": 13.97, "learning_rate": 2.724169741697417e-05, "loss": 1.3103, "step": 2570 }, { "epoch": 14.0, "eval_loss": 1.5284996032714844, "eval_runtime": 219.5072, "eval_samples_per_second": 8.952, "eval_steps_per_second": 0.747, "eval_wer": 0.9241882816831988, "step": 2576 }, { "epoch": 14.02, "learning_rate": 2.7149446494464946e-05, "loss": 1.3567, "step": 2580 }, { "epoch": 14.08, "learning_rate": 2.7057195571955723e-05, "loss": 1.2752, "step": 2590 }, { "epoch": 14.13, "learning_rate": 2.6964944649446494e-05, "loss": 1.2801, "step": 2600 }, { "epoch": 14.18, "learning_rate": 2.687269372693727e-05, "loss": 1.2902, "step": 2610 }, { "epoch": 14.24, "learning_rate": 2.6780442804428047e-05, "loss": 1.3133, "step": 2620 }, { "epoch": 14.29, "learning_rate": 2.668819188191882e-05, "loss": 1.33, "step": 2630 }, { "epoch": 14.35, "learning_rate": 2.6595940959409594e-05, "loss": 1.2925, "step": 2640 }, { "epoch": 14.4, "learning_rate": 2.6503690036900368e-05, "loss": 1.2757, "step": 2650 }, { "epoch": 14.46, "learning_rate": 2.6411439114391145e-05, "loss": 1.3123, "step": 2660 }, { "epoch": 14.51, "learning_rate": 2.6319188191881922e-05, "loss": 1.3476, "step": 2670 }, { "epoch": 14.56, "learning_rate": 2.6226937269372692e-05, "loss": 1.3034, "step": 2680 }, { "epoch": 14.62, "learning_rate": 2.613468634686347e-05, "loss": 1.2937, "step": 2690 }, { "epoch": 14.67, "learning_rate": 2.6042435424354246e-05, "loss": 1.29, "step": 2700 }, { "epoch": 14.73, "learning_rate": 2.595018450184502e-05, "loss": 1.2854, "step": 2710 }, { "epoch": 14.78, "learning_rate": 2.5857933579335796e-05, "loss": 1.3069, "step": 2720 }, { "epoch": 14.84, "learning_rate": 2.5765682656826566e-05, "loss": 1.2989, "step": 2730 }, { "epoch": 14.89, "learning_rate": 2.5673431734317343e-05, "loss": 1.2746, "step": 2740 }, { "epoch": 14.94, "learning_rate": 2.558118081180812e-05, "loss": 1.2927, "step": 2750 }, { "epoch": 15.0, "learning_rate": 2.5488929889298897e-05, "loss": 1.3032, "step": 2760 }, { "epoch": 15.0, "eval_loss": 1.5296591520309448, "eval_runtime": 220.4741, "eval_samples_per_second": 8.913, "eval_steps_per_second": 0.744, "eval_wer": 0.8982502618446183, "step": 2760 }, { "epoch": 15.05, "learning_rate": 2.5396678966789667e-05, "loss": 1.3075, "step": 2770 }, { "epoch": 15.11, "learning_rate": 2.5304428044280444e-05, "loss": 1.2563, "step": 2780 }, { "epoch": 15.16, "learning_rate": 2.5212177121771218e-05, "loss": 1.2831, "step": 2790 }, { "epoch": 15.22, "learning_rate": 2.5119926199261995e-05, "loss": 1.2732, "step": 2800 }, { "epoch": 15.27, "learning_rate": 2.502767527675277e-05, "loss": 1.2719, "step": 2810 }, { "epoch": 15.33, "learning_rate": 2.4935424354243545e-05, "loss": 1.2681, "step": 2820 }, { "epoch": 15.38, "learning_rate": 2.484317343173432e-05, "loss": 1.2808, "step": 2830 }, { "epoch": 15.43, "learning_rate": 2.4750922509225095e-05, "loss": 1.269, "step": 2840 }, { "epoch": 15.49, "learning_rate": 2.465867158671587e-05, "loss": 1.263, "step": 2850 }, { "epoch": 15.54, "learning_rate": 2.4566420664206643e-05, "loss": 1.285, "step": 2860 }, { "epoch": 15.6, "learning_rate": 2.4474169741697416e-05, "loss": 1.2751, "step": 2870 }, { "epoch": 15.65, "learning_rate": 2.4381918819188193e-05, "loss": 1.2568, "step": 2880 }, { "epoch": 15.71, "learning_rate": 2.428966789667897e-05, "loss": 1.2709, "step": 2890 }, { "epoch": 15.76, "learning_rate": 2.4197416974169743e-05, "loss": 1.307, "step": 2900 }, { "epoch": 15.81, "learning_rate": 2.410516605166052e-05, "loss": 1.2745, "step": 2910 }, { "epoch": 15.87, "learning_rate": 2.401291512915129e-05, "loss": 1.2816, "step": 2920 }, { "epoch": 15.92, "learning_rate": 2.3920664206642067e-05, "loss": 1.2611, "step": 2930 }, { "epoch": 15.98, "learning_rate": 2.382841328413284e-05, "loss": 1.2549, "step": 2940 }, { "epoch": 16.0, "eval_loss": 1.5480983257293701, "eval_runtime": 219.5217, "eval_samples_per_second": 8.951, "eval_steps_per_second": 0.747, "eval_wer": 0.9074918366089582, "step": 2944 }, { "epoch": 16.03, "learning_rate": 2.3736162361623618e-05, "loss": 1.2909, "step": 2950 }, { "epoch": 16.09, "learning_rate": 2.364391143911439e-05, "loss": 1.2522, "step": 2960 }, { "epoch": 16.14, "learning_rate": 2.3551660516605168e-05, "loss": 1.2484, "step": 2970 }, { "epoch": 16.2, "learning_rate": 2.3459409594095942e-05, "loss": 1.2431, "step": 2980 }, { "epoch": 16.25, "learning_rate": 2.3367158671586715e-05, "loss": 1.2808, "step": 2990 }, { "epoch": 16.3, "learning_rate": 2.3274907749077492e-05, "loss": 1.2708, "step": 3000 }, { "epoch": 16.36, "learning_rate": 2.3182656826568266e-05, "loss": 1.2528, "step": 3010 }, { "epoch": 16.41, "learning_rate": 2.3090405904059043e-05, "loss": 1.2538, "step": 3020 }, { "epoch": 16.47, "learning_rate": 2.2998154981549816e-05, "loss": 1.2554, "step": 3030 }, { "epoch": 16.52, "learning_rate": 2.2905904059040593e-05, "loss": 1.2524, "step": 3040 }, { "epoch": 16.58, "learning_rate": 2.2813653136531367e-05, "loss": 1.2464, "step": 3050 }, { "epoch": 16.63, "learning_rate": 2.272140221402214e-05, "loss": 1.2598, "step": 3060 }, { "epoch": 16.68, "learning_rate": 2.2629151291512914e-05, "loss": 1.2538, "step": 3070 }, { "epoch": 16.74, "learning_rate": 2.253690036900369e-05, "loss": 1.2501, "step": 3080 }, { "epoch": 16.79, "learning_rate": 2.2444649446494468e-05, "loss": 1.2672, "step": 3090 }, { "epoch": 16.85, "learning_rate": 2.235239852398524e-05, "loss": 1.2615, "step": 3100 }, { "epoch": 16.9, "learning_rate": 2.2260147601476018e-05, "loss": 1.253, "step": 3110 }, { "epoch": 16.96, "learning_rate": 2.216789667896679e-05, "loss": 1.2484, "step": 3120 }, { "epoch": 17.0, "eval_loss": 1.588557481765747, "eval_runtime": 219.807, "eval_samples_per_second": 8.94, "eval_steps_per_second": 0.746, "eval_wer": 0.9191054155628119, "step": 3128 }, { "epoch": 17.01, "learning_rate": 2.2075645756457565e-05, "loss": 1.2893, "step": 3130 }, { "epoch": 17.07, "learning_rate": 2.198339483394834e-05, "loss": 1.2316, "step": 3140 }, { "epoch": 17.12, "learning_rate": 2.1891143911439116e-05, "loss": 1.2376, "step": 3150 }, { "epoch": 17.17, "learning_rate": 2.179889298892989e-05, "loss": 1.2401, "step": 3160 }, { "epoch": 17.23, "learning_rate": 2.1706642066420666e-05, "loss": 1.2411, "step": 3170 }, { "epoch": 17.28, "learning_rate": 2.161439114391144e-05, "loss": 1.2658, "step": 3180 }, { "epoch": 17.34, "learning_rate": 2.1522140221402216e-05, "loss": 1.226, "step": 3190 }, { "epoch": 17.39, "learning_rate": 2.142988929889299e-05, "loss": 1.2405, "step": 3200 }, { "epoch": 17.45, "learning_rate": 2.1337638376383763e-05, "loss": 1.23, "step": 3210 }, { "epoch": 17.5, "learning_rate": 2.124538745387454e-05, "loss": 1.2426, "step": 3220 }, { "epoch": 17.55, "learning_rate": 2.1153136531365314e-05, "loss": 1.2501, "step": 3230 }, { "epoch": 17.61, "learning_rate": 2.106088560885609e-05, "loss": 1.2313, "step": 3240 }, { "epoch": 17.66, "learning_rate": 2.0968634686346864e-05, "loss": 1.2385, "step": 3250 }, { "epoch": 17.72, "learning_rate": 2.087638376383764e-05, "loss": 1.2405, "step": 3260 }, { "epoch": 17.77, "learning_rate": 2.0784132841328415e-05, "loss": 1.2535, "step": 3270 }, { "epoch": 17.82, "learning_rate": 2.069188191881919e-05, "loss": 1.2412, "step": 3280 }, { "epoch": 17.88, "learning_rate": 2.0599630996309965e-05, "loss": 1.2307, "step": 3290 }, { "epoch": 17.93, "learning_rate": 2.050738007380074e-05, "loss": 1.2338, "step": 3300 }, { "epoch": 17.99, "learning_rate": 2.0415129151291516e-05, "loss": 1.2282, "step": 3310 }, { "epoch": 18.0, "eval_loss": 1.6610581874847412, "eval_runtime": 219.6691, "eval_samples_per_second": 8.945, "eval_steps_per_second": 0.747, "eval_wer": 0.923079292711478, "step": 3312 }, { "epoch": 18.04, "learning_rate": 2.032287822878229e-05, "loss": 1.2804, "step": 3320 }, { "epoch": 18.1, "learning_rate": 2.0230627306273066e-05, "loss": 1.2429, "step": 3330 }, { "epoch": 18.15, "learning_rate": 2.0138376383763836e-05, "loss": 1.2481, "step": 3340 }, { "epoch": 18.21, "learning_rate": 2.0046125461254613e-05, "loss": 1.2284, "step": 3350 }, { "epoch": 18.26, "learning_rate": 1.9953874538745387e-05, "loss": 1.2524, "step": 3360 }, { "epoch": 18.31, "learning_rate": 1.9861623616236164e-05, "loss": 1.2245, "step": 3370 }, { "epoch": 18.37, "learning_rate": 1.9769372693726937e-05, "loss": 1.2177, "step": 3380 }, { "epoch": 18.42, "learning_rate": 1.9677121771217714e-05, "loss": 1.2052, "step": 3390 }, { "epoch": 18.48, "learning_rate": 1.9584870848708488e-05, "loss": 1.2303, "step": 3400 }, { "epoch": 18.53, "learning_rate": 1.949261992619926e-05, "loss": 1.2293, "step": 3410 }, { "epoch": 18.59, "learning_rate": 1.9400369003690038e-05, "loss": 1.2192, "step": 3420 }, { "epoch": 18.64, "learning_rate": 1.930811808118081e-05, "loss": 1.2228, "step": 3430 }, { "epoch": 18.69, "learning_rate": 1.921586715867159e-05, "loss": 1.208, "step": 3440 }, { "epoch": 18.75, "learning_rate": 1.9123616236162362e-05, "loss": 1.2228, "step": 3450 }, { "epoch": 18.8, "learning_rate": 1.903136531365314e-05, "loss": 1.2251, "step": 3460 }, { "epoch": 18.86, "learning_rate": 1.8939114391143912e-05, "loss": 1.2179, "step": 3470 }, { "epoch": 18.91, "learning_rate": 1.8846863468634686e-05, "loss": 1.2173, "step": 3480 }, { "epoch": 18.97, "learning_rate": 1.8754612546125463e-05, "loss": 1.2168, "step": 3490 }, { "epoch": 19.0, "eval_loss": 1.636816143989563, "eval_runtime": 220.9463, "eval_samples_per_second": 8.894, "eval_steps_per_second": 0.742, "eval_wer": 0.9149775121680734, "step": 3496 }, { "epoch": 19.02, "learning_rate": 1.8662361623616236e-05, "loss": 1.2467, "step": 3500 }, { "epoch": 19.08, "learning_rate": 1.8570110701107013e-05, "loss": 1.2048, "step": 3510 }, { "epoch": 19.13, "learning_rate": 1.8477859778597787e-05, "loss": 1.203, "step": 3520 }, { "epoch": 19.18, "learning_rate": 1.8385608856088564e-05, "loss": 1.2151, "step": 3530 }, { "epoch": 19.24, "learning_rate": 1.8293357933579337e-05, "loss": 1.2042, "step": 3540 }, { "epoch": 19.29, "learning_rate": 1.820110701107011e-05, "loss": 1.2146, "step": 3550 }, { "epoch": 19.35, "learning_rate": 1.8108856088560884e-05, "loss": 1.2127, "step": 3560 }, { "epoch": 19.4, "learning_rate": 1.801660516605166e-05, "loss": 1.2021, "step": 3570 }, { "epoch": 19.46, "learning_rate": 1.7924354243542435e-05, "loss": 1.2059, "step": 3580 }, { "epoch": 19.51, "learning_rate": 1.7832103321033212e-05, "loss": 1.2075, "step": 3590 }, { "epoch": 19.56, "learning_rate": 1.773985239852399e-05, "loss": 1.2118, "step": 3600 }, { "epoch": 19.62, "learning_rate": 1.7647601476014762e-05, "loss": 1.2135, "step": 3610 }, { "epoch": 19.67, "learning_rate": 1.7555350553505536e-05, "loss": 1.2008, "step": 3620 }, { "epoch": 19.73, "learning_rate": 1.746309963099631e-05, "loss": 1.2102, "step": 3630 }, { "epoch": 19.78, "learning_rate": 1.7370848708487086e-05, "loss": 1.2349, "step": 3640 }, { "epoch": 19.84, "learning_rate": 1.727859778597786e-05, "loss": 1.2011, "step": 3650 }, { "epoch": 19.89, "learning_rate": 1.7186346863468637e-05, "loss": 1.2031, "step": 3660 }, { "epoch": 19.94, "learning_rate": 1.709409594095941e-05, "loss": 1.2197, "step": 3670 }, { "epoch": 20.0, "learning_rate": 1.7001845018450187e-05, "loss": 1.2093, "step": 3680 }, { "epoch": 20.0, "eval_loss": 1.7357299327850342, "eval_runtime": 220.1926, "eval_samples_per_second": 8.924, "eval_steps_per_second": 0.745, "eval_wer": 0.9135296654549935, "step": 3680 }, { "epoch": 20.05, "learning_rate": 1.690959409594096e-05, "loss": 1.2218, "step": 3690 }, { "epoch": 20.11, "learning_rate": 1.6817343173431734e-05, "loss": 1.1965, "step": 3700 }, { "epoch": 20.16, "learning_rate": 1.672509225092251e-05, "loss": 1.1916, "step": 3710 }, { "epoch": 20.22, "learning_rate": 1.6632841328413285e-05, "loss": 1.193, "step": 3720 }, { "epoch": 20.27, "learning_rate": 1.654059040590406e-05, "loss": 1.195, "step": 3730 }, { "epoch": 20.33, "learning_rate": 1.6448339483394835e-05, "loss": 1.1937, "step": 3740 }, { "epoch": 20.38, "learning_rate": 1.635608856088561e-05, "loss": 1.2048, "step": 3750 }, { "epoch": 20.43, "learning_rate": 1.6263837638376382e-05, "loss": 1.2026, "step": 3760 }, { "epoch": 20.49, "learning_rate": 1.617158671586716e-05, "loss": 1.1981, "step": 3770 }, { "epoch": 20.54, "learning_rate": 1.6079335793357932e-05, "loss": 1.1945, "step": 3780 }, { "epoch": 20.6, "learning_rate": 1.598708487084871e-05, "loss": 1.1897, "step": 3790 }, { "epoch": 20.65, "learning_rate": 1.5894833948339486e-05, "loss": 1.1888, "step": 3800 }, { "epoch": 20.71, "learning_rate": 1.580258302583026e-05, "loss": 1.1893, "step": 3810 }, { "epoch": 20.76, "learning_rate": 1.5710332103321033e-05, "loss": 1.1965, "step": 3820 }, { "epoch": 20.81, "learning_rate": 1.5618081180811807e-05, "loss": 1.1981, "step": 3830 }, { "epoch": 20.87, "learning_rate": 1.5525830258302584e-05, "loss": 1.1882, "step": 3840 }, { "epoch": 20.92, "learning_rate": 1.5433579335793357e-05, "loss": 1.2048, "step": 3850 }, { "epoch": 20.98, "learning_rate": 1.5341328413284134e-05, "loss": 1.1951, "step": 3860 }, { "epoch": 21.0, "eval_loss": 1.6972588300704956, "eval_runtime": 221.9349, "eval_samples_per_second": 8.854, "eval_steps_per_second": 0.739, "eval_wer": 0.9076458628550305, "step": 3864 }, { "epoch": 21.03, "learning_rate": 1.5249077490774908e-05, "loss": 1.2165, "step": 3870 }, { "epoch": 21.09, "learning_rate": 1.5156826568265683e-05, "loss": 1.1675, "step": 3880 }, { "epoch": 21.14, "learning_rate": 1.506457564575646e-05, "loss": 1.1787, "step": 3890 }, { "epoch": 21.2, "learning_rate": 1.4972324723247233e-05, "loss": 1.1614, "step": 3900 }, { "epoch": 21.25, "learning_rate": 1.4880073800738009e-05, "loss": 1.172, "step": 3910 }, { "epoch": 21.3, "learning_rate": 1.4787822878228782e-05, "loss": 1.1791, "step": 3920 }, { "epoch": 21.36, "learning_rate": 1.4695571955719559e-05, "loss": 1.1758, "step": 3930 }, { "epoch": 21.41, "learning_rate": 1.4603321033210333e-05, "loss": 1.1692, "step": 3940 }, { "epoch": 21.47, "learning_rate": 1.4511070110701108e-05, "loss": 1.1734, "step": 3950 }, { "epoch": 21.52, "learning_rate": 1.4418819188191881e-05, "loss": 1.1965, "step": 3960 }, { "epoch": 21.58, "learning_rate": 1.4326568265682658e-05, "loss": 1.1836, "step": 3970 }, { "epoch": 21.63, "learning_rate": 1.4234317343173432e-05, "loss": 1.1716, "step": 3980 }, { "epoch": 21.68, "learning_rate": 1.4142066420664207e-05, "loss": 1.1902, "step": 3990 }, { "epoch": 21.74, "learning_rate": 1.4049815498154984e-05, "loss": 1.1919, "step": 4000 }, { "epoch": 21.79, "learning_rate": 1.3957564575645758e-05, "loss": 1.1896, "step": 4010 }, { "epoch": 21.85, "learning_rate": 1.3865313653136533e-05, "loss": 1.1664, "step": 4020 }, { "epoch": 21.9, "learning_rate": 1.3773062730627306e-05, "loss": 1.1782, "step": 4030 }, { "epoch": 21.96, "learning_rate": 1.3680811808118083e-05, "loss": 1.1835, "step": 4040 }, { "epoch": 22.0, "eval_loss": 1.7048912048339844, "eval_runtime": 221.2004, "eval_samples_per_second": 8.883, "eval_steps_per_second": 0.741, "eval_wer": 0.9170106586162282, "step": 4048 }, { "epoch": 22.01, "learning_rate": 1.3588560885608857e-05, "loss": 1.2062, "step": 4050 }, { "epoch": 22.07, "learning_rate": 1.3496309963099632e-05, "loss": 1.1691, "step": 4060 }, { "epoch": 22.12, "learning_rate": 1.3404059040590405e-05, "loss": 1.1526, "step": 4070 }, { "epoch": 22.17, "learning_rate": 1.3311808118081182e-05, "loss": 1.1604, "step": 4080 }, { "epoch": 22.23, "learning_rate": 1.3219557195571958e-05, "loss": 1.1781, "step": 4090 }, { "epoch": 22.28, "learning_rate": 1.3127306273062731e-05, "loss": 1.158, "step": 4100 }, { "epoch": 22.34, "learning_rate": 1.3035055350553508e-05, "loss": 1.1649, "step": 4110 }, { "epoch": 22.39, "learning_rate": 1.294280442804428e-05, "loss": 1.1725, "step": 4120 }, { "epoch": 22.45, "learning_rate": 1.2850553505535057e-05, "loss": 1.1674, "step": 4130 }, { "epoch": 22.5, "learning_rate": 1.275830258302583e-05, "loss": 1.167, "step": 4140 }, { "epoch": 22.55, "learning_rate": 1.2666051660516606e-05, "loss": 1.1704, "step": 4150 }, { "epoch": 22.61, "learning_rate": 1.2573800738007379e-05, "loss": 1.1729, "step": 4160 }, { "epoch": 22.66, "learning_rate": 1.2481549815498156e-05, "loss": 1.1703, "step": 4170 }, { "epoch": 22.72, "learning_rate": 1.2389298892988931e-05, "loss": 1.1664, "step": 4180 }, { "epoch": 22.77, "learning_rate": 1.2297047970479705e-05, "loss": 1.1594, "step": 4190 }, { "epoch": 22.82, "learning_rate": 1.220479704797048e-05, "loss": 1.1583, "step": 4200 }, { "epoch": 22.88, "learning_rate": 1.2112546125461255e-05, "loss": 1.1555, "step": 4210 }, { "epoch": 22.93, "learning_rate": 1.202029520295203e-05, "loss": 1.1585, "step": 4220 }, { "epoch": 22.99, "learning_rate": 1.1928044280442804e-05, "loss": 1.1554, "step": 4230 }, { "epoch": 23.0, "eval_loss": 1.766296625137329, "eval_runtime": 221.7981, "eval_samples_per_second": 8.859, "eval_steps_per_second": 0.739, "eval_wer": 0.9182428685848069, "step": 4232 }, { "epoch": 23.04, "learning_rate": 1.183579335793358e-05, "loss": 1.1897, "step": 4240 }, { "epoch": 23.1, "learning_rate": 1.1743542435424356e-05, "loss": 1.1549, "step": 4250 }, { "epoch": 23.15, "learning_rate": 1.165129151291513e-05, "loss": 1.1544, "step": 4260 }, { "epoch": 23.21, "learning_rate": 1.1559040590405905e-05, "loss": 1.1362, "step": 4270 }, { "epoch": 23.26, "learning_rate": 1.146678966789668e-05, "loss": 1.1507, "step": 4280 }, { "epoch": 23.31, "learning_rate": 1.1374538745387454e-05, "loss": 1.1564, "step": 4290 }, { "epoch": 23.37, "learning_rate": 1.1282287822878229e-05, "loss": 1.1528, "step": 4300 }, { "epoch": 23.42, "learning_rate": 1.1190036900369004e-05, "loss": 1.1463, "step": 4310 }, { "epoch": 23.48, "learning_rate": 1.109778597785978e-05, "loss": 1.1399, "step": 4320 }, { "epoch": 23.53, "learning_rate": 1.1005535055350553e-05, "loss": 1.1491, "step": 4330 }, { "epoch": 23.59, "learning_rate": 1.091328413284133e-05, "loss": 1.1513, "step": 4340 }, { "epoch": 23.64, "learning_rate": 1.0821033210332105e-05, "loss": 1.1494, "step": 4350 }, { "epoch": 23.69, "learning_rate": 1.0728782287822878e-05, "loss": 1.1412, "step": 4360 }, { "epoch": 23.75, "learning_rate": 1.0636531365313654e-05, "loss": 1.1553, "step": 4370 }, { "epoch": 23.8, "learning_rate": 1.0544280442804429e-05, "loss": 1.1469, "step": 4380 }, { "epoch": 23.86, "learning_rate": 1.0452029520295204e-05, "loss": 1.1468, "step": 4390 }, { "epoch": 23.91, "learning_rate": 1.0359778597785978e-05, "loss": 1.1551, "step": 4400 }, { "epoch": 23.97, "learning_rate": 1.0267527675276753e-05, "loss": 1.1418, "step": 4410 }, { "epoch": 24.0, "eval_loss": 1.6813879013061523, "eval_runtime": 216.1625, "eval_samples_per_second": 9.09, "eval_steps_per_second": 0.759, "eval_wer": 0.9133756392089212, "step": 4416 }, { "epoch": 24.02, "learning_rate": 1.0175276752767528e-05, "loss": 1.1671, "step": 4420 }, { "epoch": 24.08, "learning_rate": 1.0083025830258303e-05, "loss": 1.1418, "step": 4430 }, { "epoch": 24.13, "learning_rate": 9.990774907749079e-06, "loss": 1.1243, "step": 4440 }, { "epoch": 24.18, "learning_rate": 9.898523985239854e-06, "loss": 1.146, "step": 4450 }, { "epoch": 24.24, "learning_rate": 9.806273062730629e-06, "loss": 1.1317, "step": 4460 }, { "epoch": 24.29, "learning_rate": 9.714022140221402e-06, "loss": 1.1511, "step": 4470 }, { "epoch": 24.35, "learning_rate": 9.621771217712178e-06, "loss": 1.1261, "step": 4480 }, { "epoch": 24.4, "learning_rate": 9.529520295202953e-06, "loss": 1.13, "step": 4490 }, { "epoch": 24.46, "learning_rate": 9.437269372693726e-06, "loss": 1.1225, "step": 4500 }, { "epoch": 24.51, "learning_rate": 9.345018450184502e-06, "loss": 1.1406, "step": 4510 }, { "epoch": 24.56, "learning_rate": 9.252767527675277e-06, "loss": 1.1353, "step": 4520 }, { "epoch": 24.62, "learning_rate": 9.160516605166052e-06, "loss": 1.1483, "step": 4530 }, { "epoch": 24.67, "learning_rate": 9.068265682656827e-06, "loss": 1.1212, "step": 4540 }, { "epoch": 24.73, "learning_rate": 8.976014760147603e-06, "loss": 1.1156, "step": 4550 }, { "epoch": 24.78, "learning_rate": 8.883763837638378e-06, "loss": 1.1244, "step": 4560 }, { "epoch": 24.84, "learning_rate": 8.791512915129151e-06, "loss": 1.1211, "step": 4570 }, { "epoch": 24.89, "learning_rate": 8.699261992619927e-06, "loss": 1.128, "step": 4580 }, { "epoch": 24.94, "learning_rate": 8.607011070110702e-06, "loss": 1.1292, "step": 4590 }, { "epoch": 25.0, "learning_rate": 8.514760147601477e-06, "loss": 1.1391, "step": 4600 }, { "epoch": 25.0, "eval_loss": 1.6740144491195679, "eval_runtime": 221.3199, "eval_samples_per_second": 8.879, "eval_steps_per_second": 0.741, "eval_wer": 0.895785841907461, "step": 4600 }, { "epoch": 25.05, "learning_rate": 8.42250922509225e-06, "loss": 1.1605, "step": 4610 }, { "epoch": 25.11, "learning_rate": 8.330258302583026e-06, "loss": 1.1148, "step": 4620 }, { "epoch": 25.16, "learning_rate": 8.238007380073801e-06, "loss": 1.1238, "step": 4630 }, { "epoch": 25.22, "learning_rate": 8.145756457564576e-06, "loss": 1.1158, "step": 4640 }, { "epoch": 25.27, "learning_rate": 8.053505535055351e-06, "loss": 1.124, "step": 4650 }, { "epoch": 25.33, "learning_rate": 7.961254612546127e-06, "loss": 1.1281, "step": 4660 }, { "epoch": 25.38, "learning_rate": 7.869003690036902e-06, "loss": 1.1165, "step": 4670 }, { "epoch": 25.43, "learning_rate": 7.776752767527675e-06, "loss": 1.1177, "step": 4680 }, { "epoch": 25.49, "learning_rate": 7.68450184501845e-06, "loss": 1.1052, "step": 4690 }, { "epoch": 25.54, "learning_rate": 7.592250922509225e-06, "loss": 1.1166, "step": 4700 }, { "epoch": 25.6, "learning_rate": 7.5e-06, "loss": 1.1167, "step": 4710 }, { "epoch": 25.65, "learning_rate": 7.4077490774907746e-06, "loss": 1.1053, "step": 4720 }, { "epoch": 25.71, "learning_rate": 7.31549815498155e-06, "loss": 1.1083, "step": 4730 }, { "epoch": 25.76, "learning_rate": 7.223247232472324e-06, "loss": 1.1225, "step": 4740 }, { "epoch": 25.81, "learning_rate": 7.1309963099631e-06, "loss": 1.1139, "step": 4750 }, { "epoch": 25.87, "learning_rate": 7.0387453874538755e-06, "loss": 1.1129, "step": 4760 }, { "epoch": 25.92, "learning_rate": 6.94649446494465e-06, "loss": 1.1051, "step": 4770 }, { "epoch": 25.98, "learning_rate": 6.854243542435425e-06, "loss": 1.1142, "step": 4780 }, { "epoch": 26.0, "eval_loss": 1.7445429563522339, "eval_runtime": 220.9225, "eval_samples_per_second": 8.895, "eval_steps_per_second": 0.742, "eval_wer": 0.9014848130121372, "step": 4784 }, { "epoch": 26.03, "learning_rate": 6.7619926199261994e-06, "loss": 1.149, "step": 4790 }, { "epoch": 26.09, "learning_rate": 6.669741697416975e-06, "loss": 1.1072, "step": 4800 }, { "epoch": 26.14, "learning_rate": 6.577490774907749e-06, "loss": 1.0874, "step": 4810 }, { "epoch": 26.2, "learning_rate": 6.485239852398524e-06, "loss": 1.0894, "step": 4820 }, { "epoch": 26.25, "learning_rate": 6.392988929889299e-06, "loss": 1.0843, "step": 4830 }, { "epoch": 26.3, "learning_rate": 6.300738007380073e-06, "loss": 1.0838, "step": 4840 }, { "epoch": 26.36, "learning_rate": 6.208487084870849e-06, "loss": 1.0658, "step": 4850 }, { "epoch": 26.41, "learning_rate": 6.1162361623616234e-06, "loss": 1.0798, "step": 4860 }, { "epoch": 26.47, "learning_rate": 6.0239852398523995e-06, "loss": 1.0736, "step": 4870 }, { "epoch": 26.52, "learning_rate": 5.931734317343174e-06, "loss": 1.0738, "step": 4880 }, { "epoch": 26.58, "learning_rate": 5.839483394833948e-06, "loss": 1.0608, "step": 4890 }, { "epoch": 26.63, "learning_rate": 5.7472324723247235e-06, "loss": 1.0693, "step": 4900 }, { "epoch": 26.68, "learning_rate": 5.654981549815498e-06, "loss": 1.0694, "step": 4910 }, { "epoch": 26.74, "learning_rate": 5.562730627306274e-06, "loss": 1.0553, "step": 4920 }, { "epoch": 26.79, "learning_rate": 5.470479704797048e-06, "loss": 1.0729, "step": 4930 }, { "epoch": 26.85, "learning_rate": 5.3782287822878235e-06, "loss": 1.0571, "step": 4940 }, { "epoch": 26.9, "learning_rate": 5.285977859778598e-06, "loss": 1.0691, "step": 4950 }, { "epoch": 26.96, "learning_rate": 5.193726937269372e-06, "loss": 1.0598, "step": 4960 }, { "epoch": 27.0, "eval_loss": 1.8277820348739624, "eval_runtime": 223.9114, "eval_samples_per_second": 8.776, "eval_steps_per_second": 0.732, "eval_wer": 0.9001909925451297, "step": 4968 }, { "epoch": 27.01, "learning_rate": 5.101476014760148e-06, "loss": 1.0863, "step": 4970 }, { "epoch": 27.07, "learning_rate": 5.009225092250923e-06, "loss": 1.0481, "step": 4980 }, { "epoch": 27.12, "learning_rate": 4.916974169741698e-06, "loss": 1.044, "step": 4990 }, { "epoch": 27.17, "learning_rate": 4.824723247232472e-06, "loss": 1.045, "step": 5000 }, { "epoch": 27.23, "learning_rate": 4.7324723247232475e-06, "loss": 1.0494, "step": 5010 }, { "epoch": 27.28, "learning_rate": 4.640221402214023e-06, "loss": 1.0558, "step": 5020 }, { "epoch": 27.34, "learning_rate": 4.547970479704797e-06, "loss": 1.047, "step": 5030 }, { "epoch": 27.39, "learning_rate": 4.455719557195572e-06, "loss": 1.0394, "step": 5040 }, { "epoch": 27.45, "learning_rate": 4.363468634686347e-06, "loss": 1.0625, "step": 5050 }, { "epoch": 27.5, "learning_rate": 4.271217712177122e-06, "loss": 1.0548, "step": 5060 }, { "epoch": 27.55, "learning_rate": 4.178966789667897e-06, "loss": 1.0465, "step": 5070 }, { "epoch": 27.61, "learning_rate": 4.0867158671586716e-06, "loss": 1.0471, "step": 5080 }, { "epoch": 27.66, "learning_rate": 3.994464944649447e-06, "loss": 1.0476, "step": 5090 }, { "epoch": 27.72, "learning_rate": 3.902214022140221e-06, "loss": 1.0405, "step": 5100 }, { "epoch": 27.77, "learning_rate": 3.8099630996309964e-06, "loss": 1.0469, "step": 5110 }, { "epoch": 27.82, "learning_rate": 3.7177121771217716e-06, "loss": 1.0396, "step": 5120 }, { "epoch": 27.88, "learning_rate": 3.6254612546125464e-06, "loss": 1.0462, "step": 5130 }, { "epoch": 27.93, "learning_rate": 3.533210332103321e-06, "loss": 1.0509, "step": 5140 }, { "epoch": 27.99, "learning_rate": 3.440959409594096e-06, "loss": 1.0423, "step": 5150 }, { "epoch": 28.0, "eval_loss": 1.8642076253890991, "eval_runtime": 221.6309, "eval_samples_per_second": 8.866, "eval_steps_per_second": 0.74, "eval_wer": 0.9042264801922247, "step": 5152 }, { "epoch": 28.04, "learning_rate": 3.3487084870848708e-06, "loss": 1.0696, "step": 5160 }, { "epoch": 28.1, "learning_rate": 3.256457564575646e-06, "loss": 1.0501, "step": 5170 }, { "epoch": 28.15, "learning_rate": 3.164206642066421e-06, "loss": 1.028, "step": 5180 }, { "epoch": 28.21, "learning_rate": 3.0719557195571956e-06, "loss": 1.0278, "step": 5190 }, { "epoch": 28.26, "learning_rate": 2.9797047970479704e-06, "loss": 1.0378, "step": 5200 }, { "epoch": 28.31, "learning_rate": 2.8874538745387456e-06, "loss": 1.0414, "step": 5210 }, { "epoch": 28.37, "learning_rate": 2.7952029520295204e-06, "loss": 1.0338, "step": 5220 }, { "epoch": 28.42, "learning_rate": 2.7029520295202956e-06, "loss": 1.0344, "step": 5230 }, { "epoch": 28.48, "learning_rate": 2.6107011070110704e-06, "loss": 1.0256, "step": 5240 }, { "epoch": 28.53, "learning_rate": 2.518450184501845e-06, "loss": 1.0331, "step": 5250 }, { "epoch": 28.59, "learning_rate": 2.42619926199262e-06, "loss": 1.0487, "step": 5260 }, { "epoch": 28.64, "learning_rate": 2.333948339483395e-06, "loss": 1.0308, "step": 5270 }, { "epoch": 28.69, "learning_rate": 2.24169741697417e-06, "loss": 1.0311, "step": 5280 }, { "epoch": 28.75, "learning_rate": 2.149446494464945e-06, "loss": 1.0281, "step": 5290 }, { "epoch": 28.8, "learning_rate": 2.0571955719557197e-06, "loss": 1.0261, "step": 5300 }, { "epoch": 28.86, "learning_rate": 1.9649446494464945e-06, "loss": 1.0189, "step": 5310 }, { "epoch": 28.91, "learning_rate": 1.8726937269372695e-06, "loss": 1.0353, "step": 5320 }, { "epoch": 28.97, "learning_rate": 1.7804428044280445e-06, "loss": 1.025, "step": 5330 }, { "epoch": 29.0, "eval_loss": 1.9265143871307373, "eval_runtime": 222.0292, "eval_samples_per_second": 8.85, "eval_steps_per_second": 0.739, "eval_wer": 0.9078306943503173, "step": 5336 }, { "epoch": 29.02, "learning_rate": 1.6881918819188193e-06, "loss": 1.0553, "step": 5340 }, { "epoch": 29.08, "learning_rate": 1.595940959409594e-06, "loss": 1.0142, "step": 5350 }, { "epoch": 29.13, "learning_rate": 1.503690036900369e-06, "loss": 1.0292, "step": 5360 }, { "epoch": 29.18, "learning_rate": 1.4114391143911439e-06, "loss": 1.0249, "step": 5370 }, { "epoch": 29.24, "learning_rate": 1.319188191881919e-06, "loss": 1.0144, "step": 5380 }, { "epoch": 29.29, "learning_rate": 1.226937269372694e-06, "loss": 1.0317, "step": 5390 }, { "epoch": 29.35, "learning_rate": 1.1346863468634687e-06, "loss": 1.0328, "step": 5400 }, { "epoch": 29.4, "learning_rate": 1.0424354243542435e-06, "loss": 1.0258, "step": 5410 }, { "epoch": 29.46, "learning_rate": 9.501845018450185e-07, "loss": 1.0221, "step": 5420 }, { "epoch": 29.51, "learning_rate": 8.579335793357934e-07, "loss": 1.0177, "step": 5430 }, { "epoch": 29.56, "learning_rate": 7.656826568265683e-07, "loss": 1.0204, "step": 5440 }, { "epoch": 29.62, "learning_rate": 6.734317343173432e-07, "loss": 1.0232, "step": 5450 }, { "epoch": 29.67, "learning_rate": 5.811808118081181e-07, "loss": 1.0267, "step": 5460 }, { "epoch": 29.73, "learning_rate": 4.889298892988929e-07, "loss": 1.0177, "step": 5470 }, { "epoch": 29.78, "learning_rate": 3.9667896678966794e-07, "loss": 1.0383, "step": 5480 }, { "epoch": 29.84, "learning_rate": 3.044280442804428e-07, "loss": 1.0131, "step": 5490 }, { "epoch": 29.89, "learning_rate": 2.121771217712177e-07, "loss": 1.023, "step": 5500 }, { "epoch": 29.94, "learning_rate": 1.1992619926199263e-07, "loss": 1.0283, "step": 5510 }, { "epoch": 30.0, "learning_rate": 2.7675276752767527e-08, "loss": 1.02, "step": 5520 }, { "epoch": 30.0, "eval_loss": 1.9589478969573975, "eval_runtime": 221.7999, "eval_samples_per_second": 8.859, "eval_steps_per_second": 0.739, "eval_wer": 0.9055819111576613, "step": 5520 }, { "epoch": 30.0, "step": 5520, "total_flos": 1.607923222665725e+20, "train_loss": 1.3724038049794625, "train_runtime": 98560.7025, "train_samples_per_second": 5.383, "train_steps_per_second": 0.056 } ], "max_steps": 5520, "num_train_epochs": 30, "total_flos": 1.607923222665725e+20, "trial_name": null, "trial_params": null }