gary109's picture
End of training
664354f
raw
history blame
112 kB
{
"best_metric": 0.47944945096969604,
"best_model_checkpoint": "ai-light-dance_singing3_ft_wav2vec2-large-xlsr-53-v1-5gram/checkpoint-1512",
"epoch": 99.99653979238754,
"global_step": 7200,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.14,
"learning_rate": 5.000000000000001e-07,
"loss": 0.3086,
"step": 10
},
{
"epoch": 0.28,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.3275,
"step": 20
},
{
"epoch": 0.42,
"learning_rate": 1.5e-06,
"loss": 0.3051,
"step": 30
},
{
"epoch": 0.55,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.3072,
"step": 40
},
{
"epoch": 0.69,
"learning_rate": 2.5e-06,
"loss": 0.2957,
"step": 50
},
{
"epoch": 0.83,
"learning_rate": 3e-06,
"loss": 0.2856,
"step": 60
},
{
"epoch": 0.97,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.314,
"step": 70
},
{
"epoch": 1.0,
"eval_loss": 0.4815235435962677,
"eval_runtime": 130.4571,
"eval_samples_per_second": 4.078,
"eval_steps_per_second": 0.514,
"eval_wer": 0.20768785755608407,
"step": 72
},
{
"epoch": 1.11,
"learning_rate": 4.000000000000001e-06,
"loss": 0.2981,
"step": 80
},
{
"epoch": 1.25,
"learning_rate": 4.5e-06,
"loss": 0.2972,
"step": 90
},
{
"epoch": 1.39,
"learning_rate": 5e-06,
"loss": 0.2892,
"step": 100
},
{
"epoch": 1.53,
"learning_rate": 5.500000000000001e-06,
"loss": 0.3014,
"step": 110
},
{
"epoch": 1.66,
"learning_rate": 6e-06,
"loss": 0.3013,
"step": 120
},
{
"epoch": 1.8,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.315,
"step": 130
},
{
"epoch": 1.94,
"learning_rate": 7.000000000000001e-06,
"loss": 0.3064,
"step": 140
},
{
"epoch": 2.0,
"eval_loss": 0.5082846283912659,
"eval_runtime": 130.0863,
"eval_samples_per_second": 4.09,
"eval_steps_per_second": 0.515,
"eval_wer": 0.2101947676287202,
"step": 144
},
{
"epoch": 2.08,
"learning_rate": 7.5e-06,
"loss": 0.3067,
"step": 150
},
{
"epoch": 2.22,
"learning_rate": 7.95e-06,
"loss": 0.304,
"step": 160
},
{
"epoch": 2.36,
"learning_rate": 8.45e-06,
"loss": 0.3065,
"step": 170
},
{
"epoch": 2.5,
"learning_rate": 8.95e-06,
"loss": 0.3014,
"step": 180
},
{
"epoch": 2.64,
"learning_rate": 9.450000000000001e-06,
"loss": 0.2938,
"step": 190
},
{
"epoch": 2.78,
"learning_rate": 9.950000000000001e-06,
"loss": 0.3086,
"step": 200
},
{
"epoch": 2.91,
"learning_rate": 1.045e-05,
"loss": 0.2951,
"step": 210
},
{
"epoch": 3.0,
"eval_loss": 0.5146709680557251,
"eval_runtime": 129.1484,
"eval_samples_per_second": 4.119,
"eval_steps_per_second": 0.519,
"eval_wer": 0.2158513852285145,
"step": 216
},
{
"epoch": 3.06,
"learning_rate": 1.095e-05,
"loss": 0.3079,
"step": 220
},
{
"epoch": 3.19,
"learning_rate": 1.145e-05,
"loss": 0.2984,
"step": 230
},
{
"epoch": 3.33,
"learning_rate": 1.195e-05,
"loss": 0.3067,
"step": 240
},
{
"epoch": 3.47,
"learning_rate": 1.2450000000000001e-05,
"loss": 0.3033,
"step": 250
},
{
"epoch": 3.61,
"learning_rate": 1.2950000000000001e-05,
"loss": 0.2912,
"step": 260
},
{
"epoch": 3.75,
"learning_rate": 1.3450000000000002e-05,
"loss": 0.2915,
"step": 270
},
{
"epoch": 3.89,
"learning_rate": 1.3950000000000002e-05,
"loss": 0.2835,
"step": 280
},
{
"epoch": 4.0,
"eval_loss": 0.515735387802124,
"eval_runtime": 128.8527,
"eval_samples_per_second": 4.129,
"eval_steps_per_second": 0.52,
"eval_wer": 0.20910201195603265,
"step": 288
},
{
"epoch": 4.03,
"learning_rate": 1.4449999999999999e-05,
"loss": 0.3069,
"step": 290
},
{
"epoch": 4.17,
"learning_rate": 1.4950000000000001e-05,
"loss": 0.2931,
"step": 300
},
{
"epoch": 4.3,
"learning_rate": 1.545e-05,
"loss": 0.2916,
"step": 310
},
{
"epoch": 4.44,
"learning_rate": 1.595e-05,
"loss": 0.304,
"step": 320
},
{
"epoch": 4.58,
"learning_rate": 1.645e-05,
"loss": 0.301,
"step": 330
},
{
"epoch": 4.72,
"learning_rate": 1.6950000000000002e-05,
"loss": 0.3098,
"step": 340
},
{
"epoch": 4.86,
"learning_rate": 1.745e-05,
"loss": 0.2935,
"step": 350
},
{
"epoch": 5.0,
"learning_rate": 1.795e-05,
"loss": 0.3011,
"step": 360
},
{
"epoch": 5.0,
"eval_loss": 0.495644748210907,
"eval_runtime": 129.107,
"eval_samples_per_second": 4.121,
"eval_steps_per_second": 0.519,
"eval_wer": 0.215080028283088,
"step": 360
},
{
"epoch": 5.14,
"learning_rate": 1.845e-05,
"loss": 0.302,
"step": 370
},
{
"epoch": 5.28,
"learning_rate": 1.895e-05,
"loss": 0.3081,
"step": 380
},
{
"epoch": 5.42,
"learning_rate": 1.9450000000000002e-05,
"loss": 0.3041,
"step": 390
},
{
"epoch": 5.55,
"learning_rate": 1.995e-05,
"loss": 0.3061,
"step": 400
},
{
"epoch": 5.69,
"learning_rate": 2.045e-05,
"loss": 0.3081,
"step": 410
},
{
"epoch": 5.83,
"learning_rate": 2.09e-05,
"loss": 0.2989,
"step": 420
},
{
"epoch": 5.97,
"learning_rate": 2.1400000000000002e-05,
"loss": 0.3097,
"step": 430
},
{
"epoch": 6.0,
"eval_loss": 0.5190498232841492,
"eval_runtime": 129.2076,
"eval_samples_per_second": 4.117,
"eval_steps_per_second": 0.519,
"eval_wer": 0.21533714726489683,
"step": 432
},
{
"epoch": 6.11,
"learning_rate": 2.19e-05,
"loss": 0.3235,
"step": 440
},
{
"epoch": 6.25,
"learning_rate": 2.2400000000000002e-05,
"loss": 0.3015,
"step": 450
},
{
"epoch": 6.39,
"learning_rate": 2.29e-05,
"loss": 0.2979,
"step": 460
},
{
"epoch": 6.53,
"learning_rate": 2.3400000000000003e-05,
"loss": 0.3303,
"step": 470
},
{
"epoch": 6.66,
"learning_rate": 2.39e-05,
"loss": 0.318,
"step": 480
},
{
"epoch": 6.8,
"learning_rate": 2.44e-05,
"loss": 0.3111,
"step": 490
},
{
"epoch": 6.94,
"learning_rate": 2.4900000000000002e-05,
"loss": 0.2998,
"step": 500
},
{
"epoch": 7.0,
"eval_loss": 0.5349323153495789,
"eval_runtime": 129.2108,
"eval_samples_per_second": 4.117,
"eval_steps_per_second": 0.519,
"eval_wer": 0.22015812817381245,
"step": 504
},
{
"epoch": 7.08,
"learning_rate": 2.4970149253731346e-05,
"loss": 0.3216,
"step": 510
},
{
"epoch": 7.22,
"learning_rate": 2.493283582089552e-05,
"loss": 0.3147,
"step": 520
},
{
"epoch": 7.36,
"learning_rate": 2.4895522388059704e-05,
"loss": 0.3128,
"step": 530
},
{
"epoch": 7.5,
"learning_rate": 2.4858208955223883e-05,
"loss": 0.3079,
"step": 540
},
{
"epoch": 7.64,
"learning_rate": 2.482089552238806e-05,
"loss": 0.2967,
"step": 550
},
{
"epoch": 7.78,
"learning_rate": 2.478358208955224e-05,
"loss": 0.3098,
"step": 560
},
{
"epoch": 7.91,
"learning_rate": 2.474626865671642e-05,
"loss": 0.3086,
"step": 570
},
{
"epoch": 8.0,
"eval_loss": 0.5055466890335083,
"eval_runtime": 128.9787,
"eval_samples_per_second": 4.125,
"eval_steps_per_second": 0.519,
"eval_wer": 0.21450151057401812,
"step": 576
},
{
"epoch": 8.06,
"learning_rate": 2.4708955223880597e-05,
"loss": 0.3243,
"step": 580
},
{
"epoch": 8.19,
"learning_rate": 2.467164179104478e-05,
"loss": 0.3088,
"step": 590
},
{
"epoch": 8.33,
"learning_rate": 2.4634328358208955e-05,
"loss": 0.3071,
"step": 600
},
{
"epoch": 8.47,
"learning_rate": 2.4597014925373134e-05,
"loss": 0.3094,
"step": 610
},
{
"epoch": 8.61,
"learning_rate": 2.4559701492537317e-05,
"loss": 0.3049,
"step": 620
},
{
"epoch": 8.75,
"learning_rate": 2.4522388059701492e-05,
"loss": 0.3061,
"step": 630
},
{
"epoch": 8.89,
"learning_rate": 2.448507462686567e-05,
"loss": 0.2964,
"step": 640
},
{
"epoch": 9.0,
"eval_loss": 0.5091516971588135,
"eval_runtime": 129.4051,
"eval_samples_per_second": 4.111,
"eval_steps_per_second": 0.518,
"eval_wer": 0.2183582953011506,
"step": 648
},
{
"epoch": 9.03,
"learning_rate": 2.4447761194029854e-05,
"loss": 0.3212,
"step": 650
},
{
"epoch": 9.17,
"learning_rate": 2.441044776119403e-05,
"loss": 0.302,
"step": 660
},
{
"epoch": 9.3,
"learning_rate": 2.437313432835821e-05,
"loss": 0.3103,
"step": 670
},
{
"epoch": 9.44,
"learning_rate": 2.433582089552239e-05,
"loss": 0.3102,
"step": 680
},
{
"epoch": 9.58,
"learning_rate": 2.4298507462686567e-05,
"loss": 0.3045,
"step": 690
},
{
"epoch": 9.72,
"learning_rate": 2.4261194029850746e-05,
"loss": 0.3162,
"step": 700
},
{
"epoch": 9.86,
"learning_rate": 2.4223880597014926e-05,
"loss": 0.3186,
"step": 710
},
{
"epoch": 10.0,
"learning_rate": 2.4186567164179105e-05,
"loss": 0.3288,
"step": 720
},
{
"epoch": 10.0,
"eval_loss": 0.5076370239257812,
"eval_runtime": 129.7675,
"eval_samples_per_second": 4.1,
"eval_steps_per_second": 0.516,
"eval_wer": 0.2190653725011249,
"step": 720
},
{
"epoch": 10.14,
"learning_rate": 2.4149253731343284e-05,
"loss": 0.3037,
"step": 730
},
{
"epoch": 10.28,
"learning_rate": 2.4111940298507463e-05,
"loss": 0.3256,
"step": 740
},
{
"epoch": 10.42,
"learning_rate": 2.4074626865671642e-05,
"loss": 0.3209,
"step": 750
},
{
"epoch": 10.55,
"learning_rate": 2.403731343283582e-05,
"loss": 0.3259,
"step": 760
},
{
"epoch": 10.69,
"learning_rate": 2.4e-05,
"loss": 0.3081,
"step": 770
},
{
"epoch": 10.83,
"learning_rate": 2.396268656716418e-05,
"loss": 0.3153,
"step": 780
},
{
"epoch": 10.97,
"learning_rate": 2.392537313432836e-05,
"loss": 0.3019,
"step": 790
},
{
"epoch": 11.0,
"eval_loss": 0.5125810503959656,
"eval_runtime": 128.8657,
"eval_samples_per_second": 4.128,
"eval_steps_per_second": 0.52,
"eval_wer": 0.20916629170148487,
"step": 792
},
{
"epoch": 11.11,
"learning_rate": 2.3888059701492538e-05,
"loss": 0.3151,
"step": 800
},
{
"epoch": 11.25,
"learning_rate": 2.3850746268656717e-05,
"loss": 0.3154,
"step": 810
},
{
"epoch": 11.39,
"learning_rate": 2.3813432835820896e-05,
"loss": 0.2949,
"step": 820
},
{
"epoch": 11.53,
"learning_rate": 2.3776119402985076e-05,
"loss": 0.3214,
"step": 830
},
{
"epoch": 11.66,
"learning_rate": 2.3738805970149255e-05,
"loss": 0.2946,
"step": 840
},
{
"epoch": 11.8,
"learning_rate": 2.3701492537313434e-05,
"loss": 0.3154,
"step": 850
},
{
"epoch": 11.94,
"learning_rate": 2.3664179104477613e-05,
"loss": 0.3047,
"step": 860
},
{
"epoch": 12.0,
"eval_loss": 0.5249019861221313,
"eval_runtime": 129.2154,
"eval_samples_per_second": 4.117,
"eval_steps_per_second": 0.519,
"eval_wer": 0.2117374815195732,
"step": 864
},
{
"epoch": 12.08,
"learning_rate": 2.3626865671641792e-05,
"loss": 0.2959,
"step": 870
},
{
"epoch": 12.22,
"learning_rate": 2.358955223880597e-05,
"loss": 0.295,
"step": 880
},
{
"epoch": 12.36,
"learning_rate": 2.355223880597015e-05,
"loss": 0.3122,
"step": 890
},
{
"epoch": 12.5,
"learning_rate": 2.351492537313433e-05,
"loss": 0.3028,
"step": 900
},
{
"epoch": 12.64,
"learning_rate": 2.347761194029851e-05,
"loss": 0.2777,
"step": 910
},
{
"epoch": 12.78,
"learning_rate": 2.3440298507462688e-05,
"loss": 0.3025,
"step": 920
},
{
"epoch": 12.91,
"learning_rate": 2.3402985074626867e-05,
"loss": 0.2998,
"step": 930
},
{
"epoch": 13.0,
"eval_loss": 0.531330406665802,
"eval_runtime": 129.1703,
"eval_samples_per_second": 4.119,
"eval_steps_per_second": 0.519,
"eval_wer": 0.21405155235585266,
"step": 936
},
{
"epoch": 13.06,
"learning_rate": 2.3365671641791046e-05,
"loss": 0.3192,
"step": 940
},
{
"epoch": 13.19,
"learning_rate": 2.3328358208955225e-05,
"loss": 0.2997,
"step": 950
},
{
"epoch": 13.33,
"learning_rate": 2.32910447761194e-05,
"loss": 0.3163,
"step": 960
},
{
"epoch": 13.47,
"learning_rate": 2.3253731343283584e-05,
"loss": 0.3046,
"step": 970
},
{
"epoch": 13.61,
"learning_rate": 2.3216417910447763e-05,
"loss": 0.2924,
"step": 980
},
{
"epoch": 13.75,
"learning_rate": 2.317910447761194e-05,
"loss": 0.3161,
"step": 990
},
{
"epoch": 13.89,
"learning_rate": 2.314179104477612e-05,
"loss": 0.3043,
"step": 1000
},
{
"epoch": 14.0,
"eval_loss": 0.5343348979949951,
"eval_runtime": 129.5843,
"eval_samples_per_second": 4.105,
"eval_steps_per_second": 0.517,
"eval_wer": 0.21861541428295944,
"step": 1008
},
{
"epoch": 14.03,
"learning_rate": 2.31044776119403e-05,
"loss": 0.3099,
"step": 1010
},
{
"epoch": 14.17,
"learning_rate": 2.306716417910448e-05,
"loss": 0.2953,
"step": 1020
},
{
"epoch": 14.3,
"learning_rate": 2.302985074626866e-05,
"loss": 0.3134,
"step": 1030
},
{
"epoch": 14.44,
"learning_rate": 2.2992537313432838e-05,
"loss": 0.2917,
"step": 1040
},
{
"epoch": 14.58,
"learning_rate": 2.2955223880597017e-05,
"loss": 0.3108,
"step": 1050
},
{
"epoch": 14.72,
"learning_rate": 2.2917910447761196e-05,
"loss": 0.3085,
"step": 1060
},
{
"epoch": 14.86,
"learning_rate": 2.2880597014925372e-05,
"loss": 0.2921,
"step": 1070
},
{
"epoch": 15.0,
"learning_rate": 2.2843283582089555e-05,
"loss": 0.3147,
"step": 1080
},
{
"epoch": 15.0,
"eval_loss": 0.506893515586853,
"eval_runtime": 129.0401,
"eval_samples_per_second": 4.123,
"eval_steps_per_second": 0.519,
"eval_wer": 0.21713698013755867,
"step": 1080
},
{
"epoch": 15.14,
"learning_rate": 2.2805970149253734e-05,
"loss": 0.307,
"step": 1090
},
{
"epoch": 15.28,
"learning_rate": 2.276865671641791e-05,
"loss": 0.3152,
"step": 1100
},
{
"epoch": 15.42,
"learning_rate": 2.2731343283582092e-05,
"loss": 0.3002,
"step": 1110
},
{
"epoch": 15.55,
"learning_rate": 2.269402985074627e-05,
"loss": 0.2992,
"step": 1120
},
{
"epoch": 15.69,
"learning_rate": 2.2656716417910447e-05,
"loss": 0.2897,
"step": 1130
},
{
"epoch": 15.83,
"learning_rate": 2.261940298507463e-05,
"loss": 0.3069,
"step": 1140
},
{
"epoch": 15.97,
"learning_rate": 2.258208955223881e-05,
"loss": 0.3049,
"step": 1150
},
{
"epoch": 16.0,
"eval_loss": 0.5032855272293091,
"eval_runtime": 129.2941,
"eval_samples_per_second": 4.115,
"eval_steps_per_second": 0.518,
"eval_wer": 0.20736645882882304,
"step": 1152
},
{
"epoch": 16.11,
"learning_rate": 2.2544776119402984e-05,
"loss": 0.3014,
"step": 1160
},
{
"epoch": 16.25,
"learning_rate": 2.2507462686567167e-05,
"loss": 0.3078,
"step": 1170
},
{
"epoch": 16.39,
"learning_rate": 2.2470149253731346e-05,
"loss": 0.2942,
"step": 1180
},
{
"epoch": 16.53,
"learning_rate": 2.2432835820895522e-05,
"loss": 0.3168,
"step": 1190
},
{
"epoch": 16.66,
"learning_rate": 2.2395522388059704e-05,
"loss": 0.3124,
"step": 1200
},
{
"epoch": 16.8,
"learning_rate": 2.235820895522388e-05,
"loss": 0.2951,
"step": 1210
},
{
"epoch": 16.94,
"learning_rate": 2.232089552238806e-05,
"loss": 0.298,
"step": 1220
},
{
"epoch": 17.0,
"eval_loss": 0.5108718276023865,
"eval_runtime": 129.096,
"eval_samples_per_second": 4.121,
"eval_steps_per_second": 0.519,
"eval_wer": 0.20498810824709135,
"step": 1224
},
{
"epoch": 17.08,
"learning_rate": 2.2283582089552242e-05,
"loss": 0.3255,
"step": 1230
},
{
"epoch": 17.22,
"learning_rate": 2.2246268656716418e-05,
"loss": 0.2867,
"step": 1240
},
{
"epoch": 17.36,
"learning_rate": 2.2208955223880597e-05,
"loss": 0.2983,
"step": 1250
},
{
"epoch": 17.5,
"learning_rate": 2.217164179104478e-05,
"loss": 0.3105,
"step": 1260
},
{
"epoch": 17.64,
"learning_rate": 2.2134328358208955e-05,
"loss": 0.2818,
"step": 1270
},
{
"epoch": 17.78,
"learning_rate": 2.2097014925373134e-05,
"loss": 0.3107,
"step": 1280
},
{
"epoch": 17.91,
"learning_rate": 2.2059701492537317e-05,
"loss": 0.2948,
"step": 1290
},
{
"epoch": 18.0,
"eval_loss": 0.5252682566642761,
"eval_runtime": 129.1692,
"eval_samples_per_second": 4.119,
"eval_steps_per_second": 0.519,
"eval_wer": 0.20993764864691136,
"step": 1296
},
{
"epoch": 18.06,
"learning_rate": 2.2022388059701493e-05,
"loss": 0.316,
"step": 1300
},
{
"epoch": 18.19,
"learning_rate": 2.1985074626865672e-05,
"loss": 0.3066,
"step": 1310
},
{
"epoch": 18.33,
"learning_rate": 2.194776119402985e-05,
"loss": 0.3031,
"step": 1320
},
{
"epoch": 18.47,
"learning_rate": 2.191044776119403e-05,
"loss": 0.3037,
"step": 1330
},
{
"epoch": 18.61,
"learning_rate": 2.187313432835821e-05,
"loss": 0.2986,
"step": 1340
},
{
"epoch": 18.75,
"learning_rate": 2.183582089552239e-05,
"loss": 0.2955,
"step": 1350
},
{
"epoch": 18.89,
"learning_rate": 2.1798507462686568e-05,
"loss": 0.2986,
"step": 1360
},
{
"epoch": 19.0,
"eval_loss": 0.4976494014263153,
"eval_runtime": 129.378,
"eval_samples_per_second": 4.112,
"eval_steps_per_second": 0.518,
"eval_wer": 0.20209551970174197,
"step": 1368
},
{
"epoch": 19.03,
"learning_rate": 2.1761194029850747e-05,
"loss": 0.3021,
"step": 1370
},
{
"epoch": 19.17,
"learning_rate": 2.1723880597014926e-05,
"loss": 0.2887,
"step": 1380
},
{
"epoch": 19.3,
"learning_rate": 2.1686567164179105e-05,
"loss": 0.3059,
"step": 1390
},
{
"epoch": 19.44,
"learning_rate": 2.1649253731343284e-05,
"loss": 0.2945,
"step": 1400
},
{
"epoch": 19.58,
"learning_rate": 2.1611940298507463e-05,
"loss": 0.3006,
"step": 1410
},
{
"epoch": 19.72,
"learning_rate": 2.1574626865671643e-05,
"loss": 0.3033,
"step": 1420
},
{
"epoch": 19.86,
"learning_rate": 2.153731343283582e-05,
"loss": 0.3002,
"step": 1430
},
{
"epoch": 20.0,
"learning_rate": 2.15e-05,
"loss": 0.2958,
"step": 1440
},
{
"epoch": 20.0,
"eval_loss": 0.5233781933784485,
"eval_runtime": 129.422,
"eval_samples_per_second": 4.111,
"eval_steps_per_second": 0.518,
"eval_wer": 0.20935913093784148,
"step": 1440
},
{
"epoch": 20.14,
"learning_rate": 2.146268656716418e-05,
"loss": 0.2982,
"step": 1450
},
{
"epoch": 20.28,
"learning_rate": 2.142537313432836e-05,
"loss": 0.2861,
"step": 1460
},
{
"epoch": 20.42,
"learning_rate": 2.1388059701492538e-05,
"loss": 0.293,
"step": 1470
},
{
"epoch": 20.55,
"learning_rate": 2.1350746268656717e-05,
"loss": 0.304,
"step": 1480
},
{
"epoch": 20.69,
"learning_rate": 2.1313432835820897e-05,
"loss": 0.2926,
"step": 1490
},
{
"epoch": 20.83,
"learning_rate": 2.1276119402985076e-05,
"loss": 0.3092,
"step": 1500
},
{
"epoch": 20.97,
"learning_rate": 2.1238805970149255e-05,
"loss": 0.2931,
"step": 1510
},
{
"epoch": 21.0,
"eval_loss": 0.47944945096969604,
"eval_runtime": 130.2981,
"eval_samples_per_second": 4.083,
"eval_steps_per_second": 0.514,
"eval_wer": 0.20595230442887447,
"step": 1512
},
{
"epoch": 21.11,
"learning_rate": 2.1201492537313434e-05,
"loss": 0.2956,
"step": 1520
},
{
"epoch": 21.25,
"learning_rate": 2.1164179104477613e-05,
"loss": 0.3007,
"step": 1530
},
{
"epoch": 21.39,
"learning_rate": 2.1126865671641792e-05,
"loss": 0.3045,
"step": 1540
},
{
"epoch": 21.53,
"learning_rate": 2.108955223880597e-05,
"loss": 0.3002,
"step": 1550
},
{
"epoch": 21.66,
"learning_rate": 2.105223880597015e-05,
"loss": 0.2848,
"step": 1560
},
{
"epoch": 21.8,
"learning_rate": 2.1014925373134326e-05,
"loss": 0.286,
"step": 1570
},
{
"epoch": 21.94,
"learning_rate": 2.097761194029851e-05,
"loss": 0.305,
"step": 1580
},
{
"epoch": 22.0,
"eval_loss": 0.4916737377643585,
"eval_runtime": 129.0137,
"eval_samples_per_second": 4.124,
"eval_steps_per_second": 0.519,
"eval_wer": 0.20492382850163912,
"step": 1584
},
{
"epoch": 22.08,
"learning_rate": 2.0940298507462688e-05,
"loss": 0.3092,
"step": 1590
},
{
"epoch": 22.22,
"learning_rate": 2.0902985074626867e-05,
"loss": 0.2979,
"step": 1600
},
{
"epoch": 22.36,
"learning_rate": 2.0865671641791047e-05,
"loss": 0.2921,
"step": 1610
},
{
"epoch": 22.5,
"learning_rate": 2.0828358208955226e-05,
"loss": 0.3052,
"step": 1620
},
{
"epoch": 22.64,
"learning_rate": 2.0791044776119405e-05,
"loss": 0.2977,
"step": 1630
},
{
"epoch": 22.78,
"learning_rate": 2.0753731343283584e-05,
"loss": 0.2938,
"step": 1640
},
{
"epoch": 22.91,
"learning_rate": 2.0716417910447763e-05,
"loss": 0.2847,
"step": 1650
},
{
"epoch": 23.0,
"eval_loss": 0.5089883804321289,
"eval_runtime": 129.655,
"eval_samples_per_second": 4.103,
"eval_steps_per_second": 0.517,
"eval_wer": 0.21000192839236356,
"step": 1656
},
{
"epoch": 23.06,
"learning_rate": 2.0679104477611942e-05,
"loss": 0.2993,
"step": 1660
},
{
"epoch": 23.19,
"learning_rate": 2.064179104477612e-05,
"loss": 0.3081,
"step": 1670
},
{
"epoch": 23.33,
"learning_rate": 2.0604477611940297e-05,
"loss": 0.2998,
"step": 1680
},
{
"epoch": 23.47,
"learning_rate": 2.056716417910448e-05,
"loss": 0.3125,
"step": 1690
},
{
"epoch": 23.61,
"learning_rate": 2.052985074626866e-05,
"loss": 0.3135,
"step": 1700
},
{
"epoch": 23.75,
"learning_rate": 2.0492537313432835e-05,
"loss": 0.3039,
"step": 1710
},
{
"epoch": 23.89,
"learning_rate": 2.0455223880597017e-05,
"loss": 0.2869,
"step": 1720
},
{
"epoch": 24.0,
"eval_loss": 0.5296673774719238,
"eval_runtime": 132.3841,
"eval_samples_per_second": 4.019,
"eval_steps_per_second": 0.506,
"eval_wer": 0.2101947676287202,
"step": 1728
},
{
"epoch": 24.03,
"learning_rate": 2.0417910447761196e-05,
"loss": 0.2958,
"step": 1730
},
{
"epoch": 24.17,
"learning_rate": 2.0380597014925372e-05,
"loss": 0.2985,
"step": 1740
},
{
"epoch": 24.3,
"learning_rate": 2.0343283582089555e-05,
"loss": 0.2914,
"step": 1750
},
{
"epoch": 24.44,
"learning_rate": 2.0305970149253734e-05,
"loss": 0.2975,
"step": 1760
},
{
"epoch": 24.58,
"learning_rate": 2.026865671641791e-05,
"loss": 0.3037,
"step": 1770
},
{
"epoch": 24.72,
"learning_rate": 2.0231343283582092e-05,
"loss": 0.294,
"step": 1780
},
{
"epoch": 24.86,
"learning_rate": 2.0194029850746268e-05,
"loss": 0.3024,
"step": 1790
},
{
"epoch": 25.0,
"learning_rate": 2.0156716417910447e-05,
"loss": 0.2997,
"step": 1800
},
{
"epoch": 25.0,
"eval_loss": 0.5185533165931702,
"eval_runtime": 132.6367,
"eval_samples_per_second": 4.011,
"eval_steps_per_second": 0.505,
"eval_wer": 0.20878061322877162,
"step": 1800
},
{
"epoch": 25.14,
"learning_rate": 2.011940298507463e-05,
"loss": 0.3077,
"step": 1810
},
{
"epoch": 25.28,
"learning_rate": 2.0082089552238805e-05,
"loss": 0.2926,
"step": 1820
},
{
"epoch": 25.42,
"learning_rate": 2.0044776119402985e-05,
"loss": 0.2924,
"step": 1830
},
{
"epoch": 25.55,
"learning_rate": 2.0007462686567167e-05,
"loss": 0.2969,
"step": 1840
},
{
"epoch": 25.69,
"learning_rate": 1.9970149253731343e-05,
"loss": 0.299,
"step": 1850
},
{
"epoch": 25.83,
"learning_rate": 1.9932835820895522e-05,
"loss": 0.2963,
"step": 1860
},
{
"epoch": 25.97,
"learning_rate": 1.9895522388059705e-05,
"loss": 0.2996,
"step": 1870
},
{
"epoch": 26.0,
"eval_loss": 0.5218982100486755,
"eval_runtime": 131.3811,
"eval_samples_per_second": 4.049,
"eval_steps_per_second": 0.51,
"eval_wer": 0.20980908915600693,
"step": 1872
},
{
"epoch": 26.11,
"learning_rate": 1.985820895522388e-05,
"loss": 0.2972,
"step": 1880
},
{
"epoch": 26.25,
"learning_rate": 1.982089552238806e-05,
"loss": 0.2993,
"step": 1890
},
{
"epoch": 26.39,
"learning_rate": 1.9783582089552242e-05,
"loss": 0.2877,
"step": 1900
},
{
"epoch": 26.53,
"learning_rate": 1.9746268656716418e-05,
"loss": 0.2864,
"step": 1910
},
{
"epoch": 26.66,
"learning_rate": 1.9708955223880597e-05,
"loss": 0.2869,
"step": 1920
},
{
"epoch": 26.8,
"learning_rate": 1.9671641791044776e-05,
"loss": 0.3113,
"step": 1930
},
{
"epoch": 26.94,
"learning_rate": 1.9634328358208955e-05,
"loss": 0.298,
"step": 1940
},
{
"epoch": 27.0,
"eval_loss": 0.506175696849823,
"eval_runtime": 132.0981,
"eval_samples_per_second": 4.027,
"eval_steps_per_second": 0.507,
"eval_wer": 0.21077328533779005,
"step": 1944
},
{
"epoch": 27.08,
"learning_rate": 1.9597014925373135e-05,
"loss": 0.3057,
"step": 1950
},
{
"epoch": 27.22,
"learning_rate": 1.9559701492537314e-05,
"loss": 0.3026,
"step": 1960
},
{
"epoch": 27.36,
"learning_rate": 1.9522388059701493e-05,
"loss": 0.298,
"step": 1970
},
{
"epoch": 27.5,
"learning_rate": 1.9485074626865672e-05,
"loss": 0.3077,
"step": 1980
},
{
"epoch": 27.64,
"learning_rate": 1.944776119402985e-05,
"loss": 0.3073,
"step": 1990
},
{
"epoch": 27.78,
"learning_rate": 1.941044776119403e-05,
"loss": 0.3163,
"step": 2000
},
{
"epoch": 27.91,
"learning_rate": 1.9373134328358213e-05,
"loss": 0.3057,
"step": 2010
},
{
"epoch": 28.0,
"eval_loss": 0.5299437642097473,
"eval_runtime": 132.6119,
"eval_samples_per_second": 4.012,
"eval_steps_per_second": 0.505,
"eval_wer": 0.21366587388313943,
"step": 2016
},
{
"epoch": 28.06,
"learning_rate": 1.933582089552239e-05,
"loss": 0.3058,
"step": 2020
},
{
"epoch": 28.19,
"learning_rate": 1.9298507462686568e-05,
"loss": 0.2959,
"step": 2030
},
{
"epoch": 28.33,
"learning_rate": 1.9261194029850747e-05,
"loss": 0.3052,
"step": 2040
},
{
"epoch": 28.47,
"learning_rate": 1.9223880597014926e-05,
"loss": 0.2961,
"step": 2050
},
{
"epoch": 28.61,
"learning_rate": 1.9186567164179105e-05,
"loss": 0.3006,
"step": 2060
},
{
"epoch": 28.75,
"learning_rate": 1.9149253731343284e-05,
"loss": 0.3096,
"step": 2070
},
{
"epoch": 28.89,
"learning_rate": 1.9111940298507464e-05,
"loss": 0.2937,
"step": 2080
},
{
"epoch": 29.0,
"eval_loss": 0.5345147848129272,
"eval_runtime": 131.6737,
"eval_samples_per_second": 4.04,
"eval_steps_per_second": 0.509,
"eval_wer": 0.21540142701034903,
"step": 2088
},
{
"epoch": 29.03,
"learning_rate": 1.9074626865671643e-05,
"loss": 0.3,
"step": 2090
},
{
"epoch": 29.17,
"learning_rate": 1.9037313432835822e-05,
"loss": 0.2895,
"step": 2100
},
{
"epoch": 29.3,
"learning_rate": 1.9e-05,
"loss": 0.2907,
"step": 2110
},
{
"epoch": 29.44,
"learning_rate": 1.896268656716418e-05,
"loss": 0.2975,
"step": 2120
},
{
"epoch": 29.58,
"learning_rate": 1.892537313432836e-05,
"loss": 0.2945,
"step": 2130
},
{
"epoch": 29.72,
"learning_rate": 1.888805970149254e-05,
"loss": 0.3019,
"step": 2140
},
{
"epoch": 29.86,
"learning_rate": 1.8850746268656718e-05,
"loss": 0.2987,
"step": 2150
},
{
"epoch": 30.0,
"learning_rate": 1.8813432835820897e-05,
"loss": 0.3064,
"step": 2160
},
{
"epoch": 30.0,
"eval_loss": 0.5374366044998169,
"eval_runtime": 131.625,
"eval_samples_per_second": 4.042,
"eval_steps_per_second": 0.509,
"eval_wer": 0.21160892202866877,
"step": 2160
},
{
"epoch": 30.14,
"learning_rate": 1.8776119402985076e-05,
"loss": 0.2945,
"step": 2170
},
{
"epoch": 30.28,
"learning_rate": 1.8738805970149255e-05,
"loss": 0.2925,
"step": 2180
},
{
"epoch": 30.42,
"learning_rate": 1.8701492537313434e-05,
"loss": 0.2875,
"step": 2190
},
{
"epoch": 30.55,
"learning_rate": 1.8664179104477613e-05,
"loss": 0.2936,
"step": 2200
},
{
"epoch": 30.69,
"learning_rate": 1.8626865671641793e-05,
"loss": 0.2937,
"step": 2210
},
{
"epoch": 30.83,
"learning_rate": 1.8589552238805972e-05,
"loss": 0.2952,
"step": 2220
},
{
"epoch": 30.97,
"learning_rate": 1.855223880597015e-05,
"loss": 0.2915,
"step": 2230
},
{
"epoch": 31.0,
"eval_loss": 0.5184913873672485,
"eval_runtime": 131.6654,
"eval_samples_per_second": 4.041,
"eval_steps_per_second": 0.509,
"eval_wer": 0.20736645882882304,
"step": 2232
},
{
"epoch": 31.11,
"learning_rate": 1.851492537313433e-05,
"loss": 0.3009,
"step": 2240
},
{
"epoch": 31.25,
"learning_rate": 1.847761194029851e-05,
"loss": 0.3002,
"step": 2250
},
{
"epoch": 31.39,
"learning_rate": 1.844029850746269e-05,
"loss": 0.2676,
"step": 2260
},
{
"epoch": 31.53,
"learning_rate": 1.8402985074626868e-05,
"loss": 0.2795,
"step": 2270
},
{
"epoch": 31.66,
"learning_rate": 1.8365671641791047e-05,
"loss": 0.2855,
"step": 2280
},
{
"epoch": 31.8,
"learning_rate": 1.8328358208955223e-05,
"loss": 0.2967,
"step": 2290
},
{
"epoch": 31.94,
"learning_rate": 1.8291044776119405e-05,
"loss": 0.2942,
"step": 2300
},
{
"epoch": 32.0,
"eval_loss": 0.5221661925315857,
"eval_runtime": 131.7358,
"eval_samples_per_second": 4.038,
"eval_steps_per_second": 0.509,
"eval_wer": 0.20935913093784148,
"step": 2304
},
{
"epoch": 32.08,
"learning_rate": 1.8253731343283584e-05,
"loss": 0.3027,
"step": 2310
},
{
"epoch": 32.22,
"learning_rate": 1.821641791044776e-05,
"loss": 0.2919,
"step": 2320
},
{
"epoch": 32.36,
"learning_rate": 1.8179104477611943e-05,
"loss": 0.2963,
"step": 2330
},
{
"epoch": 32.5,
"learning_rate": 1.814179104477612e-05,
"loss": 0.2917,
"step": 2340
},
{
"epoch": 32.64,
"learning_rate": 1.8104477611940297e-05,
"loss": 0.2753,
"step": 2350
},
{
"epoch": 32.78,
"learning_rate": 1.806716417910448e-05,
"loss": 0.288,
"step": 2360
},
{
"epoch": 32.91,
"learning_rate": 1.802985074626866e-05,
"loss": 0.2777,
"step": 2370
},
{
"epoch": 33.0,
"eval_loss": 0.5229014158248901,
"eval_runtime": 131.9614,
"eval_samples_per_second": 4.031,
"eval_steps_per_second": 0.508,
"eval_wer": 0.21077328533779005,
"step": 2376
},
{
"epoch": 33.06,
"learning_rate": 1.7992537313432835e-05,
"loss": 0.3004,
"step": 2380
},
{
"epoch": 33.19,
"learning_rate": 1.7955223880597017e-05,
"loss": 0.2916,
"step": 2390
},
{
"epoch": 33.33,
"learning_rate": 1.7917910447761193e-05,
"loss": 0.2933,
"step": 2400
},
{
"epoch": 33.47,
"learning_rate": 1.7880597014925372e-05,
"loss": 0.296,
"step": 2410
},
{
"epoch": 33.61,
"learning_rate": 1.7843283582089555e-05,
"loss": 0.2959,
"step": 2420
},
{
"epoch": 33.75,
"learning_rate": 1.780597014925373e-05,
"loss": 0.2846,
"step": 2430
},
{
"epoch": 33.89,
"learning_rate": 1.776865671641791e-05,
"loss": 0.2821,
"step": 2440
},
{
"epoch": 34.0,
"eval_loss": 0.5242453813552856,
"eval_runtime": 132.7946,
"eval_samples_per_second": 4.006,
"eval_steps_per_second": 0.505,
"eval_wer": 0.2101947676287202,
"step": 2448
},
{
"epoch": 34.03,
"learning_rate": 1.7731343283582092e-05,
"loss": 0.2997,
"step": 2450
},
{
"epoch": 34.17,
"learning_rate": 1.7694029850746268e-05,
"loss": 0.2872,
"step": 2460
},
{
"epoch": 34.3,
"learning_rate": 1.7656716417910447e-05,
"loss": 0.2826,
"step": 2470
},
{
"epoch": 34.44,
"learning_rate": 1.761940298507463e-05,
"loss": 0.2965,
"step": 2480
},
{
"epoch": 34.58,
"learning_rate": 1.7582089552238806e-05,
"loss": 0.2812,
"step": 2490
},
{
"epoch": 34.72,
"learning_rate": 1.7548507462686566e-05,
"loss": 0.2893,
"step": 2500
},
{
"epoch": 34.86,
"learning_rate": 1.751119402985075e-05,
"loss": 0.2799,
"step": 2510
},
{
"epoch": 35.0,
"learning_rate": 1.7473880597014928e-05,
"loss": 0.2859,
"step": 2520
},
{
"epoch": 35.0,
"eval_loss": 0.5292270183563232,
"eval_runtime": 131.3549,
"eval_samples_per_second": 4.05,
"eval_steps_per_second": 0.51,
"eval_wer": 0.2096162499196503,
"step": 2520
},
{
"epoch": 35.14,
"learning_rate": 1.7436567164179103e-05,
"loss": 0.2936,
"step": 2530
},
{
"epoch": 35.28,
"learning_rate": 1.7399253731343286e-05,
"loss": 0.2941,
"step": 2540
},
{
"epoch": 35.42,
"learning_rate": 1.7361940298507465e-05,
"loss": 0.2887,
"step": 2550
},
{
"epoch": 35.55,
"learning_rate": 1.732462686567164e-05,
"loss": 0.296,
"step": 2560
},
{
"epoch": 35.69,
"learning_rate": 1.7287313432835823e-05,
"loss": 0.2905,
"step": 2570
},
{
"epoch": 35.83,
"learning_rate": 1.725e-05,
"loss": 0.2872,
"step": 2580
},
{
"epoch": 35.97,
"learning_rate": 1.721268656716418e-05,
"loss": 0.283,
"step": 2590
},
{
"epoch": 36.0,
"eval_loss": 0.5041770339012146,
"eval_runtime": 131.4728,
"eval_samples_per_second": 4.046,
"eval_steps_per_second": 0.51,
"eval_wer": 0.20665938162884875,
"step": 2592
},
{
"epoch": 36.11,
"learning_rate": 1.717537313432836e-05,
"loss": 0.2914,
"step": 2600
},
{
"epoch": 36.25,
"learning_rate": 1.7138059701492537e-05,
"loss": 0.2829,
"step": 2610
},
{
"epoch": 36.39,
"learning_rate": 1.7100746268656716e-05,
"loss": 0.2682,
"step": 2620
},
{
"epoch": 36.53,
"learning_rate": 1.70634328358209e-05,
"loss": 0.2989,
"step": 2630
},
{
"epoch": 36.66,
"learning_rate": 1.7026119402985074e-05,
"loss": 0.2873,
"step": 2640
},
{
"epoch": 36.8,
"learning_rate": 1.6992537313432834e-05,
"loss": 0.29,
"step": 2650
},
{
"epoch": 36.94,
"learning_rate": 1.6955223880597017e-05,
"loss": 0.2895,
"step": 2660
},
{
"epoch": 37.0,
"eval_loss": 0.5222975015640259,
"eval_runtime": 131.841,
"eval_samples_per_second": 4.035,
"eval_steps_per_second": 0.508,
"eval_wer": 0.2045381500289259,
"step": 2664
},
{
"epoch": 37.08,
"learning_rate": 1.6917910447761196e-05,
"loss": 0.2939,
"step": 2670
},
{
"epoch": 37.22,
"learning_rate": 1.6880597014925372e-05,
"loss": 0.295,
"step": 2680
},
{
"epoch": 37.36,
"learning_rate": 1.6843283582089554e-05,
"loss": 0.2793,
"step": 2690
},
{
"epoch": 37.5,
"learning_rate": 1.6805970149253734e-05,
"loss": 0.2842,
"step": 2700
},
{
"epoch": 37.64,
"learning_rate": 1.676865671641791e-05,
"loss": 0.2678,
"step": 2710
},
{
"epoch": 37.78,
"learning_rate": 1.6731343283582092e-05,
"loss": 0.2868,
"step": 2720
},
{
"epoch": 37.91,
"learning_rate": 1.669402985074627e-05,
"loss": 0.2822,
"step": 2730
},
{
"epoch": 38.0,
"eval_loss": 0.5093514919281006,
"eval_runtime": 132.4112,
"eval_samples_per_second": 4.018,
"eval_steps_per_second": 0.506,
"eval_wer": 0.2071093398470142,
"step": 2736
},
{
"epoch": 38.06,
"learning_rate": 1.6656716417910447e-05,
"loss": 0.2914,
"step": 2740
},
{
"epoch": 38.19,
"learning_rate": 1.661940298507463e-05,
"loss": 0.2828,
"step": 2750
},
{
"epoch": 38.33,
"learning_rate": 1.658208955223881e-05,
"loss": 0.2637,
"step": 2760
},
{
"epoch": 38.47,
"learning_rate": 1.6544776119402984e-05,
"loss": 0.288,
"step": 2770
},
{
"epoch": 38.61,
"learning_rate": 1.6507462686567167e-05,
"loss": 0.2814,
"step": 2780
},
{
"epoch": 38.75,
"learning_rate": 1.6470149253731343e-05,
"loss": 0.2902,
"step": 2790
},
{
"epoch": 38.89,
"learning_rate": 1.6432835820895522e-05,
"loss": 0.2672,
"step": 2800
},
{
"epoch": 39.0,
"eval_loss": 0.5250556468963623,
"eval_runtime": 131.822,
"eval_samples_per_second": 4.036,
"eval_steps_per_second": 0.508,
"eval_wer": 0.20415247155621263,
"step": 2808
},
{
"epoch": 39.03,
"learning_rate": 1.6395522388059704e-05,
"loss": 0.2954,
"step": 2810
},
{
"epoch": 39.17,
"learning_rate": 1.635820895522388e-05,
"loss": 0.2854,
"step": 2820
},
{
"epoch": 39.3,
"learning_rate": 1.632089552238806e-05,
"loss": 0.2874,
"step": 2830
},
{
"epoch": 39.44,
"learning_rate": 1.6283582089552242e-05,
"loss": 0.2671,
"step": 2840
},
{
"epoch": 39.58,
"learning_rate": 1.6246268656716418e-05,
"loss": 0.2761,
"step": 2850
},
{
"epoch": 39.72,
"learning_rate": 1.6208955223880597e-05,
"loss": 0.2904,
"step": 2860
},
{
"epoch": 39.86,
"learning_rate": 1.617164179104478e-05,
"loss": 0.2783,
"step": 2870
},
{
"epoch": 40.0,
"learning_rate": 1.6134328358208955e-05,
"loss": 0.2925,
"step": 2880
},
{
"epoch": 40.0,
"eval_loss": 0.5071823000907898,
"eval_runtime": 132.8431,
"eval_samples_per_second": 4.005,
"eval_steps_per_second": 0.504,
"eval_wer": 0.20511666773799575,
"step": 2880
},
{
"epoch": 40.14,
"learning_rate": 1.6097014925373134e-05,
"loss": 0.2936,
"step": 2890
},
{
"epoch": 40.28,
"learning_rate": 1.6059701492537313e-05,
"loss": 0.2848,
"step": 2900
},
{
"epoch": 40.42,
"learning_rate": 1.6022388059701492e-05,
"loss": 0.2866,
"step": 2910
},
{
"epoch": 40.55,
"learning_rate": 1.598507462686567e-05,
"loss": 0.289,
"step": 2920
},
{
"epoch": 40.69,
"learning_rate": 1.594776119402985e-05,
"loss": 0.2817,
"step": 2930
},
{
"epoch": 40.83,
"learning_rate": 1.591044776119403e-05,
"loss": 0.293,
"step": 2940
},
{
"epoch": 40.97,
"learning_rate": 1.587313432835821e-05,
"loss": 0.295,
"step": 2950
},
{
"epoch": 41.0,
"eval_loss": 0.4903075695037842,
"eval_runtime": 131.5707,
"eval_samples_per_second": 4.043,
"eval_steps_per_second": 0.509,
"eval_wer": 0.2071093398470142,
"step": 2952
},
{
"epoch": 41.11,
"learning_rate": 1.5835820895522388e-05,
"loss": 0.2957,
"step": 2960
},
{
"epoch": 41.25,
"learning_rate": 1.5798507462686567e-05,
"loss": 0.294,
"step": 2970
},
{
"epoch": 41.39,
"learning_rate": 1.5761194029850747e-05,
"loss": 0.2779,
"step": 2980
},
{
"epoch": 41.53,
"learning_rate": 1.5723880597014926e-05,
"loss": 0.2808,
"step": 2990
},
{
"epoch": 41.66,
"learning_rate": 1.5686567164179105e-05,
"loss": 0.2924,
"step": 3000
},
{
"epoch": 41.8,
"learning_rate": 1.5649253731343284e-05,
"loss": 0.2917,
"step": 3010
},
{
"epoch": 41.94,
"learning_rate": 1.5611940298507463e-05,
"loss": 0.2725,
"step": 3020
},
{
"epoch": 42.0,
"eval_loss": 0.49732398986816406,
"eval_runtime": 131.4816,
"eval_samples_per_second": 4.046,
"eval_steps_per_second": 0.51,
"eval_wer": 0.20485954875618692,
"step": 3024
},
{
"epoch": 42.08,
"learning_rate": 1.5574626865671642e-05,
"loss": 0.2972,
"step": 3030
},
{
"epoch": 42.22,
"learning_rate": 1.553731343283582e-05,
"loss": 0.2854,
"step": 3040
},
{
"epoch": 42.36,
"learning_rate": 1.55e-05,
"loss": 0.2874,
"step": 3050
},
{
"epoch": 42.5,
"learning_rate": 1.546268656716418e-05,
"loss": 0.2928,
"step": 3060
},
{
"epoch": 42.64,
"learning_rate": 1.542537313432836e-05,
"loss": 0.2773,
"step": 3070
},
{
"epoch": 42.78,
"learning_rate": 1.5388059701492538e-05,
"loss": 0.2954,
"step": 3080
},
{
"epoch": 42.91,
"learning_rate": 1.5350746268656717e-05,
"loss": 0.2758,
"step": 3090
},
{
"epoch": 43.0,
"eval_loss": 0.5097233057022095,
"eval_runtime": 131.4822,
"eval_samples_per_second": 4.046,
"eval_steps_per_second": 0.51,
"eval_wer": 0.2015812817381243,
"step": 3096
},
{
"epoch": 43.06,
"learning_rate": 1.5313432835820896e-05,
"loss": 0.2904,
"step": 3100
},
{
"epoch": 43.19,
"learning_rate": 1.5276119402985076e-05,
"loss": 0.2831,
"step": 3110
},
{
"epoch": 43.33,
"learning_rate": 1.5238805970149256e-05,
"loss": 0.2779,
"step": 3120
},
{
"epoch": 43.47,
"learning_rate": 1.5201492537313434e-05,
"loss": 0.2844,
"step": 3130
},
{
"epoch": 43.61,
"learning_rate": 1.5164179104477613e-05,
"loss": 0.2842,
"step": 3140
},
{
"epoch": 43.75,
"learning_rate": 1.512686567164179e-05,
"loss": 0.2856,
"step": 3150
},
{
"epoch": 43.89,
"learning_rate": 1.5089552238805971e-05,
"loss": 0.2809,
"step": 3160
},
{
"epoch": 44.0,
"eval_loss": 0.49982935190200806,
"eval_runtime": 131.8613,
"eval_samples_per_second": 4.035,
"eval_steps_per_second": 0.508,
"eval_wer": 0.20280259690171626,
"step": 3168
},
{
"epoch": 44.03,
"learning_rate": 1.505223880597015e-05,
"loss": 0.2936,
"step": 3170
},
{
"epoch": 44.17,
"learning_rate": 1.5014925373134328e-05,
"loss": 0.285,
"step": 3180
},
{
"epoch": 44.3,
"learning_rate": 1.4977611940298509e-05,
"loss": 0.2833,
"step": 3190
},
{
"epoch": 44.44,
"learning_rate": 1.4940298507462688e-05,
"loss": 0.282,
"step": 3200
},
{
"epoch": 44.58,
"learning_rate": 1.4902985074626866e-05,
"loss": 0.2816,
"step": 3210
},
{
"epoch": 44.72,
"learning_rate": 1.4865671641791046e-05,
"loss": 0.2711,
"step": 3220
},
{
"epoch": 44.86,
"learning_rate": 1.4828358208955226e-05,
"loss": 0.2702,
"step": 3230
},
{
"epoch": 45.0,
"learning_rate": 1.4791044776119403e-05,
"loss": 0.2804,
"step": 3240
},
{
"epoch": 45.0,
"eval_loss": 0.5103247761726379,
"eval_runtime": 131.3748,
"eval_samples_per_second": 4.049,
"eval_steps_per_second": 0.51,
"eval_wer": 0.20421675130166483,
"step": 3240
},
{
"epoch": 45.14,
"learning_rate": 1.4753731343283584e-05,
"loss": 0.2664,
"step": 3250
},
{
"epoch": 45.28,
"learning_rate": 1.4716417910447761e-05,
"loss": 0.2755,
"step": 3260
},
{
"epoch": 45.42,
"learning_rate": 1.467910447761194e-05,
"loss": 0.2725,
"step": 3270
},
{
"epoch": 45.55,
"learning_rate": 1.4641791044776121e-05,
"loss": 0.2878,
"step": 3280
},
{
"epoch": 45.69,
"learning_rate": 1.4604477611940299e-05,
"loss": 0.2847,
"step": 3290
},
{
"epoch": 45.83,
"learning_rate": 1.4567164179104478e-05,
"loss": 0.2826,
"step": 3300
},
{
"epoch": 45.97,
"learning_rate": 1.4529850746268659e-05,
"loss": 0.2842,
"step": 3310
},
{
"epoch": 46.0,
"eval_loss": 0.48608192801475525,
"eval_runtime": 131.8901,
"eval_samples_per_second": 4.034,
"eval_steps_per_second": 0.508,
"eval_wer": 0.2021597994471942,
"step": 3312
},
{
"epoch": 46.11,
"learning_rate": 1.4492537313432836e-05,
"loss": 0.2921,
"step": 3320
},
{
"epoch": 46.25,
"learning_rate": 1.4455223880597015e-05,
"loss": 0.2833,
"step": 3330
},
{
"epoch": 46.39,
"learning_rate": 1.4417910447761196e-05,
"loss": 0.2787,
"step": 3340
},
{
"epoch": 46.53,
"learning_rate": 1.4380597014925374e-05,
"loss": 0.2772,
"step": 3350
},
{
"epoch": 46.66,
"learning_rate": 1.4343283582089553e-05,
"loss": 0.2756,
"step": 3360
},
{
"epoch": 46.8,
"learning_rate": 1.430597014925373e-05,
"loss": 0.2745,
"step": 3370
},
{
"epoch": 46.94,
"learning_rate": 1.4268656716417911e-05,
"loss": 0.2721,
"step": 3380
},
{
"epoch": 47.0,
"eval_loss": 0.5053983926773071,
"eval_runtime": 131.5158,
"eval_samples_per_second": 4.045,
"eval_steps_per_second": 0.509,
"eval_wer": 0.20595230442887447,
"step": 3384
},
{
"epoch": 47.08,
"learning_rate": 1.423134328358209e-05,
"loss": 0.2809,
"step": 3390
},
{
"epoch": 47.22,
"learning_rate": 1.4194029850746268e-05,
"loss": 0.2767,
"step": 3400
},
{
"epoch": 47.36,
"learning_rate": 1.4156716417910449e-05,
"loss": 0.267,
"step": 3410
},
{
"epoch": 47.5,
"learning_rate": 1.4119402985074628e-05,
"loss": 0.2758,
"step": 3420
},
{
"epoch": 47.64,
"learning_rate": 1.4082089552238805e-05,
"loss": 0.2654,
"step": 3430
},
{
"epoch": 47.78,
"learning_rate": 1.4044776119402986e-05,
"loss": 0.2781,
"step": 3440
},
{
"epoch": 47.91,
"learning_rate": 1.4007462686567165e-05,
"loss": 0.2673,
"step": 3450
},
{
"epoch": 48.0,
"eval_loss": 0.5044223070144653,
"eval_runtime": 131.7824,
"eval_samples_per_second": 4.037,
"eval_steps_per_second": 0.508,
"eval_wer": 0.1999742881018191,
"step": 3456
},
{
"epoch": 48.06,
"learning_rate": 1.3970149253731343e-05,
"loss": 0.2927,
"step": 3460
},
{
"epoch": 48.19,
"learning_rate": 1.3932835820895524e-05,
"loss": 0.2854,
"step": 3470
},
{
"epoch": 48.33,
"learning_rate": 1.3895522388059703e-05,
"loss": 0.284,
"step": 3480
},
{
"epoch": 48.47,
"learning_rate": 1.385820895522388e-05,
"loss": 0.2675,
"step": 3490
},
{
"epoch": 48.61,
"learning_rate": 1.3820895522388061e-05,
"loss": 0.2719,
"step": 3500
},
{
"epoch": 48.75,
"learning_rate": 1.3783582089552239e-05,
"loss": 0.2748,
"step": 3510
},
{
"epoch": 48.89,
"learning_rate": 1.3746268656716418e-05,
"loss": 0.2696,
"step": 3520
},
{
"epoch": 49.0,
"eval_loss": 0.5187488794326782,
"eval_runtime": 131.1067,
"eval_samples_per_second": 4.058,
"eval_steps_per_second": 0.511,
"eval_wer": 0.1983030147200617,
"step": 3528
},
{
"epoch": 49.03,
"learning_rate": 1.3708955223880599e-05,
"loss": 0.2806,
"step": 3530
},
{
"epoch": 49.17,
"learning_rate": 1.3671641791044776e-05,
"loss": 0.2766,
"step": 3540
},
{
"epoch": 49.3,
"learning_rate": 1.3634328358208955e-05,
"loss": 0.2821,
"step": 3550
},
{
"epoch": 49.44,
"learning_rate": 1.3597014925373136e-05,
"loss": 0.2673,
"step": 3560
},
{
"epoch": 49.58,
"learning_rate": 1.3559701492537314e-05,
"loss": 0.2794,
"step": 3570
},
{
"epoch": 49.72,
"learning_rate": 1.3522388059701493e-05,
"loss": 0.2745,
"step": 3580
},
{
"epoch": 49.86,
"learning_rate": 1.3485074626865674e-05,
"loss": 0.2664,
"step": 3590
},
{
"epoch": 50.0,
"learning_rate": 1.3447761194029851e-05,
"loss": 0.2724,
"step": 3600
},
{
"epoch": 50.0,
"eval_loss": 0.5234389901161194,
"eval_runtime": 131.879,
"eval_samples_per_second": 4.034,
"eval_steps_per_second": 0.508,
"eval_wer": 0.20350967410169055,
"step": 3600
},
{
"epoch": 50.14,
"learning_rate": 1.3410447761194032e-05,
"loss": 0.2814,
"step": 3610
},
{
"epoch": 50.28,
"learning_rate": 1.3373134328358208e-05,
"loss": 0.267,
"step": 3620
},
{
"epoch": 50.42,
"learning_rate": 1.3335820895522388e-05,
"loss": 0.2681,
"step": 3630
},
{
"epoch": 50.55,
"learning_rate": 1.329850746268657e-05,
"loss": 0.2812,
"step": 3640
},
{
"epoch": 50.69,
"learning_rate": 1.3261194029850745e-05,
"loss": 0.2709,
"step": 3650
},
{
"epoch": 50.83,
"learning_rate": 1.3223880597014926e-05,
"loss": 0.2719,
"step": 3660
},
{
"epoch": 50.97,
"learning_rate": 1.3186567164179107e-05,
"loss": 0.2736,
"step": 3670
},
{
"epoch": 51.0,
"eval_loss": 0.5106495022773743,
"eval_runtime": 131.9308,
"eval_samples_per_second": 4.032,
"eval_steps_per_second": 0.508,
"eval_wer": 0.2016455614835765,
"step": 3672
},
{
"epoch": 51.11,
"learning_rate": 1.3149253731343284e-05,
"loss": 0.2766,
"step": 3680
},
{
"epoch": 51.25,
"learning_rate": 1.3111940298507463e-05,
"loss": 0.2771,
"step": 3690
},
{
"epoch": 51.39,
"learning_rate": 1.3074626865671644e-05,
"loss": 0.2754,
"step": 3700
},
{
"epoch": 51.53,
"learning_rate": 1.3037313432835822e-05,
"loss": 0.2849,
"step": 3710
},
{
"epoch": 51.66,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.2669,
"step": 3720
},
{
"epoch": 51.8,
"learning_rate": 1.2962686567164178e-05,
"loss": 0.2623,
"step": 3730
},
{
"epoch": 51.94,
"learning_rate": 1.292537313432836e-05,
"loss": 0.2662,
"step": 3740
},
{
"epoch": 52.0,
"eval_loss": 0.5071024298667908,
"eval_runtime": 131.882,
"eval_samples_per_second": 4.034,
"eval_steps_per_second": 0.508,
"eval_wer": 0.20537378671980458,
"step": 3744
},
{
"epoch": 52.08,
"learning_rate": 1.2888059701492538e-05,
"loss": 0.2814,
"step": 3750
},
{
"epoch": 52.22,
"learning_rate": 1.2850746268656716e-05,
"loss": 0.2733,
"step": 3760
},
{
"epoch": 52.36,
"learning_rate": 1.2813432835820897e-05,
"loss": 0.2679,
"step": 3770
},
{
"epoch": 52.5,
"learning_rate": 1.2776119402985076e-05,
"loss": 0.2717,
"step": 3780
},
{
"epoch": 52.64,
"learning_rate": 1.2738805970149253e-05,
"loss": 0.2563,
"step": 3790
},
{
"epoch": 52.78,
"learning_rate": 1.2701492537313434e-05,
"loss": 0.2791,
"step": 3800
},
{
"epoch": 52.91,
"learning_rate": 1.2664179104477613e-05,
"loss": 0.2701,
"step": 3810
},
{
"epoch": 53.0,
"eval_loss": 0.5253528356552124,
"eval_runtime": 131.2156,
"eval_samples_per_second": 4.054,
"eval_steps_per_second": 0.511,
"eval_wer": 0.2016455614835765,
"step": 3816
},
{
"epoch": 53.06,
"learning_rate": 1.262686567164179e-05,
"loss": 0.2935,
"step": 3820
},
{
"epoch": 53.19,
"learning_rate": 1.2589552238805972e-05,
"loss": 0.2654,
"step": 3830
},
{
"epoch": 53.33,
"learning_rate": 1.255223880597015e-05,
"loss": 0.2768,
"step": 3840
},
{
"epoch": 53.47,
"learning_rate": 1.2514925373134328e-05,
"loss": 0.2779,
"step": 3850
},
{
"epoch": 53.61,
"learning_rate": 1.2477611940298509e-05,
"loss": 0.2743,
"step": 3860
},
{
"epoch": 53.75,
"learning_rate": 1.2440298507462687e-05,
"loss": 0.2719,
"step": 3870
},
{
"epoch": 53.89,
"learning_rate": 1.2402985074626866e-05,
"loss": 0.261,
"step": 3880
},
{
"epoch": 54.0,
"eval_loss": 0.4967404007911682,
"eval_runtime": 131.9132,
"eval_samples_per_second": 4.033,
"eval_steps_per_second": 0.508,
"eval_wer": 0.19939577039274925,
"step": 3888
},
{
"epoch": 54.03,
"learning_rate": 1.2365671641791045e-05,
"loss": 0.2909,
"step": 3890
},
{
"epoch": 54.17,
"learning_rate": 1.2328358208955226e-05,
"loss": 0.2642,
"step": 3900
},
{
"epoch": 54.3,
"learning_rate": 1.2291044776119403e-05,
"loss": 0.2746,
"step": 3910
},
{
"epoch": 54.44,
"learning_rate": 1.2253731343283582e-05,
"loss": 0.2655,
"step": 3920
},
{
"epoch": 54.58,
"learning_rate": 1.2216417910447763e-05,
"loss": 0.2722,
"step": 3930
},
{
"epoch": 54.72,
"learning_rate": 1.217910447761194e-05,
"loss": 0.2721,
"step": 3940
},
{
"epoch": 54.86,
"learning_rate": 1.214179104477612e-05,
"loss": 0.2728,
"step": 3950
},
{
"epoch": 55.0,
"learning_rate": 1.2104477611940299e-05,
"loss": 0.2708,
"step": 3960
},
{
"epoch": 55.0,
"eval_loss": 0.5263388156890869,
"eval_runtime": 131.5494,
"eval_samples_per_second": 4.044,
"eval_steps_per_second": 0.509,
"eval_wer": 0.19688886032011313,
"step": 3960
},
{
"epoch": 55.14,
"learning_rate": 1.2067164179104478e-05,
"loss": 0.2684,
"step": 3970
},
{
"epoch": 55.28,
"learning_rate": 1.2029850746268657e-05,
"loss": 0.2699,
"step": 3980
},
{
"epoch": 55.42,
"learning_rate": 1.1992537313432836e-05,
"loss": 0.2796,
"step": 3990
},
{
"epoch": 55.55,
"learning_rate": 1.1955223880597016e-05,
"loss": 0.2666,
"step": 4000
},
{
"epoch": 55.69,
"learning_rate": 1.1917910447761195e-05,
"loss": 0.2702,
"step": 4010
},
{
"epoch": 55.83,
"learning_rate": 1.1880597014925374e-05,
"loss": 0.2711,
"step": 4020
},
{
"epoch": 55.97,
"learning_rate": 1.1843283582089553e-05,
"loss": 0.2764,
"step": 4030
},
{
"epoch": 56.0,
"eval_loss": 0.5201473236083984,
"eval_runtime": 131.8696,
"eval_samples_per_second": 4.034,
"eval_steps_per_second": 0.508,
"eval_wer": 0.19676030082920873,
"step": 4032
},
{
"epoch": 56.11,
"learning_rate": 1.1805970149253732e-05,
"loss": 0.272,
"step": 4040
},
{
"epoch": 56.25,
"learning_rate": 1.1768656716417911e-05,
"loss": 0.2624,
"step": 4050
},
{
"epoch": 56.39,
"learning_rate": 1.173134328358209e-05,
"loss": 0.2566,
"step": 4060
},
{
"epoch": 56.53,
"learning_rate": 1.1694029850746268e-05,
"loss": 0.2789,
"step": 4070
},
{
"epoch": 56.66,
"learning_rate": 1.1656716417910449e-05,
"loss": 0.267,
"step": 4080
},
{
"epoch": 56.8,
"learning_rate": 1.1619402985074628e-05,
"loss": 0.2711,
"step": 4090
},
{
"epoch": 56.94,
"learning_rate": 1.1582089552238806e-05,
"loss": 0.268,
"step": 4100
},
{
"epoch": 57.0,
"eval_loss": 0.5023506879806519,
"eval_runtime": 131.2011,
"eval_samples_per_second": 4.055,
"eval_steps_per_second": 0.511,
"eval_wer": 0.19785305650189625,
"step": 4104
},
{
"epoch": 57.08,
"learning_rate": 1.1544776119402986e-05,
"loss": 0.2639,
"step": 4110
},
{
"epoch": 57.22,
"learning_rate": 1.1507462686567166e-05,
"loss": 0.2725,
"step": 4120
},
{
"epoch": 57.36,
"learning_rate": 1.1470149253731343e-05,
"loss": 0.271,
"step": 4130
},
{
"epoch": 57.5,
"learning_rate": 1.1432835820895522e-05,
"loss": 0.2778,
"step": 4140
},
{
"epoch": 57.64,
"learning_rate": 1.1395522388059703e-05,
"loss": 0.2673,
"step": 4150
},
{
"epoch": 57.78,
"learning_rate": 1.135820895522388e-05,
"loss": 0.2665,
"step": 4160
},
{
"epoch": 57.91,
"learning_rate": 1.132089552238806e-05,
"loss": 0.2536,
"step": 4170
},
{
"epoch": 58.0,
"eval_loss": 0.5224213600158691,
"eval_runtime": 131.5544,
"eval_samples_per_second": 4.044,
"eval_steps_per_second": 0.509,
"eval_wer": 0.19701741981101756,
"step": 4176
},
{
"epoch": 58.06,
"learning_rate": 1.1283582089552239e-05,
"loss": 0.2727,
"step": 4180
},
{
"epoch": 58.19,
"learning_rate": 1.124626865671642e-05,
"loss": 0.2596,
"step": 4190
},
{
"epoch": 58.33,
"learning_rate": 1.1208955223880597e-05,
"loss": 0.2671,
"step": 4200
},
{
"epoch": 58.47,
"learning_rate": 1.1171641791044776e-05,
"loss": 0.2667,
"step": 4210
},
{
"epoch": 58.61,
"learning_rate": 1.1134328358208957e-05,
"loss": 0.2648,
"step": 4220
},
{
"epoch": 58.75,
"learning_rate": 1.1097014925373135e-05,
"loss": 0.2828,
"step": 4230
},
{
"epoch": 58.89,
"learning_rate": 1.1059701492537314e-05,
"loss": 0.2625,
"step": 4240
},
{
"epoch": 59.0,
"eval_loss": 0.5316326022148132,
"eval_runtime": 131.6958,
"eval_samples_per_second": 4.04,
"eval_steps_per_second": 0.509,
"eval_wer": 0.1999742881018191,
"step": 4248
},
{
"epoch": 59.03,
"learning_rate": 1.1022388059701493e-05,
"loss": 0.2725,
"step": 4250
},
{
"epoch": 59.17,
"learning_rate": 1.0985074626865672e-05,
"loss": 0.2541,
"step": 4260
},
{
"epoch": 59.3,
"learning_rate": 1.0947761194029851e-05,
"loss": 0.2703,
"step": 4270
},
{
"epoch": 59.44,
"learning_rate": 1.091044776119403e-05,
"loss": 0.2725,
"step": 4280
},
{
"epoch": 59.58,
"learning_rate": 1.087313432835821e-05,
"loss": 0.273,
"step": 4290
},
{
"epoch": 59.72,
"learning_rate": 1.0835820895522389e-05,
"loss": 0.2793,
"step": 4300
},
{
"epoch": 59.86,
"learning_rate": 1.0798507462686568e-05,
"loss": 0.257,
"step": 4310
},
{
"epoch": 60.0,
"learning_rate": 1.0761194029850747e-05,
"loss": 0.2621,
"step": 4320
},
{
"epoch": 60.0,
"eval_loss": 0.5173215270042419,
"eval_runtime": 131.579,
"eval_samples_per_second": 4.043,
"eval_steps_per_second": 0.509,
"eval_wer": 0.19965288937455808,
"step": 4320
},
{
"epoch": 60.14,
"learning_rate": 1.0723880597014926e-05,
"loss": 0.272,
"step": 4330
},
{
"epoch": 60.28,
"learning_rate": 1.0686567164179105e-05,
"loss": 0.2669,
"step": 4340
},
{
"epoch": 60.42,
"learning_rate": 1.0649253731343284e-05,
"loss": 0.2703,
"step": 4350
},
{
"epoch": 60.55,
"learning_rate": 1.0611940298507462e-05,
"loss": 0.2633,
"step": 4360
},
{
"epoch": 60.69,
"learning_rate": 1.0574626865671643e-05,
"loss": 0.2657,
"step": 4370
},
{
"epoch": 60.83,
"learning_rate": 1.0537313432835822e-05,
"loss": 0.2654,
"step": 4380
},
{
"epoch": 60.97,
"learning_rate": 1.05e-05,
"loss": 0.2673,
"step": 4390
},
{
"epoch": 61.0,
"eval_loss": 0.5116785764694214,
"eval_runtime": 131.1081,
"eval_samples_per_second": 4.058,
"eval_steps_per_second": 0.511,
"eval_wer": 0.20280259690171626,
"step": 4392
},
{
"epoch": 61.11,
"learning_rate": 1.046268656716418e-05,
"loss": 0.2678,
"step": 4400
},
{
"epoch": 61.25,
"learning_rate": 1.042537313432836e-05,
"loss": 0.2706,
"step": 4410
},
{
"epoch": 61.39,
"learning_rate": 1.0388059701492537e-05,
"loss": 0.2641,
"step": 4420
},
{
"epoch": 61.53,
"learning_rate": 1.0350746268656716e-05,
"loss": 0.2596,
"step": 4430
},
{
"epoch": 61.66,
"learning_rate": 1.0313432835820897e-05,
"loss": 0.2562,
"step": 4440
},
{
"epoch": 61.8,
"learning_rate": 1.0276119402985074e-05,
"loss": 0.2802,
"step": 4450
},
{
"epoch": 61.94,
"learning_rate": 1.0238805970149254e-05,
"loss": 0.2723,
"step": 4460
},
{
"epoch": 62.0,
"eval_loss": 0.5285342335700989,
"eval_runtime": 131.8603,
"eval_samples_per_second": 4.035,
"eval_steps_per_second": 0.508,
"eval_wer": 0.1999742881018191,
"step": 4464
},
{
"epoch": 62.08,
"learning_rate": 1.0201492537313434e-05,
"loss": 0.2846,
"step": 4470
},
{
"epoch": 62.22,
"learning_rate": 1.0164179104477614e-05,
"loss": 0.2758,
"step": 4480
},
{
"epoch": 62.36,
"learning_rate": 1.0126865671641791e-05,
"loss": 0.277,
"step": 4490
},
{
"epoch": 62.5,
"learning_rate": 1.008955223880597e-05,
"loss": 0.2761,
"step": 4500
},
{
"epoch": 62.64,
"learning_rate": 1.0052238805970151e-05,
"loss": 0.2684,
"step": 4510
},
{
"epoch": 62.78,
"learning_rate": 1.0014925373134328e-05,
"loss": 0.2817,
"step": 4520
},
{
"epoch": 62.91,
"learning_rate": 9.977611940298508e-06,
"loss": 0.2691,
"step": 4530
},
{
"epoch": 63.0,
"eval_loss": 0.5328835248947144,
"eval_runtime": 131.3705,
"eval_samples_per_second": 4.05,
"eval_steps_per_second": 0.51,
"eval_wer": 0.19611750337468664,
"step": 4536
},
{
"epoch": 63.06,
"learning_rate": 9.940298507462687e-06,
"loss": 0.2824,
"step": 4540
},
{
"epoch": 63.19,
"learning_rate": 9.902985074626866e-06,
"loss": 0.2772,
"step": 4550
},
{
"epoch": 63.33,
"learning_rate": 9.865671641791045e-06,
"loss": 0.2708,
"step": 4560
},
{
"epoch": 63.47,
"learning_rate": 9.828358208955224e-06,
"loss": 0.2679,
"step": 4570
},
{
"epoch": 63.61,
"learning_rate": 9.791044776119403e-06,
"loss": 0.268,
"step": 4580
},
{
"epoch": 63.75,
"learning_rate": 9.753731343283583e-06,
"loss": 0.2705,
"step": 4590
},
{
"epoch": 63.89,
"learning_rate": 9.716417910447762e-06,
"loss": 0.2668,
"step": 4600
},
{
"epoch": 64.0,
"eval_loss": 0.5160889625549316,
"eval_runtime": 131.2903,
"eval_samples_per_second": 4.052,
"eval_steps_per_second": 0.51,
"eval_wer": 0.19643890210194767,
"step": 4608
},
{
"epoch": 64.03,
"learning_rate": 9.679104477611941e-06,
"loss": 0.2774,
"step": 4610
},
{
"epoch": 64.17,
"learning_rate": 9.64179104477612e-06,
"loss": 0.2688,
"step": 4620
},
{
"epoch": 64.3,
"learning_rate": 9.6044776119403e-06,
"loss": 0.2773,
"step": 4630
},
{
"epoch": 64.44,
"learning_rate": 9.567164179104478e-06,
"loss": 0.2633,
"step": 4640
},
{
"epoch": 64.58,
"learning_rate": 9.529850746268656e-06,
"loss": 0.2735,
"step": 4650
},
{
"epoch": 64.72,
"learning_rate": 9.492537313432837e-06,
"loss": 0.2683,
"step": 4660
},
{
"epoch": 64.86,
"learning_rate": 9.455223880597016e-06,
"loss": 0.2719,
"step": 4670
},
{
"epoch": 65.0,
"learning_rate": 9.417910447761193e-06,
"loss": 0.27,
"step": 4680
},
{
"epoch": 65.0,
"eval_loss": 0.5026705861091614,
"eval_runtime": 131.4228,
"eval_samples_per_second": 4.048,
"eval_steps_per_second": 0.51,
"eval_wer": 0.19695314006556533,
"step": 4680
},
{
"epoch": 65.14,
"learning_rate": 9.380597014925374e-06,
"loss": 0.2786,
"step": 4690
},
{
"epoch": 65.28,
"learning_rate": 9.343283582089553e-06,
"loss": 0.2731,
"step": 4700
},
{
"epoch": 65.42,
"learning_rate": 9.30597014925373e-06,
"loss": 0.2707,
"step": 4710
},
{
"epoch": 65.55,
"learning_rate": 9.26865671641791e-06,
"loss": 0.2638,
"step": 4720
},
{
"epoch": 65.69,
"learning_rate": 9.23134328358209e-06,
"loss": 0.2605,
"step": 4730
},
{
"epoch": 65.83,
"learning_rate": 9.194029850746268e-06,
"loss": 0.2736,
"step": 4740
},
{
"epoch": 65.97,
"learning_rate": 9.156716417910447e-06,
"loss": 0.257,
"step": 4750
},
{
"epoch": 66.0,
"eval_loss": 0.5016449689865112,
"eval_runtime": 132.0547,
"eval_samples_per_second": 4.029,
"eval_steps_per_second": 0.507,
"eval_wer": 0.19965288937455808,
"step": 4752
},
{
"epoch": 66.11,
"learning_rate": 9.119402985074628e-06,
"loss": 0.277,
"step": 4760
},
{
"epoch": 66.25,
"learning_rate": 9.082089552238807e-06,
"loss": 0.2734,
"step": 4770
},
{
"epoch": 66.39,
"learning_rate": 9.044776119402985e-06,
"loss": 0.2679,
"step": 4780
},
{
"epoch": 66.53,
"learning_rate": 9.007462686567164e-06,
"loss": 0.2755,
"step": 4790
},
{
"epoch": 66.66,
"learning_rate": 8.970149253731345e-06,
"loss": 0.2686,
"step": 4800
},
{
"epoch": 66.8,
"learning_rate": 8.932835820895522e-06,
"loss": 0.2651,
"step": 4810
},
{
"epoch": 66.94,
"learning_rate": 8.895522388059702e-06,
"loss": 0.2711,
"step": 4820
},
{
"epoch": 67.0,
"eval_loss": 0.5059924721717834,
"eval_runtime": 131.6036,
"eval_samples_per_second": 4.042,
"eval_steps_per_second": 0.509,
"eval_wer": 0.19714597930192196,
"step": 4824
},
{
"epoch": 67.08,
"learning_rate": 8.85820895522388e-06,
"loss": 0.2678,
"step": 4830
},
{
"epoch": 67.22,
"learning_rate": 8.82089552238806e-06,
"loss": 0.2676,
"step": 4840
},
{
"epoch": 67.36,
"learning_rate": 8.783582089552239e-06,
"loss": 0.2569,
"step": 4850
},
{
"epoch": 67.5,
"learning_rate": 8.746268656716418e-06,
"loss": 0.2681,
"step": 4860
},
{
"epoch": 67.64,
"learning_rate": 8.708955223880597e-06,
"loss": 0.2664,
"step": 4870
},
{
"epoch": 67.78,
"learning_rate": 8.671641791044776e-06,
"loss": 0.2725,
"step": 4880
},
{
"epoch": 67.91,
"learning_rate": 8.634328358208956e-06,
"loss": 0.269,
"step": 4890
},
{
"epoch": 68.0,
"eval_loss": 0.5219683051109314,
"eval_runtime": 131.9262,
"eval_samples_per_second": 4.033,
"eval_steps_per_second": 0.508,
"eval_wer": 0.1983030147200617,
"step": 4896
},
{
"epoch": 68.06,
"learning_rate": 8.597014925373135e-06,
"loss": 0.2747,
"step": 4900
},
{
"epoch": 68.19,
"learning_rate": 8.559701492537314e-06,
"loss": 0.2724,
"step": 4910
},
{
"epoch": 68.33,
"learning_rate": 8.522388059701493e-06,
"loss": 0.2773,
"step": 4920
},
{
"epoch": 68.47,
"learning_rate": 8.485074626865672e-06,
"loss": 0.282,
"step": 4930
},
{
"epoch": 68.61,
"learning_rate": 8.447761194029851e-06,
"loss": 0.2674,
"step": 4940
},
{
"epoch": 68.75,
"learning_rate": 8.41044776119403e-06,
"loss": 0.2611,
"step": 4950
},
{
"epoch": 68.89,
"learning_rate": 8.37313432835821e-06,
"loss": 0.2659,
"step": 4960
},
{
"epoch": 69.0,
"eval_loss": 0.498529314994812,
"eval_runtime": 132.3204,
"eval_samples_per_second": 4.021,
"eval_steps_per_second": 0.506,
"eval_wer": 0.19856013370187053,
"step": 4968
},
{
"epoch": 69.03,
"learning_rate": 8.335820895522387e-06,
"loss": 0.2752,
"step": 4970
},
{
"epoch": 69.17,
"learning_rate": 8.298507462686568e-06,
"loss": 0.2671,
"step": 4980
},
{
"epoch": 69.3,
"learning_rate": 8.261194029850747e-06,
"loss": 0.2704,
"step": 4990
},
{
"epoch": 69.44,
"learning_rate": 8.223880597014925e-06,
"loss": 0.265,
"step": 5000
},
{
"epoch": 69.58,
"learning_rate": 8.186567164179104e-06,
"loss": 0.2757,
"step": 5010
},
{
"epoch": 69.72,
"learning_rate": 8.149253731343285e-06,
"loss": 0.2688,
"step": 5020
},
{
"epoch": 69.86,
"learning_rate": 8.111940298507462e-06,
"loss": 0.2666,
"step": 5030
},
{
"epoch": 70.0,
"learning_rate": 8.074626865671641e-06,
"loss": 0.2669,
"step": 5040
},
{
"epoch": 70.0,
"eval_loss": 0.514457643032074,
"eval_runtime": 131.6706,
"eval_samples_per_second": 4.04,
"eval_steps_per_second": 0.509,
"eval_wer": 0.1958603843928778,
"step": 5040
},
{
"epoch": 70.14,
"learning_rate": 8.037313432835822e-06,
"loss": 0.2716,
"step": 5050
},
{
"epoch": 70.28,
"learning_rate": 8.000000000000001e-06,
"loss": 0.2729,
"step": 5060
},
{
"epoch": 70.42,
"learning_rate": 7.962686567164179e-06,
"loss": 0.259,
"step": 5070
},
{
"epoch": 70.55,
"learning_rate": 7.925373134328358e-06,
"loss": 0.2651,
"step": 5080
},
{
"epoch": 70.69,
"learning_rate": 7.888059701492539e-06,
"loss": 0.2657,
"step": 5090
},
{
"epoch": 70.83,
"learning_rate": 7.850746268656716e-06,
"loss": 0.2735,
"step": 5100
},
{
"epoch": 70.97,
"learning_rate": 7.813432835820895e-06,
"loss": 0.2685,
"step": 5110
},
{
"epoch": 71.0,
"eval_loss": 0.5079246163368225,
"eval_runtime": 131.456,
"eval_samples_per_second": 4.047,
"eval_steps_per_second": 0.51,
"eval_wer": 0.19560326541106898,
"step": 5112
},
{
"epoch": 71.11,
"learning_rate": 7.776119402985076e-06,
"loss": 0.2732,
"step": 5120
},
{
"epoch": 71.25,
"learning_rate": 7.738805970149254e-06,
"loss": 0.2568,
"step": 5130
},
{
"epoch": 71.39,
"learning_rate": 7.701492537313433e-06,
"loss": 0.2552,
"step": 5140
},
{
"epoch": 71.53,
"learning_rate": 7.664179104477612e-06,
"loss": 0.2634,
"step": 5150
},
{
"epoch": 71.66,
"learning_rate": 7.626865671641792e-06,
"loss": 0.2663,
"step": 5160
},
{
"epoch": 71.8,
"learning_rate": 7.58955223880597e-06,
"loss": 0.2679,
"step": 5170
},
{
"epoch": 71.94,
"learning_rate": 7.5522388059701495e-06,
"loss": 0.2669,
"step": 5180
},
{
"epoch": 72.0,
"eval_loss": 0.49233612418174744,
"eval_runtime": 131.3756,
"eval_samples_per_second": 4.049,
"eval_steps_per_second": 0.51,
"eval_wer": 0.19361059330205052,
"step": 5184
},
{
"epoch": 72.08,
"learning_rate": 7.514925373134328e-06,
"loss": 0.2722,
"step": 5190
},
{
"epoch": 72.22,
"learning_rate": 7.477611940298508e-06,
"loss": 0.2698,
"step": 5200
},
{
"epoch": 72.36,
"learning_rate": 7.440298507462687e-06,
"loss": 0.2527,
"step": 5210
},
{
"epoch": 72.5,
"learning_rate": 7.402985074626865e-06,
"loss": 0.2658,
"step": 5220
},
{
"epoch": 72.64,
"learning_rate": 7.365671641791045e-06,
"loss": 0.2623,
"step": 5230
},
{
"epoch": 72.78,
"learning_rate": 7.3283582089552245e-06,
"loss": 0.2574,
"step": 5240
},
{
"epoch": 72.91,
"learning_rate": 7.291044776119403e-06,
"loss": 0.2586,
"step": 5250
},
{
"epoch": 73.0,
"eval_loss": 0.4957040250301361,
"eval_runtime": 131.9056,
"eval_samples_per_second": 4.033,
"eval_steps_per_second": 0.508,
"eval_wer": 0.19528186668380793,
"step": 5256
},
{
"epoch": 73.06,
"learning_rate": 7.253731343283582e-06,
"loss": 0.2703,
"step": 5260
},
{
"epoch": 73.19,
"learning_rate": 7.216417910447762e-06,
"loss": 0.2618,
"step": 5270
},
{
"epoch": 73.33,
"learning_rate": 7.17910447761194e-06,
"loss": 0.2643,
"step": 5280
},
{
"epoch": 73.47,
"learning_rate": 7.1417910447761194e-06,
"loss": 0.2735,
"step": 5290
},
{
"epoch": 73.61,
"learning_rate": 7.1044776119402994e-06,
"loss": 0.2562,
"step": 5300
},
{
"epoch": 73.75,
"learning_rate": 7.067164179104479e-06,
"loss": 0.2597,
"step": 5310
},
{
"epoch": 73.89,
"learning_rate": 7.029850746268657e-06,
"loss": 0.2486,
"step": 5320
},
{
"epoch": 74.0,
"eval_loss": 0.4974006712436676,
"eval_runtime": 132.0022,
"eval_samples_per_second": 4.03,
"eval_steps_per_second": 0.508,
"eval_wer": 0.19316063508388506,
"step": 5328
},
{
"epoch": 74.03,
"learning_rate": 6.992537313432835e-06,
"loss": 0.2732,
"step": 5330
},
{
"epoch": 74.17,
"learning_rate": 6.955223880597016e-06,
"loss": 0.2455,
"step": 5340
},
{
"epoch": 74.3,
"learning_rate": 6.917910447761194e-06,
"loss": 0.2517,
"step": 5350
},
{
"epoch": 74.44,
"learning_rate": 6.8805970149253735e-06,
"loss": 0.2618,
"step": 5360
},
{
"epoch": 74.58,
"learning_rate": 6.843283582089552e-06,
"loss": 0.2667,
"step": 5370
},
{
"epoch": 74.72,
"learning_rate": 6.805970149253732e-06,
"loss": 0.2635,
"step": 5380
},
{
"epoch": 74.86,
"learning_rate": 6.768656716417911e-06,
"loss": 0.2667,
"step": 5390
},
{
"epoch": 75.0,
"learning_rate": 6.731343283582089e-06,
"loss": 0.2611,
"step": 5400
},
{
"epoch": 75.0,
"eval_loss": 0.5044746398925781,
"eval_runtime": 131.9706,
"eval_samples_per_second": 4.031,
"eval_steps_per_second": 0.508,
"eval_wer": 0.1948961882110947,
"step": 5400
},
{
"epoch": 75.14,
"learning_rate": 6.694029850746269e-06,
"loss": 0.2813,
"step": 5410
},
{
"epoch": 75.28,
"learning_rate": 6.6567164179104485e-06,
"loss": 0.2708,
"step": 5420
},
{
"epoch": 75.42,
"learning_rate": 6.619402985074627e-06,
"loss": 0.2558,
"step": 5430
},
{
"epoch": 75.55,
"learning_rate": 6.582089552238806e-06,
"loss": 0.2593,
"step": 5440
},
{
"epoch": 75.69,
"learning_rate": 6.544776119402986e-06,
"loss": 0.2532,
"step": 5450
},
{
"epoch": 75.83,
"learning_rate": 6.507462686567164e-06,
"loss": 0.2601,
"step": 5460
},
{
"epoch": 75.97,
"learning_rate": 6.4701492537313434e-06,
"loss": 0.264,
"step": 5470
},
{
"epoch": 76.0,
"eval_loss": 0.5025977492332458,
"eval_runtime": 132.0676,
"eval_samples_per_second": 4.028,
"eval_steps_per_second": 0.507,
"eval_wer": 0.1965674615928521,
"step": 5472
},
{
"epoch": 76.11,
"learning_rate": 6.4328358208955234e-06,
"loss": 0.256,
"step": 5480
},
{
"epoch": 76.25,
"learning_rate": 6.395522388059702e-06,
"loss": 0.2661,
"step": 5490
},
{
"epoch": 76.39,
"learning_rate": 6.358208955223881e-06,
"loss": 0.2603,
"step": 5500
},
{
"epoch": 76.53,
"learning_rate": 6.320895522388059e-06,
"loss": 0.2574,
"step": 5510
},
{
"epoch": 76.66,
"learning_rate": 6.283582089552239e-06,
"loss": 0.2572,
"step": 5520
},
{
"epoch": 76.8,
"learning_rate": 6.246268656716418e-06,
"loss": 0.2587,
"step": 5530
},
{
"epoch": 76.94,
"learning_rate": 6.208955223880597e-06,
"loss": 0.2653,
"step": 5540
},
{
"epoch": 77.0,
"eval_loss": 0.5044174790382385,
"eval_runtime": 133.5324,
"eval_samples_per_second": 3.984,
"eval_steps_per_second": 0.502,
"eval_wer": 0.19361059330205052,
"step": 5544
},
{
"epoch": 77.08,
"learning_rate": 6.171641791044777e-06,
"loss": 0.2586,
"step": 5550
},
{
"epoch": 77.22,
"learning_rate": 6.134328358208956e-06,
"loss": 0.2628,
"step": 5560
},
{
"epoch": 77.36,
"learning_rate": 6.097014925373134e-06,
"loss": 0.2637,
"step": 5570
},
{
"epoch": 77.5,
"learning_rate": 6.059701492537314e-06,
"loss": 0.2594,
"step": 5580
},
{
"epoch": 77.64,
"learning_rate": 6.0223880597014925e-06,
"loss": 0.2567,
"step": 5590
},
{
"epoch": 77.78,
"learning_rate": 5.9850746268656725e-06,
"loss": 0.2684,
"step": 5600
},
{
"epoch": 77.91,
"learning_rate": 5.947761194029851e-06,
"loss": 0.2579,
"step": 5610
},
{
"epoch": 78.0,
"eval_loss": 0.4963833689689636,
"eval_runtime": 131.9034,
"eval_samples_per_second": 4.033,
"eval_steps_per_second": 0.508,
"eval_wer": 0.1966960210837565,
"step": 5616
},
{
"epoch": 78.06,
"learning_rate": 5.91044776119403e-06,
"loss": 0.2654,
"step": 5620
},
{
"epoch": 78.19,
"learning_rate": 5.873134328358209e-06,
"loss": 0.2565,
"step": 5630
},
{
"epoch": 78.33,
"learning_rate": 5.835820895522388e-06,
"loss": 0.2647,
"step": 5640
},
{
"epoch": 78.47,
"learning_rate": 5.7985074626865674e-06,
"loss": 0.2561,
"step": 5650
},
{
"epoch": 78.61,
"learning_rate": 5.761194029850747e-06,
"loss": 0.2495,
"step": 5660
},
{
"epoch": 78.75,
"learning_rate": 5.723880597014926e-06,
"loss": 0.2562,
"step": 5670
},
{
"epoch": 78.89,
"learning_rate": 5.686567164179105e-06,
"loss": 0.26,
"step": 5680
},
{
"epoch": 79.0,
"eval_loss": 0.4918227195739746,
"eval_runtime": 132.2622,
"eval_samples_per_second": 4.022,
"eval_steps_per_second": 0.507,
"eval_wer": 0.19373915279295495,
"step": 5688
},
{
"epoch": 79.03,
"learning_rate": 5.649253731343284e-06,
"loss": 0.269,
"step": 5690
},
{
"epoch": 79.17,
"learning_rate": 5.611940298507462e-06,
"loss": 0.2585,
"step": 5700
},
{
"epoch": 79.3,
"learning_rate": 5.574626865671642e-06,
"loss": 0.2609,
"step": 5710
},
{
"epoch": 79.44,
"learning_rate": 5.537313432835821e-06,
"loss": 0.256,
"step": 5720
},
{
"epoch": 79.58,
"learning_rate": 5.500000000000001e-06,
"loss": 0.2615,
"step": 5730
},
{
"epoch": 79.72,
"learning_rate": 5.46268656716418e-06,
"loss": 0.2626,
"step": 5740
},
{
"epoch": 79.86,
"learning_rate": 5.425373134328358e-06,
"loss": 0.2545,
"step": 5750
},
{
"epoch": 80.0,
"learning_rate": 5.388059701492538e-06,
"loss": 0.2634,
"step": 5760
},
{
"epoch": 80.0,
"eval_loss": 0.4841861128807068,
"eval_runtime": 131.8698,
"eval_samples_per_second": 4.034,
"eval_steps_per_second": 0.508,
"eval_wer": 0.19277495661117183,
"step": 5760
},
{
"epoch": 80.14,
"learning_rate": 5.3507462686567165e-06,
"loss": 0.2575,
"step": 5770
},
{
"epoch": 80.28,
"learning_rate": 5.313432835820896e-06,
"loss": 0.2567,
"step": 5780
},
{
"epoch": 80.42,
"learning_rate": 5.276119402985075e-06,
"loss": 0.2599,
"step": 5790
},
{
"epoch": 80.55,
"learning_rate": 5.238805970149254e-06,
"loss": 0.246,
"step": 5800
},
{
"epoch": 80.69,
"learning_rate": 5.201492537313433e-06,
"loss": 0.2546,
"step": 5810
},
{
"epoch": 80.83,
"learning_rate": 5.164179104477612e-06,
"loss": 0.2675,
"step": 5820
},
{
"epoch": 80.97,
"learning_rate": 5.1268656716417914e-06,
"loss": 0.2598,
"step": 5830
},
{
"epoch": 81.0,
"eval_loss": 0.5017235279083252,
"eval_runtime": 132.1658,
"eval_samples_per_second": 4.025,
"eval_steps_per_second": 0.507,
"eval_wer": 0.19463906922928584,
"step": 5832
},
{
"epoch": 81.11,
"learning_rate": 5.089552238805971e-06,
"loss": 0.2551,
"step": 5840
},
{
"epoch": 81.25,
"learning_rate": 5.05223880597015e-06,
"loss": 0.2648,
"step": 5850
},
{
"epoch": 81.39,
"learning_rate": 5.014925373134328e-06,
"loss": 0.2447,
"step": 5860
},
{
"epoch": 81.53,
"learning_rate": 4.977611940298508e-06,
"loss": 0.2561,
"step": 5870
},
{
"epoch": 81.66,
"learning_rate": 4.940298507462686e-06,
"loss": 0.261,
"step": 5880
},
{
"epoch": 81.8,
"learning_rate": 4.902985074626866e-06,
"loss": 0.2653,
"step": 5890
},
{
"epoch": 81.94,
"learning_rate": 4.865671641791045e-06,
"loss": 0.2571,
"step": 5900
},
{
"epoch": 82.0,
"eval_loss": 0.4997570514678955,
"eval_runtime": 131.7552,
"eval_samples_per_second": 4.038,
"eval_steps_per_second": 0.509,
"eval_wer": 0.1983672944655139,
"step": 5904
},
{
"epoch": 82.08,
"learning_rate": 4.828358208955224e-06,
"loss": 0.2628,
"step": 5910
},
{
"epoch": 82.22,
"learning_rate": 4.791044776119404e-06,
"loss": 0.2625,
"step": 5920
},
{
"epoch": 82.36,
"learning_rate": 4.753731343283582e-06,
"loss": 0.2396,
"step": 5930
},
{
"epoch": 82.5,
"learning_rate": 4.716417910447761e-06,
"loss": 0.2698,
"step": 5940
},
{
"epoch": 82.64,
"learning_rate": 4.6791044776119405e-06,
"loss": 0.2571,
"step": 5950
},
{
"epoch": 82.78,
"learning_rate": 4.64179104477612e-06,
"loss": 0.2592,
"step": 5960
},
{
"epoch": 82.91,
"learning_rate": 4.604477611940299e-06,
"loss": 0.2564,
"step": 5970
},
{
"epoch": 83.0,
"eval_loss": 0.4961981475353241,
"eval_runtime": 132.3751,
"eval_samples_per_second": 4.019,
"eval_steps_per_second": 0.506,
"eval_wer": 0.19393199202931155,
"step": 5976
},
{
"epoch": 83.06,
"learning_rate": 4.567164179104478e-06,
"loss": 0.2661,
"step": 5980
},
{
"epoch": 83.19,
"learning_rate": 4.529850746268656e-06,
"loss": 0.2602,
"step": 5990
},
{
"epoch": 83.33,
"learning_rate": 4.492537313432836e-06,
"loss": 0.2515,
"step": 6000
},
{
"epoch": 83.47,
"learning_rate": 4.4552238805970154e-06,
"loss": 0.2607,
"step": 6010
},
{
"epoch": 83.61,
"learning_rate": 4.417910447761195e-06,
"loss": 0.2457,
"step": 6020
},
{
"epoch": 83.75,
"learning_rate": 4.380597014925374e-06,
"loss": 0.2613,
"step": 6030
},
{
"epoch": 83.89,
"learning_rate": 4.343283582089552e-06,
"loss": 0.2606,
"step": 6040
},
{
"epoch": 84.0,
"eval_loss": 0.49531611800193787,
"eval_runtime": 131.4182,
"eval_samples_per_second": 4.048,
"eval_steps_per_second": 0.51,
"eval_wer": 0.19155364144757986,
"step": 6048
},
{
"epoch": 84.03,
"learning_rate": 4.305970149253732e-06,
"loss": 0.2655,
"step": 6050
},
{
"epoch": 84.17,
"learning_rate": 4.26865671641791e-06,
"loss": 0.2488,
"step": 6060
},
{
"epoch": 84.3,
"learning_rate": 4.2313432835820895e-06,
"loss": 0.258,
"step": 6070
},
{
"epoch": 84.44,
"learning_rate": 4.194029850746269e-06,
"loss": 0.2644,
"step": 6080
},
{
"epoch": 84.58,
"learning_rate": 4.156716417910448e-06,
"loss": 0.2573,
"step": 6090
},
{
"epoch": 84.72,
"learning_rate": 4.119402985074627e-06,
"loss": 0.243,
"step": 6100
},
{
"epoch": 84.86,
"learning_rate": 4.082089552238806e-06,
"loss": 0.2581,
"step": 6110
},
{
"epoch": 85.0,
"learning_rate": 4.044776119402985e-06,
"loss": 0.2587,
"step": 6120
},
{
"epoch": 85.0,
"eval_loss": 0.4982677400112152,
"eval_runtime": 132.0294,
"eval_samples_per_second": 4.029,
"eval_steps_per_second": 0.507,
"eval_wer": 0.19463906922928584,
"step": 6120
},
{
"epoch": 85.14,
"learning_rate": 4.0074626865671645e-06,
"loss": 0.2455,
"step": 6130
},
{
"epoch": 85.28,
"learning_rate": 3.970149253731344e-06,
"loss": 0.2532,
"step": 6140
},
{
"epoch": 85.42,
"learning_rate": 3.932835820895522e-06,
"loss": 0.2608,
"step": 6150
},
{
"epoch": 85.55,
"learning_rate": 3.895522388059702e-06,
"loss": 0.2604,
"step": 6160
},
{
"epoch": 85.69,
"learning_rate": 3.85820895522388e-06,
"loss": 0.2489,
"step": 6170
},
{
"epoch": 85.83,
"learning_rate": 3.82089552238806e-06,
"loss": 0.2594,
"step": 6180
},
{
"epoch": 85.97,
"learning_rate": 3.7835820895522394e-06,
"loss": 0.2499,
"step": 6190
},
{
"epoch": 86.0,
"eval_loss": 0.5027219653129578,
"eval_runtime": 131.6359,
"eval_samples_per_second": 4.041,
"eval_steps_per_second": 0.509,
"eval_wer": 0.19534614642926015,
"step": 6192
},
{
"epoch": 86.11,
"learning_rate": 3.746268656716418e-06,
"loss": 0.2499,
"step": 6200
},
{
"epoch": 86.25,
"learning_rate": 3.7089552238805973e-06,
"loss": 0.2627,
"step": 6210
},
{
"epoch": 86.39,
"learning_rate": 3.671641791044776e-06,
"loss": 0.2471,
"step": 6220
},
{
"epoch": 86.53,
"learning_rate": 3.6343283582089557e-06,
"loss": 0.2538,
"step": 6230
},
{
"epoch": 86.66,
"learning_rate": 3.5970149253731344e-06,
"loss": 0.2432,
"step": 6240
},
{
"epoch": 86.8,
"learning_rate": 3.5597014925373135e-06,
"loss": 0.2625,
"step": 6250
},
{
"epoch": 86.94,
"learning_rate": 3.5223880597014923e-06,
"loss": 0.253,
"step": 6260
},
{
"epoch": 87.0,
"eval_loss": 0.5000377297401428,
"eval_runtime": 132.268,
"eval_samples_per_second": 4.022,
"eval_steps_per_second": 0.507,
"eval_wer": 0.19515330719290352,
"step": 6264
},
{
"epoch": 87.08,
"learning_rate": 3.485074626865672e-06,
"loss": 0.2605,
"step": 6270
},
{
"epoch": 87.22,
"learning_rate": 3.4477611940298506e-06,
"loss": 0.2625,
"step": 6280
},
{
"epoch": 87.36,
"learning_rate": 3.41044776119403e-06,
"loss": 0.2449,
"step": 6290
},
{
"epoch": 87.5,
"learning_rate": 3.3731343283582093e-06,
"loss": 0.2529,
"step": 6300
},
{
"epoch": 87.64,
"learning_rate": 3.335820895522388e-06,
"loss": 0.2388,
"step": 6310
},
{
"epoch": 87.78,
"learning_rate": 3.2985074626865677e-06,
"loss": 0.2504,
"step": 6320
},
{
"epoch": 87.91,
"learning_rate": 3.2611940298507464e-06,
"loss": 0.2614,
"step": 6330
},
{
"epoch": 88.0,
"eval_loss": 0.4974157512187958,
"eval_runtime": 132.0096,
"eval_samples_per_second": 4.03,
"eval_steps_per_second": 0.508,
"eval_wer": 0.19354631355659832,
"step": 6336
},
{
"epoch": 88.06,
"learning_rate": 3.2238805970149255e-06,
"loss": 0.2682,
"step": 6340
},
{
"epoch": 88.19,
"learning_rate": 3.1865671641791043e-06,
"loss": 0.2494,
"step": 6350
},
{
"epoch": 88.33,
"learning_rate": 3.149253731343284e-06,
"loss": 0.2554,
"step": 6360
},
{
"epoch": 88.47,
"learning_rate": 3.111940298507463e-06,
"loss": 0.2546,
"step": 6370
},
{
"epoch": 88.61,
"learning_rate": 3.0746268656716418e-06,
"loss": 0.2447,
"step": 6380
},
{
"epoch": 88.75,
"learning_rate": 3.037313432835821e-06,
"loss": 0.257,
"step": 6390
},
{
"epoch": 88.89,
"learning_rate": 3e-06,
"loss": 0.2533,
"step": 6400
},
{
"epoch": 89.0,
"eval_loss": 0.4969758987426758,
"eval_runtime": 132.51,
"eval_samples_per_second": 4.015,
"eval_steps_per_second": 0.506,
"eval_wer": 0.1948961882110947,
"step": 6408
},
{
"epoch": 89.03,
"learning_rate": 2.9626865671641792e-06,
"loss": 0.2591,
"step": 6410
},
{
"epoch": 89.17,
"learning_rate": 2.9253731343283584e-06,
"loss": 0.2604,
"step": 6420
},
{
"epoch": 89.3,
"learning_rate": 2.8880597014925376e-06,
"loss": 0.2445,
"step": 6430
},
{
"epoch": 89.44,
"learning_rate": 2.8507462686567167e-06,
"loss": 0.2494,
"step": 6440
},
{
"epoch": 89.58,
"learning_rate": 2.813432835820896e-06,
"loss": 0.255,
"step": 6450
},
{
"epoch": 89.72,
"learning_rate": 2.7761194029850746e-06,
"loss": 0.2512,
"step": 6460
},
{
"epoch": 89.86,
"learning_rate": 2.7388059701492538e-06,
"loss": 0.253,
"step": 6470
},
{
"epoch": 90.0,
"learning_rate": 2.701492537313433e-06,
"loss": 0.2553,
"step": 6480
},
{
"epoch": 90.0,
"eval_loss": 0.5005418658256531,
"eval_runtime": 131.5872,
"eval_samples_per_second": 4.043,
"eval_steps_per_second": 0.509,
"eval_wer": 0.19296779584752843,
"step": 6480
},
{
"epoch": 90.14,
"learning_rate": 2.664179104477612e-06,
"loss": 0.2521,
"step": 6490
},
{
"epoch": 90.28,
"learning_rate": 2.626865671641791e-06,
"loss": 0.2599,
"step": 6500
},
{
"epoch": 90.42,
"learning_rate": 2.5895522388059704e-06,
"loss": 0.256,
"step": 6510
},
{
"epoch": 90.55,
"learning_rate": 2.5522388059701496e-06,
"loss": 0.2559,
"step": 6520
},
{
"epoch": 90.69,
"learning_rate": 2.5149253731343287e-06,
"loss": 0.2507,
"step": 6530
},
{
"epoch": 90.83,
"learning_rate": 2.4776119402985074e-06,
"loss": 0.2525,
"step": 6540
},
{
"epoch": 90.97,
"learning_rate": 2.4402985074626866e-06,
"loss": 0.2518,
"step": 6550
},
{
"epoch": 91.0,
"eval_loss": 0.5009539127349854,
"eval_runtime": 131.4903,
"eval_samples_per_second": 4.046,
"eval_steps_per_second": 0.51,
"eval_wer": 0.1948961882110947,
"step": 6552
},
{
"epoch": 91.11,
"learning_rate": 2.4029850746268658e-06,
"loss": 0.2618,
"step": 6560
},
{
"epoch": 91.25,
"learning_rate": 2.365671641791045e-06,
"loss": 0.2592,
"step": 6570
},
{
"epoch": 91.39,
"learning_rate": 2.328358208955224e-06,
"loss": 0.2505,
"step": 6580
},
{
"epoch": 91.53,
"learning_rate": 2.291044776119403e-06,
"loss": 0.2539,
"step": 6590
},
{
"epoch": 91.66,
"learning_rate": 2.2537313432835824e-06,
"loss": 0.249,
"step": 6600
},
{
"epoch": 91.8,
"learning_rate": 2.2164179104477616e-06,
"loss": 0.2428,
"step": 6610
},
{
"epoch": 91.94,
"learning_rate": 2.1791044776119403e-06,
"loss": 0.2481,
"step": 6620
},
{
"epoch": 92.0,
"eval_loss": 0.4958493113517761,
"eval_runtime": 131.9046,
"eval_samples_per_second": 4.033,
"eval_steps_per_second": 0.508,
"eval_wer": 0.1918107604293887,
"step": 6624
},
{
"epoch": 92.08,
"learning_rate": 2.1417910447761194e-06,
"loss": 0.2649,
"step": 6630
},
{
"epoch": 92.22,
"learning_rate": 2.1044776119402986e-06,
"loss": 0.2549,
"step": 6640
},
{
"epoch": 92.36,
"learning_rate": 2.0671641791044778e-06,
"loss": 0.2425,
"step": 6650
},
{
"epoch": 92.5,
"learning_rate": 2.029850746268657e-06,
"loss": 0.2598,
"step": 6660
},
{
"epoch": 92.64,
"learning_rate": 1.9925373134328357e-06,
"loss": 0.2429,
"step": 6670
},
{
"epoch": 92.78,
"learning_rate": 1.955223880597015e-06,
"loss": 0.2596,
"step": 6680
},
{
"epoch": 92.91,
"learning_rate": 1.9179104477611944e-06,
"loss": 0.2491,
"step": 6690
},
{
"epoch": 93.0,
"eval_loss": 0.4932185709476471,
"eval_runtime": 131.4467,
"eval_samples_per_second": 4.047,
"eval_steps_per_second": 0.51,
"eval_wer": 0.1909108439930578,
"step": 6696
},
{
"epoch": 93.06,
"learning_rate": 1.8805970149253733e-06,
"loss": 0.2682,
"step": 6700
},
{
"epoch": 93.19,
"learning_rate": 1.8432835820895525e-06,
"loss": 0.2455,
"step": 6710
},
{
"epoch": 93.33,
"learning_rate": 1.8059701492537314e-06,
"loss": 0.2456,
"step": 6720
},
{
"epoch": 93.47,
"learning_rate": 1.7686567164179106e-06,
"loss": 0.2493,
"step": 6730
},
{
"epoch": 93.61,
"learning_rate": 1.7313432835820896e-06,
"loss": 0.2526,
"step": 6740
},
{
"epoch": 93.75,
"learning_rate": 1.6940298507462687e-06,
"loss": 0.2599,
"step": 6750
},
{
"epoch": 93.89,
"learning_rate": 1.6567164179104477e-06,
"loss": 0.2455,
"step": 6760
},
{
"epoch": 94.0,
"eval_loss": 0.493074506521225,
"eval_runtime": 131.6855,
"eval_samples_per_second": 4.04,
"eval_steps_per_second": 0.509,
"eval_wer": 0.19123224272031883,
"step": 6768
},
{
"epoch": 94.03,
"learning_rate": 1.6194029850746268e-06,
"loss": 0.2531,
"step": 6770
},
{
"epoch": 94.17,
"learning_rate": 1.5820895522388062e-06,
"loss": 0.2513,
"step": 6780
},
{
"epoch": 94.3,
"learning_rate": 1.5447761194029851e-06,
"loss": 0.2534,
"step": 6790
},
{
"epoch": 94.44,
"learning_rate": 1.5111940298507464e-06,
"loss": 0.2418,
"step": 6800
},
{
"epoch": 94.58,
"learning_rate": 1.4738805970149254e-06,
"loss": 0.2407,
"step": 6810
},
{
"epoch": 94.72,
"learning_rate": 1.4365671641791045e-06,
"loss": 0.251,
"step": 6820
},
{
"epoch": 94.86,
"learning_rate": 1.3992537313432837e-06,
"loss": 0.2494,
"step": 6830
},
{
"epoch": 95.0,
"learning_rate": 1.3619402985074628e-06,
"loss": 0.2581,
"step": 6840
},
{
"epoch": 95.0,
"eval_loss": 0.49741461873054504,
"eval_runtime": 132.2805,
"eval_samples_per_second": 4.022,
"eval_steps_per_second": 0.506,
"eval_wer": 0.19148936170212766,
"step": 6840
},
{
"epoch": 95.14,
"learning_rate": 1.3246268656716418e-06,
"loss": 0.2415,
"step": 6850
},
{
"epoch": 95.28,
"learning_rate": 1.287313432835821e-06,
"loss": 0.2474,
"step": 6860
},
{
"epoch": 95.42,
"learning_rate": 1.25e-06,
"loss": 0.2488,
"step": 6870
},
{
"epoch": 95.55,
"learning_rate": 1.2126865671641793e-06,
"loss": 0.2566,
"step": 6880
},
{
"epoch": 95.69,
"learning_rate": 1.1753731343283582e-06,
"loss": 0.2457,
"step": 6890
},
{
"epoch": 95.83,
"learning_rate": 1.1380597014925374e-06,
"loss": 0.2489,
"step": 6900
},
{
"epoch": 95.97,
"learning_rate": 1.1007462686567163e-06,
"loss": 0.2578,
"step": 6910
},
{
"epoch": 96.0,
"eval_loss": 0.4990382492542267,
"eval_runtime": 131.6402,
"eval_samples_per_second": 4.041,
"eval_steps_per_second": 0.509,
"eval_wer": 0.1909108439930578,
"step": 6912
},
{
"epoch": 96.11,
"learning_rate": 1.0634328358208957e-06,
"loss": 0.2528,
"step": 6920
},
{
"epoch": 96.25,
"learning_rate": 1.0261194029850746e-06,
"loss": 0.2517,
"step": 6930
},
{
"epoch": 96.39,
"learning_rate": 9.888059701492538e-07,
"loss": 0.2358,
"step": 6940
},
{
"epoch": 96.53,
"learning_rate": 9.514925373134328e-07,
"loss": 0.254,
"step": 6950
},
{
"epoch": 96.66,
"learning_rate": 9.141791044776121e-07,
"loss": 0.2491,
"step": 6960
},
{
"epoch": 96.8,
"learning_rate": 8.768656716417912e-07,
"loss": 0.2494,
"step": 6970
},
{
"epoch": 96.94,
"learning_rate": 8.395522388059702e-07,
"loss": 0.2503,
"step": 6980
},
{
"epoch": 97.0,
"eval_loss": 0.4989832937717438,
"eval_runtime": 131.556,
"eval_samples_per_second": 4.044,
"eval_steps_per_second": 0.509,
"eval_wer": 0.19136080221122323,
"step": 6984
},
{
"epoch": 97.08,
"learning_rate": 8.022388059701493e-07,
"loss": 0.2468,
"step": 6990
},
{
"epoch": 97.22,
"learning_rate": 7.649253731343284e-07,
"loss": 0.2519,
"step": 7000
},
{
"epoch": 97.36,
"learning_rate": 7.276119402985075e-07,
"loss": 0.2464,
"step": 7010
},
{
"epoch": 97.5,
"learning_rate": 6.902985074626866e-07,
"loss": 0.2423,
"step": 7020
},
{
"epoch": 97.64,
"learning_rate": 6.529850746268657e-07,
"loss": 0.2327,
"step": 7030
},
{
"epoch": 97.78,
"learning_rate": 6.156716417910448e-07,
"loss": 0.2523,
"step": 7040
},
{
"epoch": 97.91,
"learning_rate": 5.783582089552239e-07,
"loss": 0.2544,
"step": 7050
},
{
"epoch": 98.0,
"eval_loss": 0.4931636154651642,
"eval_runtime": 132.145,
"eval_samples_per_second": 4.026,
"eval_steps_per_second": 0.507,
"eval_wer": 0.1903323262839879,
"step": 7056
},
{
"epoch": 98.06,
"learning_rate": 5.41044776119403e-07,
"loss": 0.2491,
"step": 7060
},
{
"epoch": 98.19,
"learning_rate": 5.037313432835821e-07,
"loss": 0.2483,
"step": 7070
},
{
"epoch": 98.33,
"learning_rate": 4.6641791044776116e-07,
"loss": 0.2478,
"step": 7080
},
{
"epoch": 98.47,
"learning_rate": 4.291044776119403e-07,
"loss": 0.255,
"step": 7090
},
{
"epoch": 98.61,
"learning_rate": 3.9179104477611937e-07,
"loss": 0.2429,
"step": 7100
},
{
"epoch": 98.75,
"learning_rate": 3.544776119402985e-07,
"loss": 0.2524,
"step": 7110
},
{
"epoch": 98.89,
"learning_rate": 3.1716417910447763e-07,
"loss": 0.2391,
"step": 7120
},
{
"epoch": 99.0,
"eval_loss": 0.49354514479637146,
"eval_runtime": 131.8773,
"eval_samples_per_second": 4.034,
"eval_steps_per_second": 0.508,
"eval_wer": 0.1903966060294401,
"step": 7128
},
{
"epoch": 99.03,
"learning_rate": 2.7985074626865674e-07,
"loss": 0.265,
"step": 7130
},
{
"epoch": 99.17,
"learning_rate": 2.4253731343283584e-07,
"loss": 0.2477,
"step": 7140
},
{
"epoch": 99.3,
"learning_rate": 2.0522388059701492e-07,
"loss": 0.2497,
"step": 7150
},
{
"epoch": 99.44,
"learning_rate": 1.6791044776119403e-07,
"loss": 0.2535,
"step": 7160
},
{
"epoch": 99.58,
"learning_rate": 1.3059701492537316e-07,
"loss": 0.2511,
"step": 7170
},
{
"epoch": 99.72,
"learning_rate": 9.328358208955224e-08,
"loss": 0.2441,
"step": 7180
},
{
"epoch": 99.86,
"learning_rate": 5.597014925373135e-08,
"loss": 0.2413,
"step": 7190
},
{
"epoch": 100.0,
"learning_rate": 1.8656716417910447e-08,
"loss": 0.2498,
"step": 7200
},
{
"epoch": 100.0,
"eval_loss": 0.4945172667503357,
"eval_runtime": 132.2872,
"eval_samples_per_second": 4.022,
"eval_steps_per_second": 0.506,
"eval_wer": 0.1909108439930578,
"step": 7200
},
{
"epoch": 100.0,
"step": 7200,
"total_flos": 2.7202925310621965e+20,
"train_loss": 0.2786852648191982,
"train_runtime": 194751.2153,
"train_samples_per_second": 2.371,
"train_steps_per_second": 0.037
}
],
"max_steps": 7200,
"num_train_epochs": 100,
"total_flos": 2.7202925310621965e+20,
"trial_name": null,
"trial_params": null
}