Aramaic_finetuned_teacher / trainer_state.json
pburub's picture
Upload 9 files
55c2415 verified
{
"best_metric": 0.32863247863247863,
"best_model_checkpoint": "/content/drive/MyDrive/model_ft/checkpoint-60000",
"epoch": 70.58823529411765,
"global_step": 60000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.12,
"learning_rate": 8.25e-08,
"loss": 13.3276,
"step": 100
},
{
"epoch": 0.24,
"learning_rate": 1.6583333333333334e-07,
"loss": 13.3671,
"step": 200
},
{
"epoch": 0.35,
"learning_rate": 2.491666666666667e-07,
"loss": 13.5271,
"step": 300
},
{
"epoch": 0.47,
"learning_rate": 3.3250000000000005e-07,
"loss": 13.1811,
"step": 400
},
{
"epoch": 0.59,
"learning_rate": 4.1583333333333336e-07,
"loss": 13.759,
"step": 500
},
{
"epoch": 0.71,
"learning_rate": 4.991666666666667e-07,
"loss": 12.8466,
"step": 600
},
{
"epoch": 0.82,
"learning_rate": 5.816666666666667e-07,
"loss": 13.2734,
"step": 700
},
{
"epoch": 0.94,
"learning_rate": 6.650000000000001e-07,
"loss": 12.6648,
"step": 800
},
{
"epoch": 1.06,
"learning_rate": 7.483333333333334e-07,
"loss": 11.954,
"step": 900
},
{
"epoch": 1.18,
"learning_rate": 8.316666666666667e-07,
"loss": 10.7418,
"step": 1000
},
{
"epoch": 1.29,
"learning_rate": 9.15e-07,
"loss": 9.103,
"step": 1100
},
{
"epoch": 1.41,
"learning_rate": 9.983333333333334e-07,
"loss": 7.9895,
"step": 1200
},
{
"epoch": 1.53,
"learning_rate": 1.0816666666666668e-06,
"loss": 6.969,
"step": 1300
},
{
"epoch": 1.65,
"learning_rate": 1.165e-06,
"loss": 6.3495,
"step": 1400
},
{
"epoch": 1.76,
"learning_rate": 1.2483333333333334e-06,
"loss": 6.025,
"step": 1500
},
{
"epoch": 1.88,
"learning_rate": 1.3316666666666667e-06,
"loss": 5.5944,
"step": 1600
},
{
"epoch": 2.0,
"learning_rate": 1.415e-06,
"loss": 5.3688,
"step": 1700
},
{
"epoch": 2.12,
"learning_rate": 1.4983333333333335e-06,
"loss": 5.1139,
"step": 1800
},
{
"epoch": 2.24,
"learning_rate": 1.5816666666666668e-06,
"loss": 4.9115,
"step": 1900
},
{
"epoch": 2.35,
"learning_rate": 1.6650000000000002e-06,
"loss": 4.7514,
"step": 2000
},
{
"epoch": 2.47,
"learning_rate": 1.7483333333333335e-06,
"loss": 4.6136,
"step": 2100
},
{
"epoch": 2.59,
"learning_rate": 1.8316666666666668e-06,
"loss": 4.491,
"step": 2200
},
{
"epoch": 2.71,
"learning_rate": 1.9150000000000003e-06,
"loss": 4.342,
"step": 2300
},
{
"epoch": 2.82,
"learning_rate": 1.9983333333333334e-06,
"loss": 4.2564,
"step": 2400
},
{
"epoch": 2.94,
"learning_rate": 2.081666666666667e-06,
"loss": 4.1291,
"step": 2500
},
{
"epoch": 3.06,
"learning_rate": 2.165e-06,
"loss": 4.0612,
"step": 2600
},
{
"epoch": 3.18,
"learning_rate": 2.2483333333333335e-06,
"loss": 3.9644,
"step": 2700
},
{
"epoch": 3.29,
"learning_rate": 2.3316666666666666e-06,
"loss": 3.8365,
"step": 2800
},
{
"epoch": 3.41,
"learning_rate": 2.415e-06,
"loss": 3.8019,
"step": 2900
},
{
"epoch": 3.53,
"learning_rate": 2.4983333333333333e-06,
"loss": 3.7349,
"step": 3000
},
{
"epoch": 3.65,
"learning_rate": 2.581666666666667e-06,
"loss": 3.682,
"step": 3100
},
{
"epoch": 3.76,
"learning_rate": 2.6650000000000003e-06,
"loss": 3.6215,
"step": 3200
},
{
"epoch": 3.88,
"learning_rate": 2.7483333333333334e-06,
"loss": 3.5712,
"step": 3300
},
{
"epoch": 4.0,
"learning_rate": 2.831666666666667e-06,
"loss": 3.5167,
"step": 3400
},
{
"epoch": 4.12,
"learning_rate": 2.915e-06,
"loss": 3.4697,
"step": 3500
},
{
"epoch": 4.24,
"learning_rate": 2.9983333333333336e-06,
"loss": 3.4221,
"step": 3600
},
{
"epoch": 4.35,
"learning_rate": 3.0816666666666667e-06,
"loss": 3.398,
"step": 3700
},
{
"epoch": 4.47,
"learning_rate": 3.165e-06,
"loss": 3.385,
"step": 3800
},
{
"epoch": 4.59,
"learning_rate": 3.2483333333333333e-06,
"loss": 3.3592,
"step": 3900
},
{
"epoch": 4.71,
"learning_rate": 3.331666666666667e-06,
"loss": 3.3542,
"step": 4000
},
{
"epoch": 4.82,
"learning_rate": 3.4150000000000003e-06,
"loss": 3.3356,
"step": 4100
},
{
"epoch": 4.94,
"learning_rate": 3.4983333333333334e-06,
"loss": 3.315,
"step": 4200
},
{
"epoch": 5.06,
"learning_rate": 3.5816666666666674e-06,
"loss": 3.3274,
"step": 4300
},
{
"epoch": 5.18,
"learning_rate": 3.665e-06,
"loss": 3.2824,
"step": 4400
},
{
"epoch": 5.29,
"learning_rate": 3.748333333333334e-06,
"loss": 3.2844,
"step": 4500
},
{
"epoch": 5.41,
"learning_rate": 3.831666666666667e-06,
"loss": 3.2619,
"step": 4600
},
{
"epoch": 5.53,
"learning_rate": 3.915000000000001e-06,
"loss": 3.2613,
"step": 4700
},
{
"epoch": 5.65,
"learning_rate": 3.998333333333334e-06,
"loss": 3.2509,
"step": 4800
},
{
"epoch": 5.76,
"learning_rate": 4.081666666666667e-06,
"loss": 3.2457,
"step": 4900
},
{
"epoch": 5.88,
"learning_rate": 4.165e-06,
"loss": 3.2303,
"step": 5000
},
{
"epoch": 6.0,
"learning_rate": 4.2475e-06,
"loss": 3.235,
"step": 5100
},
{
"epoch": 6.12,
"learning_rate": 4.3308333333333335e-06,
"loss": 3.2095,
"step": 5200
},
{
"epoch": 6.24,
"learning_rate": 4.4141666666666675e-06,
"loss": 3.2111,
"step": 5300
},
{
"epoch": 6.35,
"learning_rate": 4.4975000000000006e-06,
"loss": 3.1865,
"step": 5400
},
{
"epoch": 6.47,
"learning_rate": 4.580833333333334e-06,
"loss": 3.1699,
"step": 5500
},
{
"epoch": 6.59,
"learning_rate": 4.664166666666667e-06,
"loss": 3.1455,
"step": 5600
},
{
"epoch": 6.71,
"learning_rate": 4.747500000000001e-06,
"loss": 3.1055,
"step": 5700
},
{
"epoch": 6.82,
"learning_rate": 4.830833333333334e-06,
"loss": 3.0822,
"step": 5800
},
{
"epoch": 6.94,
"learning_rate": 4.914166666666667e-06,
"loss": 3.0117,
"step": 5900
},
{
"epoch": 7.06,
"learning_rate": 4.997500000000001e-06,
"loss": 2.9725,
"step": 6000
},
{
"epoch": 7.18,
"learning_rate": 5e-06,
"loss": 2.9052,
"step": 6100
},
{
"epoch": 7.29,
"learning_rate": 5e-06,
"loss": 2.8386,
"step": 6200
},
{
"epoch": 7.41,
"learning_rate": 5e-06,
"loss": 2.7776,
"step": 6300
},
{
"epoch": 7.53,
"learning_rate": 5e-06,
"loss": 2.7029,
"step": 6400
},
{
"epoch": 7.65,
"learning_rate": 5e-06,
"loss": 2.6344,
"step": 6500
},
{
"epoch": 7.76,
"learning_rate": 5e-06,
"loss": 2.5601,
"step": 6600
},
{
"epoch": 7.88,
"learning_rate": 5e-06,
"loss": 2.5069,
"step": 6700
},
{
"epoch": 8.0,
"learning_rate": 5e-06,
"loss": 2.4533,
"step": 6800
},
{
"epoch": 8.12,
"learning_rate": 5e-06,
"loss": 2.3527,
"step": 6900
},
{
"epoch": 8.24,
"learning_rate": 5e-06,
"loss": 2.3213,
"step": 7000
},
{
"epoch": 8.35,
"learning_rate": 5e-06,
"loss": 2.2538,
"step": 7100
},
{
"epoch": 8.47,
"learning_rate": 5e-06,
"loss": 2.2051,
"step": 7200
},
{
"epoch": 8.59,
"learning_rate": 5e-06,
"loss": 2.1572,
"step": 7300
},
{
"epoch": 8.71,
"learning_rate": 5e-06,
"loss": 2.1269,
"step": 7400
},
{
"epoch": 8.82,
"learning_rate": 5e-06,
"loss": 2.0919,
"step": 7500
},
{
"epoch": 8.94,
"learning_rate": 5e-06,
"loss": 2.043,
"step": 7600
},
{
"epoch": 9.06,
"learning_rate": 5e-06,
"loss": 1.9963,
"step": 7700
},
{
"epoch": 9.18,
"learning_rate": 5e-06,
"loss": 1.923,
"step": 7800
},
{
"epoch": 9.29,
"learning_rate": 5e-06,
"loss": 1.8817,
"step": 7900
},
{
"epoch": 9.41,
"learning_rate": 5e-06,
"loss": 1.8598,
"step": 8000
},
{
"epoch": 9.53,
"learning_rate": 5e-06,
"loss": 1.853,
"step": 8100
},
{
"epoch": 9.65,
"learning_rate": 5e-06,
"loss": 1.7911,
"step": 8200
},
{
"epoch": 9.76,
"learning_rate": 5e-06,
"loss": 1.801,
"step": 8300
},
{
"epoch": 9.88,
"learning_rate": 5e-06,
"loss": 1.7483,
"step": 8400
},
{
"epoch": 10.0,
"learning_rate": 5e-06,
"loss": 1.6983,
"step": 8500
},
{
"epoch": 10.12,
"learning_rate": 5e-06,
"loss": 1.7095,
"step": 8600
},
{
"epoch": 10.24,
"learning_rate": 5e-06,
"loss": 1.6673,
"step": 8700
},
{
"epoch": 10.35,
"learning_rate": 5e-06,
"loss": 1.662,
"step": 8800
},
{
"epoch": 10.47,
"learning_rate": 5e-06,
"loss": 1.5961,
"step": 8900
},
{
"epoch": 10.59,
"learning_rate": 5e-06,
"loss": 1.5782,
"step": 9000
},
{
"epoch": 10.71,
"learning_rate": 5e-06,
"loss": 1.5687,
"step": 9100
},
{
"epoch": 10.82,
"learning_rate": 5e-06,
"loss": 1.5924,
"step": 9200
},
{
"epoch": 10.94,
"learning_rate": 5e-06,
"loss": 1.5246,
"step": 9300
},
{
"epoch": 11.06,
"learning_rate": 5e-06,
"loss": 1.5382,
"step": 9400
},
{
"epoch": 11.18,
"learning_rate": 5e-06,
"loss": 1.4948,
"step": 9500
},
{
"epoch": 11.29,
"learning_rate": 5e-06,
"loss": 1.4695,
"step": 9600
},
{
"epoch": 11.41,
"learning_rate": 5e-06,
"loss": 1.4473,
"step": 9700
},
{
"epoch": 11.53,
"learning_rate": 5e-06,
"loss": 1.4252,
"step": 9800
},
{
"epoch": 11.65,
"learning_rate": 5e-06,
"loss": 1.4359,
"step": 9900
},
{
"epoch": 11.76,
"learning_rate": 5e-06,
"loss": 1.4131,
"step": 10000
},
{
"epoch": 11.76,
"eval_cer": 0.2265467514343309,
"eval_loss": 1.0398374795913696,
"eval_runtime": 8.2478,
"eval_samples_per_second": 36.374,
"eval_steps_per_second": 18.187,
"eval_wer": 0.7435897435897436,
"step": 10000
},
{
"epoch": 11.88,
"learning_rate": 5e-06,
"loss": 1.4034,
"step": 10100
},
{
"epoch": 12.0,
"learning_rate": 5e-06,
"loss": 1.3831,
"step": 10200
},
{
"epoch": 12.12,
"learning_rate": 5e-06,
"loss": 1.3612,
"step": 10300
},
{
"epoch": 12.24,
"learning_rate": 5e-06,
"loss": 1.3589,
"step": 10400
},
{
"epoch": 12.35,
"learning_rate": 5e-06,
"loss": 1.3453,
"step": 10500
},
{
"epoch": 12.47,
"learning_rate": 5e-06,
"loss": 1.343,
"step": 10600
},
{
"epoch": 12.59,
"learning_rate": 5e-06,
"loss": 1.317,
"step": 10700
},
{
"epoch": 12.71,
"learning_rate": 5e-06,
"loss": 1.3011,
"step": 10800
},
{
"epoch": 12.82,
"learning_rate": 5e-06,
"loss": 1.3333,
"step": 10900
},
{
"epoch": 12.94,
"learning_rate": 5e-06,
"loss": 1.2563,
"step": 11000
},
{
"epoch": 13.06,
"learning_rate": 5e-06,
"loss": 1.3362,
"step": 11100
},
{
"epoch": 13.18,
"learning_rate": 5e-06,
"loss": 1.2656,
"step": 11200
},
{
"epoch": 13.29,
"learning_rate": 5e-06,
"loss": 1.2411,
"step": 11300
},
{
"epoch": 13.41,
"learning_rate": 5e-06,
"loss": 1.2256,
"step": 11400
},
{
"epoch": 13.53,
"learning_rate": 5e-06,
"loss": 1.2319,
"step": 11500
},
{
"epoch": 13.65,
"learning_rate": 5e-06,
"loss": 1.2011,
"step": 11600
},
{
"epoch": 13.76,
"learning_rate": 5e-06,
"loss": 1.1766,
"step": 11700
},
{
"epoch": 13.88,
"learning_rate": 5e-06,
"loss": 1.2659,
"step": 11800
},
{
"epoch": 14.0,
"learning_rate": 5e-06,
"loss": 1.2131,
"step": 11900
},
{
"epoch": 14.12,
"learning_rate": 5e-06,
"loss": 1.1934,
"step": 12000
},
{
"epoch": 14.24,
"learning_rate": 5e-06,
"loss": 1.2018,
"step": 12100
},
{
"epoch": 14.35,
"learning_rate": 5e-06,
"loss": 1.175,
"step": 12200
},
{
"epoch": 14.47,
"learning_rate": 5e-06,
"loss": 1.1658,
"step": 12300
},
{
"epoch": 14.59,
"learning_rate": 5e-06,
"loss": 1.1728,
"step": 12400
},
{
"epoch": 14.71,
"learning_rate": 5e-06,
"loss": 1.1216,
"step": 12500
},
{
"epoch": 14.82,
"learning_rate": 5e-06,
"loss": 1.1417,
"step": 12600
},
{
"epoch": 14.94,
"learning_rate": 5e-06,
"loss": 1.1386,
"step": 12700
},
{
"epoch": 15.06,
"learning_rate": 5e-06,
"loss": 1.0892,
"step": 12800
},
{
"epoch": 15.18,
"learning_rate": 5e-06,
"loss": 1.124,
"step": 12900
},
{
"epoch": 15.29,
"learning_rate": 5e-06,
"loss": 1.1065,
"step": 13000
},
{
"epoch": 15.41,
"learning_rate": 5e-06,
"loss": 1.1189,
"step": 13100
},
{
"epoch": 15.53,
"learning_rate": 5e-06,
"loss": 1.1184,
"step": 13200
},
{
"epoch": 15.65,
"learning_rate": 5e-06,
"loss": 1.0709,
"step": 13300
},
{
"epoch": 15.76,
"learning_rate": 5e-06,
"loss": 1.1085,
"step": 13400
},
{
"epoch": 15.88,
"learning_rate": 5e-06,
"loss": 1.0668,
"step": 13500
},
{
"epoch": 16.0,
"learning_rate": 5e-06,
"loss": 1.104,
"step": 13600
},
{
"epoch": 16.12,
"learning_rate": 5e-06,
"loss": 1.0781,
"step": 13700
},
{
"epoch": 16.24,
"learning_rate": 5e-06,
"loss": 1.0525,
"step": 13800
},
{
"epoch": 16.35,
"learning_rate": 5e-06,
"loss": 1.0667,
"step": 13900
},
{
"epoch": 16.47,
"learning_rate": 5e-06,
"loss": 1.0298,
"step": 14000
},
{
"epoch": 16.59,
"learning_rate": 5e-06,
"loss": 1.093,
"step": 14100
},
{
"epoch": 16.71,
"learning_rate": 5e-06,
"loss": 1.0394,
"step": 14200
},
{
"epoch": 16.82,
"learning_rate": 5e-06,
"loss": 1.0356,
"step": 14300
},
{
"epoch": 16.94,
"learning_rate": 5e-06,
"loss": 1.0467,
"step": 14400
},
{
"epoch": 17.06,
"learning_rate": 5e-06,
"loss": 1.0171,
"step": 14500
},
{
"epoch": 17.18,
"learning_rate": 5e-06,
"loss": 1.0577,
"step": 14600
},
{
"epoch": 17.29,
"learning_rate": 5e-06,
"loss": 1.0329,
"step": 14700
},
{
"epoch": 17.41,
"learning_rate": 5e-06,
"loss": 1.0385,
"step": 14800
},
{
"epoch": 17.53,
"learning_rate": 5e-06,
"loss": 0.9814,
"step": 14900
},
{
"epoch": 17.65,
"learning_rate": 5e-06,
"loss": 1.0115,
"step": 15000
},
{
"epoch": 17.76,
"learning_rate": 5e-06,
"loss": 0.9966,
"step": 15100
},
{
"epoch": 17.88,
"learning_rate": 5e-06,
"loss": 1.0068,
"step": 15200
},
{
"epoch": 18.0,
"learning_rate": 5e-06,
"loss": 0.9655,
"step": 15300
},
{
"epoch": 18.12,
"learning_rate": 5e-06,
"loss": 1.0097,
"step": 15400
},
{
"epoch": 18.24,
"learning_rate": 5e-06,
"loss": 0.9861,
"step": 15500
},
{
"epoch": 18.35,
"learning_rate": 5e-06,
"loss": 0.9604,
"step": 15600
},
{
"epoch": 18.47,
"learning_rate": 5e-06,
"loss": 0.9894,
"step": 15700
},
{
"epoch": 18.59,
"learning_rate": 5e-06,
"loss": 1.0,
"step": 15800
},
{
"epoch": 18.71,
"learning_rate": 5e-06,
"loss": 0.9469,
"step": 15900
},
{
"epoch": 18.82,
"learning_rate": 5e-06,
"loss": 0.9675,
"step": 16000
},
{
"epoch": 18.94,
"learning_rate": 5e-06,
"loss": 1.0127,
"step": 16100
},
{
"epoch": 19.06,
"learning_rate": 5e-06,
"loss": 0.9574,
"step": 16200
},
{
"epoch": 19.18,
"learning_rate": 5e-06,
"loss": 0.9775,
"step": 16300
},
{
"epoch": 19.29,
"learning_rate": 5e-06,
"loss": 0.9302,
"step": 16400
},
{
"epoch": 19.41,
"learning_rate": 5e-06,
"loss": 0.9379,
"step": 16500
},
{
"epoch": 19.53,
"learning_rate": 5e-06,
"loss": 0.9498,
"step": 16600
},
{
"epoch": 19.65,
"learning_rate": 5e-06,
"loss": 0.9449,
"step": 16700
},
{
"epoch": 19.76,
"learning_rate": 5e-06,
"loss": 0.9567,
"step": 16800
},
{
"epoch": 19.88,
"learning_rate": 5e-06,
"loss": 0.9288,
"step": 16900
},
{
"epoch": 20.0,
"learning_rate": 5e-06,
"loss": 0.9174,
"step": 17000
},
{
"epoch": 20.12,
"learning_rate": 5e-06,
"loss": 0.8975,
"step": 17100
},
{
"epoch": 20.24,
"learning_rate": 5e-06,
"loss": 0.907,
"step": 17200
},
{
"epoch": 20.35,
"learning_rate": 5e-06,
"loss": 0.9152,
"step": 17300
},
{
"epoch": 20.47,
"learning_rate": 5e-06,
"loss": 0.9345,
"step": 17400
},
{
"epoch": 20.59,
"learning_rate": 5e-06,
"loss": 0.9491,
"step": 17500
},
{
"epoch": 20.71,
"learning_rate": 5e-06,
"loss": 0.8746,
"step": 17600
},
{
"epoch": 20.82,
"learning_rate": 5e-06,
"loss": 0.9377,
"step": 17700
},
{
"epoch": 20.94,
"learning_rate": 5e-06,
"loss": 0.9243,
"step": 17800
},
{
"epoch": 21.06,
"learning_rate": 5e-06,
"loss": 0.9177,
"step": 17900
},
{
"epoch": 21.18,
"learning_rate": 5e-06,
"loss": 0.8991,
"step": 18000
},
{
"epoch": 21.29,
"learning_rate": 5e-06,
"loss": 0.8724,
"step": 18100
},
{
"epoch": 21.41,
"learning_rate": 5e-06,
"loss": 0.874,
"step": 18200
},
{
"epoch": 21.53,
"learning_rate": 5e-06,
"loss": 0.934,
"step": 18300
},
{
"epoch": 21.65,
"learning_rate": 5e-06,
"loss": 0.868,
"step": 18400
},
{
"epoch": 21.76,
"learning_rate": 5e-06,
"loss": 0.8915,
"step": 18500
},
{
"epoch": 21.88,
"learning_rate": 5e-06,
"loss": 0.8902,
"step": 18600
},
{
"epoch": 22.0,
"learning_rate": 5e-06,
"loss": 0.8871,
"step": 18700
},
{
"epoch": 22.12,
"learning_rate": 5e-06,
"loss": 0.883,
"step": 18800
},
{
"epoch": 22.24,
"learning_rate": 5e-06,
"loss": 0.8589,
"step": 18900
},
{
"epoch": 22.35,
"learning_rate": 5e-06,
"loss": 0.8407,
"step": 19000
},
{
"epoch": 22.47,
"learning_rate": 5e-06,
"loss": 0.8759,
"step": 19100
},
{
"epoch": 22.59,
"learning_rate": 5e-06,
"loss": 0.8964,
"step": 19200
},
{
"epoch": 22.71,
"learning_rate": 5e-06,
"loss": 0.8961,
"step": 19300
},
{
"epoch": 22.82,
"learning_rate": 5e-06,
"loss": 0.8789,
"step": 19400
},
{
"epoch": 22.94,
"learning_rate": 5e-06,
"loss": 0.8619,
"step": 19500
},
{
"epoch": 23.06,
"learning_rate": 5e-06,
"loss": 0.8907,
"step": 19600
},
{
"epoch": 23.18,
"learning_rate": 5e-06,
"loss": 0.8332,
"step": 19700
},
{
"epoch": 23.29,
"learning_rate": 5e-06,
"loss": 0.8518,
"step": 19800
},
{
"epoch": 23.41,
"learning_rate": 5e-06,
"loss": 0.8685,
"step": 19900
},
{
"epoch": 23.53,
"learning_rate": 5e-06,
"loss": 0.8208,
"step": 20000
},
{
"epoch": 23.53,
"eval_cer": 0.1398666459916266,
"eval_loss": 0.5984983444213867,
"eval_runtime": 7.9445,
"eval_samples_per_second": 37.762,
"eval_steps_per_second": 18.881,
"eval_wer": 0.48846153846153845,
"step": 20000
},
{
"epoch": 23.65,
"learning_rate": 5e-06,
"loss": 0.8495,
"step": 20100
},
{
"epoch": 23.76,
"learning_rate": 5e-06,
"loss": 0.8308,
"step": 20200
},
{
"epoch": 23.88,
"learning_rate": 5e-06,
"loss": 0.8871,
"step": 20300
},
{
"epoch": 24.0,
"learning_rate": 5e-06,
"loss": 0.8437,
"step": 20400
},
{
"epoch": 24.12,
"learning_rate": 5e-06,
"loss": 0.8301,
"step": 20500
},
{
"epoch": 24.24,
"learning_rate": 5e-06,
"loss": 0.8147,
"step": 20600
},
{
"epoch": 24.35,
"learning_rate": 5e-06,
"loss": 0.8189,
"step": 20700
},
{
"epoch": 24.47,
"learning_rate": 5e-06,
"loss": 0.8449,
"step": 20800
},
{
"epoch": 24.59,
"learning_rate": 5e-06,
"loss": 0.8581,
"step": 20900
},
{
"epoch": 24.71,
"learning_rate": 5e-06,
"loss": 0.8694,
"step": 21000
},
{
"epoch": 24.82,
"learning_rate": 5e-06,
"loss": 0.8206,
"step": 21100
},
{
"epoch": 24.94,
"learning_rate": 5e-06,
"loss": 0.8328,
"step": 21200
},
{
"epoch": 25.06,
"learning_rate": 5e-06,
"loss": 0.8133,
"step": 21300
},
{
"epoch": 25.18,
"learning_rate": 5e-06,
"loss": 0.7928,
"step": 21400
},
{
"epoch": 25.29,
"learning_rate": 5e-06,
"loss": 0.8863,
"step": 21500
},
{
"epoch": 25.41,
"learning_rate": 5e-06,
"loss": 0.8131,
"step": 21600
},
{
"epoch": 25.53,
"learning_rate": 5e-06,
"loss": 0.8293,
"step": 21700
},
{
"epoch": 25.65,
"learning_rate": 5e-06,
"loss": 0.8113,
"step": 21800
},
{
"epoch": 25.76,
"learning_rate": 5e-06,
"loss": 0.8267,
"step": 21900
},
{
"epoch": 25.88,
"learning_rate": 5e-06,
"loss": 0.7989,
"step": 22000
},
{
"epoch": 26.0,
"learning_rate": 5e-06,
"loss": 0.7918,
"step": 22100
},
{
"epoch": 26.12,
"learning_rate": 5e-06,
"loss": 0.7992,
"step": 22200
},
{
"epoch": 26.24,
"learning_rate": 5e-06,
"loss": 0.8054,
"step": 22300
},
{
"epoch": 26.35,
"learning_rate": 5e-06,
"loss": 0.8051,
"step": 22400
},
{
"epoch": 26.47,
"learning_rate": 5e-06,
"loss": 0.804,
"step": 22500
},
{
"epoch": 26.59,
"learning_rate": 5e-06,
"loss": 0.8245,
"step": 22600
},
{
"epoch": 26.71,
"learning_rate": 5e-06,
"loss": 0.7936,
"step": 22700
},
{
"epoch": 26.82,
"learning_rate": 5e-06,
"loss": 0.7919,
"step": 22800
},
{
"epoch": 26.94,
"learning_rate": 5e-06,
"loss": 0.8058,
"step": 22900
},
{
"epoch": 27.06,
"learning_rate": 5e-06,
"loss": 0.7936,
"step": 23000
},
{
"epoch": 27.18,
"learning_rate": 5e-06,
"loss": 0.7966,
"step": 23100
},
{
"epoch": 27.29,
"learning_rate": 5e-06,
"loss": 0.8066,
"step": 23200
},
{
"epoch": 27.41,
"learning_rate": 5e-06,
"loss": 0.7742,
"step": 23300
},
{
"epoch": 27.53,
"learning_rate": 5e-06,
"loss": 0.7858,
"step": 23400
},
{
"epoch": 27.65,
"learning_rate": 5e-06,
"loss": 0.7878,
"step": 23500
},
{
"epoch": 27.76,
"learning_rate": 5e-06,
"loss": 0.8145,
"step": 23600
},
{
"epoch": 27.88,
"learning_rate": 5e-06,
"loss": 0.7742,
"step": 23700
},
{
"epoch": 28.0,
"learning_rate": 5e-06,
"loss": 0.8084,
"step": 23800
},
{
"epoch": 28.12,
"learning_rate": 5e-06,
"loss": 0.7966,
"step": 23900
},
{
"epoch": 28.24,
"learning_rate": 5e-06,
"loss": 0.7893,
"step": 24000
},
{
"epoch": 28.35,
"learning_rate": 5e-06,
"loss": 0.7749,
"step": 24100
},
{
"epoch": 28.47,
"learning_rate": 5e-06,
"loss": 0.8018,
"step": 24200
},
{
"epoch": 28.59,
"learning_rate": 5e-06,
"loss": 0.7528,
"step": 24300
},
{
"epoch": 28.71,
"learning_rate": 5e-06,
"loss": 0.7794,
"step": 24400
},
{
"epoch": 28.82,
"learning_rate": 5e-06,
"loss": 0.7573,
"step": 24500
},
{
"epoch": 28.94,
"learning_rate": 5e-06,
"loss": 0.7688,
"step": 24600
},
{
"epoch": 29.06,
"learning_rate": 5e-06,
"loss": 0.7859,
"step": 24700
},
{
"epoch": 29.18,
"learning_rate": 5e-06,
"loss": 0.739,
"step": 24800
},
{
"epoch": 29.29,
"learning_rate": 5e-06,
"loss": 0.7646,
"step": 24900
},
{
"epoch": 29.41,
"learning_rate": 5e-06,
"loss": 0.757,
"step": 25000
},
{
"epoch": 29.53,
"learning_rate": 5e-06,
"loss": 0.7316,
"step": 25100
},
{
"epoch": 29.65,
"learning_rate": 5e-06,
"loss": 0.746,
"step": 25200
},
{
"epoch": 29.76,
"learning_rate": 5e-06,
"loss": 0.7443,
"step": 25300
},
{
"epoch": 29.88,
"learning_rate": 5e-06,
"loss": 0.766,
"step": 25400
},
{
"epoch": 30.0,
"learning_rate": 5e-06,
"loss": 0.7928,
"step": 25500
},
{
"epoch": 30.12,
"learning_rate": 5e-06,
"loss": 0.7454,
"step": 25600
},
{
"epoch": 30.24,
"learning_rate": 5e-06,
"loss": 0.7576,
"step": 25700
},
{
"epoch": 30.35,
"learning_rate": 5e-06,
"loss": 0.7885,
"step": 25800
},
{
"epoch": 30.47,
"learning_rate": 5e-06,
"loss": 0.7166,
"step": 25900
},
{
"epoch": 30.59,
"learning_rate": 5e-06,
"loss": 0.727,
"step": 26000
},
{
"epoch": 30.71,
"learning_rate": 5e-06,
"loss": 0.7202,
"step": 26100
},
{
"epoch": 30.82,
"learning_rate": 5e-06,
"loss": 0.7493,
"step": 26200
},
{
"epoch": 30.94,
"learning_rate": 5e-06,
"loss": 0.7584,
"step": 26300
},
{
"epoch": 31.06,
"learning_rate": 5e-06,
"loss": 0.7856,
"step": 26400
},
{
"epoch": 31.18,
"learning_rate": 5e-06,
"loss": 0.7151,
"step": 26500
},
{
"epoch": 31.29,
"learning_rate": 5e-06,
"loss": 0.7352,
"step": 26600
},
{
"epoch": 31.41,
"learning_rate": 5e-06,
"loss": 0.7561,
"step": 26700
},
{
"epoch": 31.53,
"learning_rate": 5e-06,
"loss": 0.7357,
"step": 26800
},
{
"epoch": 31.65,
"learning_rate": 5e-06,
"loss": 0.7398,
"step": 26900
},
{
"epoch": 31.76,
"learning_rate": 5e-06,
"loss": 0.717,
"step": 27000
},
{
"epoch": 31.88,
"learning_rate": 5e-06,
"loss": 0.7405,
"step": 27100
},
{
"epoch": 32.0,
"learning_rate": 5e-06,
"loss": 0.7155,
"step": 27200
},
{
"epoch": 32.12,
"learning_rate": 5e-06,
"loss": 0.7264,
"step": 27300
},
{
"epoch": 32.24,
"learning_rate": 5e-06,
"loss": 0.7139,
"step": 27400
},
{
"epoch": 32.35,
"learning_rate": 5e-06,
"loss": 0.7467,
"step": 27500
},
{
"epoch": 32.47,
"learning_rate": 5e-06,
"loss": 0.7192,
"step": 27600
},
{
"epoch": 32.59,
"learning_rate": 5e-06,
"loss": 0.7297,
"step": 27700
},
{
"epoch": 32.71,
"learning_rate": 5e-06,
"loss": 0.6969,
"step": 27800
},
{
"epoch": 32.82,
"learning_rate": 5e-06,
"loss": 0.7302,
"step": 27900
},
{
"epoch": 32.94,
"learning_rate": 5e-06,
"loss": 0.6971,
"step": 28000
},
{
"epoch": 33.06,
"learning_rate": 5e-06,
"loss": 0.7248,
"step": 28100
},
{
"epoch": 33.18,
"learning_rate": 5e-06,
"loss": 0.7306,
"step": 28200
},
{
"epoch": 33.29,
"learning_rate": 5e-06,
"loss": 0.7182,
"step": 28300
},
{
"epoch": 33.41,
"learning_rate": 5e-06,
"loss": 0.7212,
"step": 28400
},
{
"epoch": 33.53,
"learning_rate": 5e-06,
"loss": 0.7015,
"step": 28500
},
{
"epoch": 33.65,
"learning_rate": 5e-06,
"loss": 0.7072,
"step": 28600
},
{
"epoch": 33.76,
"learning_rate": 5e-06,
"loss": 0.714,
"step": 28700
},
{
"epoch": 33.88,
"learning_rate": 5e-06,
"loss": 0.7088,
"step": 28800
},
{
"epoch": 34.0,
"learning_rate": 5e-06,
"loss": 0.6743,
"step": 28900
},
{
"epoch": 34.12,
"learning_rate": 5e-06,
"loss": 0.7316,
"step": 29000
},
{
"epoch": 34.24,
"learning_rate": 5e-06,
"loss": 0.7142,
"step": 29100
},
{
"epoch": 34.35,
"learning_rate": 5e-06,
"loss": 0.6911,
"step": 29200
},
{
"epoch": 34.47,
"learning_rate": 5e-06,
"loss": 0.713,
"step": 29300
},
{
"epoch": 34.59,
"learning_rate": 5e-06,
"loss": 0.7091,
"step": 29400
},
{
"epoch": 34.71,
"learning_rate": 5e-06,
"loss": 0.7057,
"step": 29500
},
{
"epoch": 34.82,
"learning_rate": 5e-06,
"loss": 0.6711,
"step": 29600
},
{
"epoch": 34.94,
"learning_rate": 5e-06,
"loss": 0.7152,
"step": 29700
},
{
"epoch": 35.06,
"learning_rate": 5e-06,
"loss": 0.6721,
"step": 29800
},
{
"epoch": 35.18,
"learning_rate": 5e-06,
"loss": 0.7131,
"step": 29900
},
{
"epoch": 35.29,
"learning_rate": 5e-06,
"loss": 0.6883,
"step": 30000
},
{
"epoch": 35.29,
"eval_cer": 0.11668475732671732,
"eval_loss": 0.5099760293960571,
"eval_runtime": 8.0478,
"eval_samples_per_second": 37.277,
"eval_steps_per_second": 18.639,
"eval_wer": 0.4008547008547009,
"step": 30000
},
{
"epoch": 35.41,
"learning_rate": 4.9850000000000006e-06,
"loss": 0.6949,
"step": 30100
},
{
"epoch": 35.53,
"learning_rate": 4.968500000000001e-06,
"loss": 0.6943,
"step": 30200
},
{
"epoch": 35.65,
"learning_rate": 4.951833333333333e-06,
"loss": 0.705,
"step": 30300
},
{
"epoch": 35.76,
"learning_rate": 4.935166666666667e-06,
"loss": 0.6903,
"step": 30400
},
{
"epoch": 35.88,
"learning_rate": 4.9185000000000004e-06,
"loss": 0.6813,
"step": 30500
},
{
"epoch": 36.0,
"learning_rate": 4.901833333333334e-06,
"loss": 0.6993,
"step": 30600
},
{
"epoch": 36.12,
"learning_rate": 4.885166666666667e-06,
"loss": 0.7115,
"step": 30700
},
{
"epoch": 36.24,
"learning_rate": 4.8685e-06,
"loss": 0.6808,
"step": 30800
},
{
"epoch": 36.35,
"learning_rate": 4.851833333333334e-06,
"loss": 0.6784,
"step": 30900
},
{
"epoch": 36.47,
"learning_rate": 4.8351666666666665e-06,
"loss": 0.6953,
"step": 31000
},
{
"epoch": 36.59,
"learning_rate": 4.8185000000000005e-06,
"loss": 0.6499,
"step": 31100
},
{
"epoch": 36.71,
"learning_rate": 4.802000000000001e-06,
"loss": 0.6982,
"step": 31200
},
{
"epoch": 36.82,
"learning_rate": 4.785333333333333e-06,
"loss": 0.7057,
"step": 31300
},
{
"epoch": 36.94,
"learning_rate": 4.768666666666667e-06,
"loss": 0.7036,
"step": 31400
},
{
"epoch": 37.06,
"learning_rate": 4.752e-06,
"loss": 0.6677,
"step": 31500
},
{
"epoch": 37.18,
"learning_rate": 4.735333333333334e-06,
"loss": 0.6643,
"step": 31600
},
{
"epoch": 37.29,
"learning_rate": 4.718666666666667e-06,
"loss": 0.7145,
"step": 31700
},
{
"epoch": 37.41,
"learning_rate": 4.702e-06,
"loss": 0.6781,
"step": 31800
},
{
"epoch": 37.53,
"learning_rate": 4.685333333333334e-06,
"loss": 0.69,
"step": 31900
},
{
"epoch": 37.65,
"learning_rate": 4.668666666666667e-06,
"loss": 0.6714,
"step": 32000
},
{
"epoch": 37.76,
"learning_rate": 4.6520000000000005e-06,
"loss": 0.67,
"step": 32100
},
{
"epoch": 37.88,
"learning_rate": 4.635333333333334e-06,
"loss": 0.6496,
"step": 32200
},
{
"epoch": 38.0,
"learning_rate": 4.618666666666667e-06,
"loss": 0.663,
"step": 32300
},
{
"epoch": 38.12,
"learning_rate": 4.602e-06,
"loss": 0.6378,
"step": 32400
},
{
"epoch": 38.24,
"learning_rate": 4.585333333333334e-06,
"loss": 0.694,
"step": 32500
},
{
"epoch": 38.35,
"learning_rate": 4.5686666666666666e-06,
"loss": 0.6994,
"step": 32600
},
{
"epoch": 38.47,
"learning_rate": 4.552000000000001e-06,
"loss": 0.6652,
"step": 32700
},
{
"epoch": 38.59,
"learning_rate": 4.535333333333334e-06,
"loss": 0.6658,
"step": 32800
},
{
"epoch": 38.71,
"learning_rate": 4.518666666666667e-06,
"loss": 0.6388,
"step": 32900
},
{
"epoch": 38.82,
"learning_rate": 4.502e-06,
"loss": 0.6541,
"step": 33000
},
{
"epoch": 38.94,
"learning_rate": 4.4853333333333335e-06,
"loss": 0.69,
"step": 33100
},
{
"epoch": 39.06,
"learning_rate": 4.4686666666666675e-06,
"loss": 0.6705,
"step": 33200
},
{
"epoch": 39.18,
"learning_rate": 4.452e-06,
"loss": 0.6568,
"step": 33300
},
{
"epoch": 39.29,
"learning_rate": 4.435333333333334e-06,
"loss": 0.6731,
"step": 33400
},
{
"epoch": 39.41,
"learning_rate": 4.418666666666667e-06,
"loss": 0.6174,
"step": 33500
},
{
"epoch": 39.53,
"learning_rate": 4.4021666666666666e-06,
"loss": 0.6488,
"step": 33600
},
{
"epoch": 39.65,
"learning_rate": 4.385500000000001e-06,
"loss": 0.6672,
"step": 33700
},
{
"epoch": 39.76,
"learning_rate": 4.368833333333334e-06,
"loss": 0.6654,
"step": 33800
},
{
"epoch": 39.88,
"learning_rate": 4.352166666666667e-06,
"loss": 0.6484,
"step": 33900
},
{
"epoch": 40.0,
"learning_rate": 4.3355e-06,
"loss": 0.6738,
"step": 34000
},
{
"epoch": 40.12,
"learning_rate": 4.3188333333333335e-06,
"loss": 0.6553,
"step": 34100
},
{
"epoch": 40.24,
"learning_rate": 4.3021666666666675e-06,
"loss": 0.6726,
"step": 34200
},
{
"epoch": 40.35,
"learning_rate": 4.2855e-06,
"loss": 0.6605,
"step": 34300
},
{
"epoch": 40.47,
"learning_rate": 4.268833333333334e-06,
"loss": 0.6471,
"step": 34400
},
{
"epoch": 40.59,
"learning_rate": 4.252166666666667e-06,
"loss": 0.6644,
"step": 34500
},
{
"epoch": 40.71,
"learning_rate": 4.2355e-06,
"loss": 0.6396,
"step": 34600
},
{
"epoch": 40.82,
"learning_rate": 4.2188333333333336e-06,
"loss": 0.6682,
"step": 34700
},
{
"epoch": 40.94,
"learning_rate": 4.202166666666667e-06,
"loss": 0.6269,
"step": 34800
},
{
"epoch": 41.06,
"learning_rate": 4.1855e-06,
"loss": 0.6254,
"step": 34900
},
{
"epoch": 41.18,
"learning_rate": 4.168833333333333e-06,
"loss": 0.6285,
"step": 35000
},
{
"epoch": 41.29,
"learning_rate": 4.152166666666667e-06,
"loss": 0.6405,
"step": 35100
},
{
"epoch": 41.41,
"learning_rate": 4.1355000000000005e-06,
"loss": 0.6531,
"step": 35200
},
{
"epoch": 41.53,
"learning_rate": 4.118833333333334e-06,
"loss": 0.626,
"step": 35300
},
{
"epoch": 41.65,
"learning_rate": 4.102166666666667e-06,
"loss": 0.6745,
"step": 35400
},
{
"epoch": 41.76,
"learning_rate": 4.085500000000001e-06,
"loss": 0.6601,
"step": 35500
},
{
"epoch": 41.88,
"learning_rate": 4.068833333333333e-06,
"loss": 0.6223,
"step": 35600
},
{
"epoch": 42.0,
"learning_rate": 4.052166666666667e-06,
"loss": 0.6439,
"step": 35700
},
{
"epoch": 42.12,
"learning_rate": 4.035500000000001e-06,
"loss": 0.6274,
"step": 35800
},
{
"epoch": 42.24,
"learning_rate": 4.018833333333334e-06,
"loss": 0.6163,
"step": 35900
},
{
"epoch": 42.35,
"learning_rate": 4.002166666666667e-06,
"loss": 0.651,
"step": 36000
},
{
"epoch": 42.47,
"learning_rate": 3.9855e-06,
"loss": 0.6341,
"step": 36100
},
{
"epoch": 42.59,
"learning_rate": 3.968833333333333e-06,
"loss": 0.6236,
"step": 36200
},
{
"epoch": 42.71,
"learning_rate": 3.952166666666667e-06,
"loss": 0.6525,
"step": 36300
},
{
"epoch": 42.82,
"learning_rate": 3.935500000000001e-06,
"loss": 0.653,
"step": 36400
},
{
"epoch": 42.94,
"learning_rate": 3.918833333333333e-06,
"loss": 0.6356,
"step": 36500
},
{
"epoch": 43.06,
"learning_rate": 3.902166666666667e-06,
"loss": 0.6413,
"step": 36600
},
{
"epoch": 43.18,
"learning_rate": 3.8855e-06,
"loss": 0.636,
"step": 36700
},
{
"epoch": 43.29,
"learning_rate": 3.8688333333333335e-06,
"loss": 0.6495,
"step": 36800
},
{
"epoch": 43.41,
"learning_rate": 3.852166666666667e-06,
"loss": 0.6472,
"step": 36900
},
{
"epoch": 43.53,
"learning_rate": 3.835666666666667e-06,
"loss": 0.6387,
"step": 37000
},
{
"epoch": 43.65,
"learning_rate": 3.819e-06,
"loss": 0.5985,
"step": 37100
},
{
"epoch": 43.76,
"learning_rate": 3.8023333333333334e-06,
"loss": 0.6109,
"step": 37200
},
{
"epoch": 43.88,
"learning_rate": 3.785666666666667e-06,
"loss": 0.6498,
"step": 37300
},
{
"epoch": 44.0,
"learning_rate": 3.7690000000000003e-06,
"loss": 0.6243,
"step": 37400
},
{
"epoch": 44.12,
"learning_rate": 3.7523333333333335e-06,
"loss": 0.6068,
"step": 37500
},
{
"epoch": 44.24,
"learning_rate": 3.735666666666667e-06,
"loss": 0.6291,
"step": 37600
},
{
"epoch": 44.35,
"learning_rate": 3.7190000000000003e-06,
"loss": 0.6021,
"step": 37700
},
{
"epoch": 44.47,
"learning_rate": 3.702333333333334e-06,
"loss": 0.6444,
"step": 37800
},
{
"epoch": 44.59,
"learning_rate": 3.6856666666666667e-06,
"loss": 0.6265,
"step": 37900
},
{
"epoch": 44.71,
"learning_rate": 3.6690000000000004e-06,
"loss": 0.6596,
"step": 38000
},
{
"epoch": 44.82,
"learning_rate": 3.652333333333334e-06,
"loss": 0.6339,
"step": 38100
},
{
"epoch": 44.94,
"learning_rate": 3.6356666666666668e-06,
"loss": 0.5719,
"step": 38200
},
{
"epoch": 45.06,
"learning_rate": 3.6190000000000004e-06,
"loss": 0.6112,
"step": 38300
},
{
"epoch": 45.18,
"learning_rate": 3.6023333333333336e-06,
"loss": 0.5938,
"step": 38400
},
{
"epoch": 45.29,
"learning_rate": 3.585666666666667e-06,
"loss": 0.6407,
"step": 38500
},
{
"epoch": 45.41,
"learning_rate": 3.569e-06,
"loss": 0.6178,
"step": 38600
},
{
"epoch": 45.53,
"learning_rate": 3.5523333333333337e-06,
"loss": 0.6155,
"step": 38700
},
{
"epoch": 45.65,
"learning_rate": 3.535666666666667e-06,
"loss": 0.6266,
"step": 38800
},
{
"epoch": 45.76,
"learning_rate": 3.519e-06,
"loss": 0.6224,
"step": 38900
},
{
"epoch": 45.88,
"learning_rate": 3.5023333333333337e-06,
"loss": 0.6226,
"step": 39000
},
{
"epoch": 46.0,
"learning_rate": 3.4856666666666674e-06,
"loss": 0.6466,
"step": 39100
},
{
"epoch": 46.12,
"learning_rate": 3.469e-06,
"loss": 0.6224,
"step": 39200
},
{
"epoch": 46.24,
"learning_rate": 3.452333333333334e-06,
"loss": 0.6353,
"step": 39300
},
{
"epoch": 46.35,
"learning_rate": 3.435666666666667e-06,
"loss": 0.6275,
"step": 39400
},
{
"epoch": 46.47,
"learning_rate": 3.4190000000000002e-06,
"loss": 0.5966,
"step": 39500
},
{
"epoch": 46.59,
"learning_rate": 3.4023333333333334e-06,
"loss": 0.5977,
"step": 39600
},
{
"epoch": 46.71,
"learning_rate": 3.385666666666667e-06,
"loss": 0.6113,
"step": 39700
},
{
"epoch": 46.82,
"learning_rate": 3.369e-06,
"loss": 0.5967,
"step": 39800
},
{
"epoch": 46.94,
"learning_rate": 3.3523333333333335e-06,
"loss": 0.6262,
"step": 39900
},
{
"epoch": 47.06,
"learning_rate": 3.3358333333333337e-06,
"loss": 0.5981,
"step": 40000
},
{
"epoch": 47.06,
"eval_cer": 0.1052101100945883,
"eval_loss": 0.48587092757225037,
"eval_runtime": 8.036,
"eval_samples_per_second": 37.332,
"eval_steps_per_second": 18.666,
"eval_wer": 0.3572649572649573,
"step": 40000
},
{
"epoch": 47.18,
"learning_rate": 3.3191666666666674e-06,
"loss": 0.6019,
"step": 40100
},
{
"epoch": 47.29,
"learning_rate": 3.3025e-06,
"loss": 0.5866,
"step": 40200
},
{
"epoch": 47.41,
"learning_rate": 3.2858333333333338e-06,
"loss": 0.5983,
"step": 40300
},
{
"epoch": 47.53,
"learning_rate": 3.269166666666667e-06,
"loss": 0.5854,
"step": 40400
},
{
"epoch": 47.65,
"learning_rate": 3.2525e-06,
"loss": 0.5665,
"step": 40500
},
{
"epoch": 47.76,
"learning_rate": 3.2358333333333334e-06,
"loss": 0.638,
"step": 40600
},
{
"epoch": 47.88,
"learning_rate": 3.219166666666667e-06,
"loss": 0.6153,
"step": 40700
},
{
"epoch": 48.0,
"learning_rate": 3.2025000000000003e-06,
"loss": 0.6046,
"step": 40800
},
{
"epoch": 48.12,
"learning_rate": 3.1858333333333335e-06,
"loss": 0.5652,
"step": 40900
},
{
"epoch": 48.24,
"learning_rate": 3.169166666666667e-06,
"loss": 0.6097,
"step": 41000
},
{
"epoch": 48.35,
"learning_rate": 3.1525e-06,
"loss": 0.5932,
"step": 41100
},
{
"epoch": 48.47,
"learning_rate": 3.1358333333333335e-06,
"loss": 0.6151,
"step": 41200
},
{
"epoch": 48.59,
"learning_rate": 3.119166666666667e-06,
"loss": 0.6048,
"step": 41300
},
{
"epoch": 48.71,
"learning_rate": 3.1025000000000004e-06,
"loss": 0.6,
"step": 41400
},
{
"epoch": 48.82,
"learning_rate": 3.0858333333333336e-06,
"loss": 0.5761,
"step": 41500
},
{
"epoch": 48.94,
"learning_rate": 3.0691666666666668e-06,
"loss": 0.6254,
"step": 41600
},
{
"epoch": 49.06,
"learning_rate": 3.0525000000000004e-06,
"loss": 0.5672,
"step": 41700
},
{
"epoch": 49.18,
"learning_rate": 3.035833333333333e-06,
"loss": 0.6149,
"step": 41800
},
{
"epoch": 49.29,
"learning_rate": 3.019166666666667e-06,
"loss": 0.5854,
"step": 41900
},
{
"epoch": 49.41,
"learning_rate": 3.0025000000000005e-06,
"loss": 0.6052,
"step": 42000
},
{
"epoch": 49.53,
"learning_rate": 2.9858333333333333e-06,
"loss": 0.5895,
"step": 42100
},
{
"epoch": 49.65,
"learning_rate": 2.969166666666667e-06,
"loss": 0.5834,
"step": 42200
},
{
"epoch": 49.76,
"learning_rate": 2.9525000000000005e-06,
"loss": 0.6388,
"step": 42300
},
{
"epoch": 49.88,
"learning_rate": 2.9358333333333333e-06,
"loss": 0.5918,
"step": 42400
},
{
"epoch": 50.0,
"learning_rate": 2.919166666666667e-06,
"loss": 0.5773,
"step": 42500
},
{
"epoch": 50.12,
"learning_rate": 2.9025e-06,
"loss": 0.6082,
"step": 42600
},
{
"epoch": 50.24,
"learning_rate": 2.8860000000000004e-06,
"loss": 0.6115,
"step": 42700
},
{
"epoch": 50.35,
"learning_rate": 2.8693333333333336e-06,
"loss": 0.5777,
"step": 42800
},
{
"epoch": 50.47,
"learning_rate": 2.852666666666667e-06,
"loss": 0.5943,
"step": 42900
},
{
"epoch": 50.59,
"learning_rate": 2.8360000000000005e-06,
"loss": 0.6074,
"step": 43000
},
{
"epoch": 50.71,
"learning_rate": 2.8193333333333332e-06,
"loss": 0.6122,
"step": 43100
},
{
"epoch": 50.82,
"learning_rate": 2.802666666666667e-06,
"loss": 0.5838,
"step": 43200
},
{
"epoch": 50.94,
"learning_rate": 2.7860000000000005e-06,
"loss": 0.58,
"step": 43300
},
{
"epoch": 51.06,
"learning_rate": 2.7693333333333333e-06,
"loss": 0.5893,
"step": 43400
},
{
"epoch": 51.18,
"learning_rate": 2.752666666666667e-06,
"loss": 0.5824,
"step": 43500
},
{
"epoch": 51.29,
"learning_rate": 2.736e-06,
"loss": 0.5602,
"step": 43600
},
{
"epoch": 51.41,
"learning_rate": 2.7193333333333338e-06,
"loss": 0.5984,
"step": 43700
},
{
"epoch": 51.53,
"learning_rate": 2.7026666666666666e-06,
"loss": 0.598,
"step": 43800
},
{
"epoch": 51.65,
"learning_rate": 2.686e-06,
"loss": 0.6005,
"step": 43900
},
{
"epoch": 51.76,
"learning_rate": 2.669333333333334e-06,
"loss": 0.5941,
"step": 44000
},
{
"epoch": 51.88,
"learning_rate": 2.6526666666666666e-06,
"loss": 0.5956,
"step": 44100
},
{
"epoch": 52.0,
"learning_rate": 2.6360000000000003e-06,
"loss": 0.5674,
"step": 44200
},
{
"epoch": 52.12,
"learning_rate": 2.619333333333334e-06,
"loss": 0.5929,
"step": 44300
},
{
"epoch": 52.24,
"learning_rate": 2.6026666666666667e-06,
"loss": 0.5803,
"step": 44400
},
{
"epoch": 52.35,
"learning_rate": 2.5860000000000003e-06,
"loss": 0.5656,
"step": 44500
},
{
"epoch": 52.47,
"learning_rate": 2.5693333333333335e-06,
"loss": 0.611,
"step": 44600
},
{
"epoch": 52.59,
"learning_rate": 2.5526666666666667e-06,
"loss": 0.5677,
"step": 44700
},
{
"epoch": 52.71,
"learning_rate": 2.536e-06,
"loss": 0.5909,
"step": 44800
},
{
"epoch": 52.82,
"learning_rate": 2.5193333333333336e-06,
"loss": 0.5803,
"step": 44900
},
{
"epoch": 52.94,
"learning_rate": 2.5026666666666672e-06,
"loss": 0.589,
"step": 45000
},
{
"epoch": 53.06,
"learning_rate": 2.486e-06,
"loss": 0.592,
"step": 45100
},
{
"epoch": 53.18,
"learning_rate": 2.4693333333333336e-06,
"loss": 0.583,
"step": 45200
},
{
"epoch": 53.29,
"learning_rate": 2.452666666666667e-06,
"loss": 0.5544,
"step": 45300
},
{
"epoch": 53.41,
"learning_rate": 2.4360000000000005e-06,
"loss": 0.5524,
"step": 45400
},
{
"epoch": 53.53,
"learning_rate": 2.4193333333333337e-06,
"loss": 0.5719,
"step": 45500
},
{
"epoch": 53.65,
"learning_rate": 2.402666666666667e-06,
"loss": 0.5986,
"step": 45600
},
{
"epoch": 53.76,
"learning_rate": 2.386e-06,
"loss": 0.5815,
"step": 45700
},
{
"epoch": 53.88,
"learning_rate": 2.3693333333333333e-06,
"loss": 0.5761,
"step": 45800
},
{
"epoch": 54.0,
"learning_rate": 2.352666666666667e-06,
"loss": 0.594,
"step": 45900
},
{
"epoch": 54.12,
"learning_rate": 2.336e-06,
"loss": 0.5625,
"step": 46000
},
{
"epoch": 54.24,
"learning_rate": 2.3195e-06,
"loss": 0.5961,
"step": 46100
},
{
"epoch": 54.35,
"learning_rate": 2.3028333333333336e-06,
"loss": 0.5907,
"step": 46200
},
{
"epoch": 54.47,
"learning_rate": 2.286166666666667e-06,
"loss": 0.5821,
"step": 46300
},
{
"epoch": 54.59,
"learning_rate": 2.2695000000000005e-06,
"loss": 0.5623,
"step": 46400
},
{
"epoch": 54.71,
"learning_rate": 2.2528333333333337e-06,
"loss": 0.5477,
"step": 46500
},
{
"epoch": 54.82,
"learning_rate": 2.236166666666667e-06,
"loss": 0.5685,
"step": 46600
},
{
"epoch": 54.94,
"learning_rate": 2.2195e-06,
"loss": 0.566,
"step": 46700
},
{
"epoch": 55.06,
"learning_rate": 2.2028333333333333e-06,
"loss": 0.5954,
"step": 46800
},
{
"epoch": 55.18,
"learning_rate": 2.1861666666666665e-06,
"loss": 0.5681,
"step": 46900
},
{
"epoch": 55.29,
"learning_rate": 2.1695e-06,
"loss": 0.5613,
"step": 47000
},
{
"epoch": 55.41,
"learning_rate": 2.1528333333333334e-06,
"loss": 0.6032,
"step": 47100
},
{
"epoch": 55.53,
"learning_rate": 2.136166666666667e-06,
"loss": 0.574,
"step": 47200
},
{
"epoch": 55.65,
"learning_rate": 2.1195e-06,
"loss": 0.576,
"step": 47300
},
{
"epoch": 55.76,
"learning_rate": 2.1028333333333334e-06,
"loss": 0.5908,
"step": 47400
},
{
"epoch": 55.88,
"learning_rate": 2.086166666666667e-06,
"loss": 0.5963,
"step": 47500
},
{
"epoch": 56.0,
"learning_rate": 2.0695000000000003e-06,
"loss": 0.5514,
"step": 47600
},
{
"epoch": 56.12,
"learning_rate": 2.0528333333333335e-06,
"loss": 0.5786,
"step": 47700
},
{
"epoch": 56.24,
"learning_rate": 2.0361666666666667e-06,
"loss": 0.5802,
"step": 47800
},
{
"epoch": 56.35,
"learning_rate": 2.0195e-06,
"loss": 0.5713,
"step": 47900
},
{
"epoch": 56.47,
"learning_rate": 2.0028333333333335e-06,
"loss": 0.5573,
"step": 48000
},
{
"epoch": 56.59,
"learning_rate": 1.9861666666666667e-06,
"loss": 0.5811,
"step": 48100
},
{
"epoch": 56.71,
"learning_rate": 1.9695e-06,
"loss": 0.581,
"step": 48200
},
{
"epoch": 56.82,
"learning_rate": 1.953e-06,
"loss": 0.5859,
"step": 48300
},
{
"epoch": 56.94,
"learning_rate": 1.9363333333333334e-06,
"loss": 0.5347,
"step": 48400
},
{
"epoch": 57.06,
"learning_rate": 1.919666666666667e-06,
"loss": 0.5601,
"step": 48500
},
{
"epoch": 57.18,
"learning_rate": 1.903e-06,
"loss": 0.5458,
"step": 48600
},
{
"epoch": 57.29,
"learning_rate": 1.8863333333333332e-06,
"loss": 0.5625,
"step": 48700
},
{
"epoch": 57.41,
"learning_rate": 1.8696666666666669e-06,
"loss": 0.5777,
"step": 48800
},
{
"epoch": 57.53,
"learning_rate": 1.853e-06,
"loss": 0.5575,
"step": 48900
},
{
"epoch": 57.65,
"learning_rate": 1.8363333333333335e-06,
"loss": 0.5938,
"step": 49000
},
{
"epoch": 57.76,
"learning_rate": 1.8196666666666667e-06,
"loss": 0.538,
"step": 49100
},
{
"epoch": 57.88,
"learning_rate": 1.803e-06,
"loss": 0.5787,
"step": 49200
},
{
"epoch": 58.0,
"learning_rate": 1.7863333333333336e-06,
"loss": 0.57,
"step": 49300
},
{
"epoch": 58.12,
"learning_rate": 1.7696666666666668e-06,
"loss": 0.5726,
"step": 49400
},
{
"epoch": 58.24,
"learning_rate": 1.7530000000000002e-06,
"loss": 0.5859,
"step": 49500
},
{
"epoch": 58.35,
"learning_rate": 1.7363333333333334e-06,
"loss": 0.5675,
"step": 49600
},
{
"epoch": 58.47,
"learning_rate": 1.7196666666666666e-06,
"loss": 0.5726,
"step": 49700
},
{
"epoch": 58.59,
"learning_rate": 1.7030000000000003e-06,
"loss": 0.5534,
"step": 49800
},
{
"epoch": 58.71,
"learning_rate": 1.6863333333333335e-06,
"loss": 0.5703,
"step": 49900
},
{
"epoch": 58.82,
"learning_rate": 1.6696666666666669e-06,
"loss": 0.5618,
"step": 50000
},
{
"epoch": 58.82,
"eval_cer": 0.09924019227787254,
"eval_loss": 0.4731317162513733,
"eval_runtime": 8.1161,
"eval_samples_per_second": 36.964,
"eval_steps_per_second": 18.482,
"eval_wer": 0.33589743589743587,
"step": 50000
},
{
"epoch": 58.94,
"learning_rate": 1.653e-06,
"loss": 0.5616,
"step": 50100
},
{
"epoch": 59.06,
"learning_rate": 1.6363333333333333e-06,
"loss": 0.5285,
"step": 50200
},
{
"epoch": 59.18,
"learning_rate": 1.619666666666667e-06,
"loss": 0.5561,
"step": 50300
},
{
"epoch": 59.29,
"learning_rate": 1.6030000000000002e-06,
"loss": 0.5872,
"step": 50400
},
{
"epoch": 59.41,
"learning_rate": 1.5863333333333334e-06,
"loss": 0.559,
"step": 50500
},
{
"epoch": 59.53,
"learning_rate": 1.5696666666666668e-06,
"loss": 0.5518,
"step": 50600
},
{
"epoch": 59.65,
"learning_rate": 1.553e-06,
"loss": 0.5641,
"step": 50700
},
{
"epoch": 59.76,
"learning_rate": 1.5363333333333336e-06,
"loss": 0.5567,
"step": 50800
},
{
"epoch": 59.88,
"learning_rate": 1.5196666666666668e-06,
"loss": 0.5475,
"step": 50900
},
{
"epoch": 60.0,
"learning_rate": 1.503e-06,
"loss": 0.5741,
"step": 51000
},
{
"epoch": 60.12,
"learning_rate": 1.4863333333333335e-06,
"loss": 0.5537,
"step": 51100
},
{
"epoch": 60.24,
"learning_rate": 1.4696666666666667e-06,
"loss": 0.5887,
"step": 51200
},
{
"epoch": 60.35,
"learning_rate": 1.4530000000000003e-06,
"loss": 0.5697,
"step": 51300
},
{
"epoch": 60.47,
"learning_rate": 1.4363333333333335e-06,
"loss": 0.5254,
"step": 51400
},
{
"epoch": 60.59,
"learning_rate": 1.4196666666666667e-06,
"loss": 0.5531,
"step": 51500
},
{
"epoch": 60.71,
"learning_rate": 1.4030000000000002e-06,
"loss": 0.5752,
"step": 51600
},
{
"epoch": 60.82,
"learning_rate": 1.3865e-06,
"loss": 0.5885,
"step": 51700
},
{
"epoch": 60.94,
"learning_rate": 1.3698333333333336e-06,
"loss": 0.5348,
"step": 51800
},
{
"epoch": 61.06,
"learning_rate": 1.3531666666666668e-06,
"loss": 0.5477,
"step": 51900
},
{
"epoch": 61.18,
"learning_rate": 1.3365e-06,
"loss": 0.5655,
"step": 52000
},
{
"epoch": 61.29,
"learning_rate": 1.3198333333333335e-06,
"loss": 0.5846,
"step": 52100
},
{
"epoch": 61.41,
"learning_rate": 1.3031666666666667e-06,
"loss": 0.5345,
"step": 52200
},
{
"epoch": 61.53,
"learning_rate": 1.2864999999999999e-06,
"loss": 0.5482,
"step": 52300
},
{
"epoch": 61.65,
"learning_rate": 1.2698333333333335e-06,
"loss": 0.5474,
"step": 52400
},
{
"epoch": 61.76,
"learning_rate": 1.2531666666666667e-06,
"loss": 0.5829,
"step": 52500
},
{
"epoch": 61.88,
"learning_rate": 1.2365000000000001e-06,
"loss": 0.5268,
"step": 52600
},
{
"epoch": 62.0,
"learning_rate": 1.2198333333333334e-06,
"loss": 0.5452,
"step": 52700
},
{
"epoch": 62.12,
"learning_rate": 1.2031666666666668e-06,
"loss": 0.5627,
"step": 52800
},
{
"epoch": 62.24,
"learning_rate": 1.1865000000000002e-06,
"loss": 0.5335,
"step": 52900
},
{
"epoch": 62.35,
"learning_rate": 1.1698333333333334e-06,
"loss": 0.586,
"step": 53000
},
{
"epoch": 62.47,
"learning_rate": 1.1531666666666668e-06,
"loss": 0.533,
"step": 53100
},
{
"epoch": 62.59,
"learning_rate": 1.1365e-06,
"loss": 0.5268,
"step": 53200
},
{
"epoch": 62.71,
"learning_rate": 1.1198333333333335e-06,
"loss": 0.5653,
"step": 53300
},
{
"epoch": 62.82,
"learning_rate": 1.1031666666666667e-06,
"loss": 0.5776,
"step": 53400
},
{
"epoch": 62.94,
"learning_rate": 1.0865e-06,
"loss": 0.5267,
"step": 53500
},
{
"epoch": 63.06,
"learning_rate": 1.0698333333333335e-06,
"loss": 0.5701,
"step": 53600
},
{
"epoch": 63.18,
"learning_rate": 1.0531666666666667e-06,
"loss": 0.529,
"step": 53700
},
{
"epoch": 63.29,
"learning_rate": 1.0365000000000002e-06,
"loss": 0.5636,
"step": 53800
},
{
"epoch": 63.41,
"learning_rate": 1.0198333333333334e-06,
"loss": 0.5399,
"step": 53900
},
{
"epoch": 63.53,
"learning_rate": 1.0031666666666668e-06,
"loss": 0.5481,
"step": 54000
},
{
"epoch": 63.65,
"learning_rate": 9.865e-07,
"loss": 0.5492,
"step": 54100
},
{
"epoch": 63.76,
"learning_rate": 9.698333333333334e-07,
"loss": 0.576,
"step": 54200
},
{
"epoch": 63.88,
"learning_rate": 9.531666666666666e-07,
"loss": 0.5833,
"step": 54300
},
{
"epoch": 64.0,
"learning_rate": 9.365000000000001e-07,
"loss": 0.5444,
"step": 54400
},
{
"epoch": 64.12,
"learning_rate": 9.198333333333334e-07,
"loss": 0.5716,
"step": 54500
},
{
"epoch": 64.24,
"learning_rate": 9.031666666666668e-07,
"loss": 0.5418,
"step": 54600
},
{
"epoch": 64.35,
"learning_rate": 8.865000000000001e-07,
"loss": 0.5329,
"step": 54700
},
{
"epoch": 64.47,
"learning_rate": 8.698333333333333e-07,
"loss": 0.5762,
"step": 54800
},
{
"epoch": 64.59,
"learning_rate": 8.531666666666667e-07,
"loss": 0.5156,
"step": 54900
},
{
"epoch": 64.71,
"learning_rate": 8.366666666666668e-07,
"loss": 0.5502,
"step": 55000
},
{
"epoch": 64.82,
"learning_rate": 8.200000000000001e-07,
"loss": 0.5556,
"step": 55100
},
{
"epoch": 64.94,
"learning_rate": 8.033333333333335e-07,
"loss": 0.5585,
"step": 55200
},
{
"epoch": 65.06,
"learning_rate": 7.866666666666667e-07,
"loss": 0.5561,
"step": 55300
},
{
"epoch": 65.18,
"learning_rate": 7.7e-07,
"loss": 0.5365,
"step": 55400
},
{
"epoch": 65.29,
"learning_rate": 7.533333333333335e-07,
"loss": 0.5324,
"step": 55500
},
{
"epoch": 65.41,
"learning_rate": 7.366666666666668e-07,
"loss": 0.5634,
"step": 55600
},
{
"epoch": 65.53,
"learning_rate": 7.2e-07,
"loss": 0.5632,
"step": 55700
},
{
"epoch": 65.65,
"learning_rate": 7.033333333333334e-07,
"loss": 0.5343,
"step": 55800
},
{
"epoch": 65.76,
"learning_rate": 6.866666666666667e-07,
"loss": 0.5743,
"step": 55900
},
{
"epoch": 65.88,
"learning_rate": 6.7e-07,
"loss": 0.5488,
"step": 56000
},
{
"epoch": 66.0,
"learning_rate": 6.533333333333334e-07,
"loss": 0.5572,
"step": 56100
},
{
"epoch": 66.12,
"learning_rate": 6.366666666666667e-07,
"loss": 0.5544,
"step": 56200
},
{
"epoch": 66.24,
"learning_rate": 6.200000000000001e-07,
"loss": 0.5544,
"step": 56300
},
{
"epoch": 66.35,
"learning_rate": 6.033333333333334e-07,
"loss": 0.5441,
"step": 56400
},
{
"epoch": 66.47,
"learning_rate": 5.866666666666667e-07,
"loss": 0.546,
"step": 56500
},
{
"epoch": 66.59,
"learning_rate": 5.7e-07,
"loss": 0.5338,
"step": 56600
},
{
"epoch": 66.71,
"learning_rate": 5.533333333333334e-07,
"loss": 0.5499,
"step": 56700
},
{
"epoch": 66.82,
"learning_rate": 5.366666666666667e-07,
"loss": 0.5315,
"step": 56800
},
{
"epoch": 66.94,
"learning_rate": 5.2e-07,
"loss": 0.5681,
"step": 56900
},
{
"epoch": 67.06,
"learning_rate": 5.033333333333334e-07,
"loss": 0.5607,
"step": 57000
},
{
"epoch": 67.18,
"learning_rate": 4.866666666666666e-07,
"loss": 0.5514,
"step": 57100
},
{
"epoch": 67.29,
"learning_rate": 4.7000000000000005e-07,
"loss": 0.5569,
"step": 57200
},
{
"epoch": 67.41,
"learning_rate": 4.533333333333334e-07,
"loss": 0.5119,
"step": 57300
},
{
"epoch": 67.53,
"learning_rate": 4.366666666666667e-07,
"loss": 0.5858,
"step": 57400
},
{
"epoch": 67.65,
"learning_rate": 4.2000000000000006e-07,
"loss": 0.5448,
"step": 57500
},
{
"epoch": 67.76,
"learning_rate": 4.0333333333333337e-07,
"loss": 0.5451,
"step": 57600
},
{
"epoch": 67.88,
"learning_rate": 3.8666666666666674e-07,
"loss": 0.5356,
"step": 57700
},
{
"epoch": 68.0,
"learning_rate": 3.7e-07,
"loss": 0.5526,
"step": 57800
},
{
"epoch": 68.12,
"learning_rate": 3.533333333333334e-07,
"loss": 0.5392,
"step": 57900
},
{
"epoch": 68.24,
"learning_rate": 3.366666666666667e-07,
"loss": 0.5402,
"step": 58000
},
{
"epoch": 68.35,
"learning_rate": 3.2e-07,
"loss": 0.5597,
"step": 58100
},
{
"epoch": 68.47,
"learning_rate": 3.033333333333334e-07,
"loss": 0.5426,
"step": 58200
},
{
"epoch": 68.59,
"learning_rate": 2.866666666666667e-07,
"loss": 0.5742,
"step": 58300
},
{
"epoch": 68.71,
"learning_rate": 2.701666666666667e-07,
"loss": 0.5628,
"step": 58400
},
{
"epoch": 68.82,
"learning_rate": 2.5350000000000004e-07,
"loss": 0.5382,
"step": 58500
},
{
"epoch": 68.94,
"learning_rate": 2.3683333333333336e-07,
"loss": 0.5231,
"step": 58600
},
{
"epoch": 69.06,
"learning_rate": 2.201666666666667e-07,
"loss": 0.546,
"step": 58700
},
{
"epoch": 69.18,
"learning_rate": 2.0350000000000002e-07,
"loss": 0.5379,
"step": 58800
},
{
"epoch": 69.29,
"learning_rate": 1.8683333333333336e-07,
"loss": 0.5705,
"step": 58900
},
{
"epoch": 69.41,
"learning_rate": 1.7016666666666668e-07,
"loss": 0.5235,
"step": 59000
},
{
"epoch": 69.53,
"learning_rate": 1.5350000000000002e-07,
"loss": 0.5527,
"step": 59100
},
{
"epoch": 69.65,
"learning_rate": 1.3683333333333336e-07,
"loss": 0.5316,
"step": 59200
},
{
"epoch": 69.76,
"learning_rate": 1.2016666666666668e-07,
"loss": 0.5711,
"step": 59300
},
{
"epoch": 69.88,
"learning_rate": 1.0350000000000001e-07,
"loss": 0.5478,
"step": 59400
},
{
"epoch": 70.0,
"learning_rate": 8.7e-08,
"loss": 0.5449,
"step": 59500
},
{
"epoch": 70.12,
"learning_rate": 7.033333333333334e-08,
"loss": 0.5585,
"step": 59600
},
{
"epoch": 70.24,
"learning_rate": 5.3666666666666664e-08,
"loss": 0.5654,
"step": 59700
},
{
"epoch": 70.35,
"learning_rate": 3.700000000000001e-08,
"loss": 0.5099,
"step": 59800
},
{
"epoch": 70.47,
"learning_rate": 2.0333333333333333e-08,
"loss": 0.5503,
"step": 59900
},
{
"epoch": 70.59,
"learning_rate": 3.666666666666667e-09,
"loss": 0.5519,
"step": 60000
},
{
"epoch": 70.59,
"eval_cer": 0.09830981547526749,
"eval_loss": 0.4715472459793091,
"eval_runtime": 7.8706,
"eval_samples_per_second": 38.117,
"eval_steps_per_second": 19.058,
"eval_wer": 0.32863247863247863,
"step": 60000
}
],
"max_steps": 60000,
"num_train_epochs": 71,
"total_flos": 5.154044369018537e+19,
"trial_name": null,
"trial_params": null
}