{ "best_metric": null, "best_model_checkpoint": null, "epoch": 3.671562082777036, "global_step": 5500, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.33, "learning_rate": 4.9800000000000004e-05, "loss": 1.0211, "step": 500 }, { "epoch": 0.33, "eval_loss": 0.5140587091445923, "eval_runtime": 112.0215, "eval_samples_per_second": 13.372, "eval_steps_per_second": 1.678, "eval_wer": 0.32459210916641945, "step": 500 }, { "epoch": 0.67, "learning_rate": 9.98e-05, "loss": 0.7098, "step": 1000 }, { "epoch": 0.67, "eval_loss": 0.41307497024536133, "eval_runtime": 114.0249, "eval_samples_per_second": 13.137, "eval_steps_per_second": 1.649, "eval_wer": 0.2981311183625037, "step": 1000 }, { "epoch": 1.0, "learning_rate": 9.002403846153846e-05, "loss": 0.6115, "step": 1500 }, { "epoch": 1.0, "eval_loss": 0.37654194235801697, "eval_runtime": 115.4275, "eval_samples_per_second": 12.978, "eval_steps_per_second": 1.629, "eval_wer": 0.2660338178582023, "step": 1500 }, { "epoch": 1.34, "learning_rate": 8.000801282051282e-05, "loss": 0.5112, "step": 2000 }, { "epoch": 1.34, "eval_loss": 0.3202863931655884, "eval_runtime": 113.0512, "eval_samples_per_second": 13.251, "eval_steps_per_second": 1.663, "eval_wer": 0.24526846633046573, "step": 2000 }, { "epoch": 1.67, "learning_rate": 7.001201923076923e-05, "loss": 0.4763, "step": 2500 }, { "epoch": 1.67, "eval_loss": 0.29251885414123535, "eval_runtime": 113.4478, "eval_samples_per_second": 13.204, "eval_steps_per_second": 1.657, "eval_wer": 0.23500444971818452, "step": 2500 }, { "epoch": 2.0, "learning_rate": 5.999599358974359e-05, "loss": 0.4386, "step": 3000 }, { "epoch": 2.0, "eval_loss": 0.2935383915901184, "eval_runtime": 112.4069, "eval_samples_per_second": 13.327, "eval_steps_per_second": 1.672, "eval_wer": 0.22284188668051022, "step": 3000 }, { "epoch": 2.34, "learning_rate": 4.997996794871795e-05, "loss": 0.3802, "step": 3500 }, { "epoch": 2.34, "eval_loss": 0.2789919078350067, "eval_runtime": 111.4408, "eval_samples_per_second": 13.442, "eval_steps_per_second": 1.687, "eval_wer": 0.21388312073568674, "step": 3500 }, { "epoch": 2.67, "learning_rate": 3.998397435897436e-05, "loss": 0.3727, "step": 4000 }, { "epoch": 2.67, "eval_loss": 0.26136162877082825, "eval_runtime": 111.228, "eval_samples_per_second": 13.468, "eval_steps_per_second": 1.69, "eval_wer": 0.21050133491545536, "step": 4000 }, { "epoch": 3.0, "learning_rate": 2.9967948717948717e-05, "loss": 0.3747, "step": 4500 }, { "epoch": 3.0, "eval_loss": 0.24868248403072357, "eval_runtime": 112.653, "eval_samples_per_second": 13.297, "eval_steps_per_second": 1.669, "eval_wer": 0.20539899139721152, "step": 4500 }, { "epoch": 3.34, "learning_rate": 1.9951923076923078e-05, "loss": 0.3192, "step": 5000 }, { "epoch": 3.34, "eval_loss": 0.2479962557554245, "eval_runtime": 117.7279, "eval_samples_per_second": 12.724, "eval_steps_per_second": 1.597, "eval_wer": 0.20166122812221893, "step": 5000 }, { "epoch": 3.67, "learning_rate": 9.935897435897435e-06, "loss": 0.2852, "step": 5500 }, { "epoch": 3.67, "eval_loss": 0.24946188926696777, "eval_runtime": 116.0708, "eval_samples_per_second": 12.906, "eval_steps_per_second": 1.62, "eval_wer": 0.20005932957579353, "step": 5500 } ], "max_steps": 5992, "num_train_epochs": 4, "total_flos": 1.4196823993181012e+18, "trial_name": null, "trial_params": null }