{ "best_metric": 79.90477476395145, "best_model_checkpoint": "/data/jcanete/all_results/sqac/albeto_base/epochs_3_bs_16_lr_5e-5/checkpoint-2000", "epoch": 3.0, "global_step": 3114, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.19, "eval_exact_match": 40.55793991416309, "eval_f1": 61.9475026058651, "step": 200 }, { "epoch": 0.39, "eval_exact_match": 50.16094420600859, "eval_f1": 70.94487746222757, "step": 400 }, { "epoch": 0.48, "learning_rate": 4.206807964033398e-05, "loss": 1.908, "step": 500 }, { "epoch": 0.58, "eval_exact_match": 54.77467811158798, "eval_f1": 73.11200761877414, "step": 600 }, { "epoch": 0.77, "eval_exact_match": 55.90128755364807, "eval_f1": 74.35378026715777, "step": 800 }, { "epoch": 0.96, "learning_rate": 3.405587668593449e-05, "loss": 1.1479, "step": 1000 }, { "epoch": 0.96, "eval_exact_match": 58.74463519313305, "eval_f1": 77.15822408085789, "step": 1000 }, { "epoch": 1.16, "eval_exact_match": 58.90557939914163, "eval_f1": 76.90716161104929, "step": 1200 }, { "epoch": 1.35, "eval_exact_match": 59.49570815450644, "eval_f1": 77.54387552767798, "step": 1400 }, { "epoch": 1.45, "learning_rate": 2.6027617212588313e-05, "loss": 0.7268, "step": 1500 }, { "epoch": 1.54, "eval_exact_match": 59.227467811158796, "eval_f1": 77.8200127931914, "step": 1600 }, { "epoch": 1.73, "eval_exact_match": 61.31974248927039, "eval_f1": 78.96026149786353, "step": 1800 }, { "epoch": 1.93, "learning_rate": 1.7999357739242135e-05, "loss": 0.683, "step": 2000 }, { "epoch": 1.93, "eval_exact_match": 62.71459227467811, "eval_f1": 79.90477476395145, "step": 2000 }, { "epoch": 2.12, "eval_exact_match": 62.01716738197425, "eval_f1": 79.35780895037563, "step": 2200 }, { "epoch": 2.31, "eval_exact_match": 62.23175965665236, "eval_f1": 79.16073100037653, "step": 2400 }, { "epoch": 2.41, "learning_rate": 9.971098265895954e-06, "loss": 0.4189, "step": 2500 }, { "epoch": 2.5, "eval_exact_match": 60.89055793991416, "eval_f1": 79.00549485950138, "step": 2600 }, { "epoch": 2.7, "eval_exact_match": 61.85622317596567, "eval_f1": 79.2496307825153, "step": 2800 }, { "epoch": 2.89, "learning_rate": 1.9428387925497756e-06, "loss": 0.3417, "step": 3000 }, { "epoch": 2.89, "eval_exact_match": 62.55364806866953, "eval_f1": 79.81438829072098, "step": 3000 }, { "epoch": 3.0, "step": 3114, "total_flos": 1074824219579904.0, "train_loss": 0.8525694306262732, "train_runtime": 946.0422, "train_samples_per_second": 52.634, "train_steps_per_second": 3.292 } ], "max_steps": 3114, "num_train_epochs": 3, "total_flos": 1074824219579904.0, "trial_name": null, "trial_params": null }