{ "best_metric": 59.382051635096076, "best_model_checkpoint": "/data/jcanete/all_results/sqac/albeto_tiny/epochs_4_bs_16_lr_5e-5/checkpoint-2400", "epoch": 4.0, "global_step": 4152, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.19, "eval_exact_match": 12.339055793991417, "eval_f1": 28.93103280159431, "step": 200 }, { "epoch": 0.39, "eval_exact_match": 23.92703862660944, "eval_f1": 41.67915333843358, "step": 400 }, { "epoch": 0.48, "learning_rate": 4.4026974951830445e-05, "loss": 3.1377, "step": 500 }, { "epoch": 0.58, "eval_exact_match": 31.86695278969957, "eval_f1": 51.18317520944259, "step": 600 }, { "epoch": 0.77, "eval_exact_match": 34.871244635193136, "eval_f1": 53.9432519365253, "step": 800 }, { "epoch": 0.96, "learning_rate": 3.800578034682081e-05, "loss": 2.0078, "step": 1000 }, { "epoch": 0.96, "eval_exact_match": 35.51502145922747, "eval_f1": 55.221685158386705, "step": 1000 }, { "epoch": 1.16, "eval_exact_match": 36.85622317596567, "eval_f1": 55.20708770919938, "step": 1200 }, { "epoch": 1.35, "eval_exact_match": 37.98283261802575, "eval_f1": 56.614251341537866, "step": 1400 }, { "epoch": 1.45, "learning_rate": 3.198458574181118e-05, "loss": 1.4374, "step": 1500 }, { "epoch": 1.54, "eval_exact_match": 39.002145922746784, "eval_f1": 57.702126636307476, "step": 1600 }, { "epoch": 1.73, "eval_exact_match": 39.64592274678112, "eval_f1": 58.69230555304524, "step": 1800 }, { "epoch": 1.93, "learning_rate": 2.596339113680154e-05, "loss": 1.3597, "step": 2000 }, { "epoch": 1.93, "eval_exact_match": 39.64592274678112, "eval_f1": 58.05721827009323, "step": 2000 }, { "epoch": 2.12, "eval_exact_match": 39.27038626609442, "eval_f1": 57.648146496721296, "step": 2200 }, { "epoch": 2.31, "eval_exact_match": 40.50429184549356, "eval_f1": 59.382051635096076, "step": 2400 }, { "epoch": 2.41, "learning_rate": 1.995423892100193e-05, "loss": 0.9536, "step": 2500 }, { "epoch": 2.5, "eval_exact_match": 40.71888412017167, "eval_f1": 59.060573449175955, "step": 2600 }, { "epoch": 2.7, "eval_exact_match": 39.8068669527897, "eval_f1": 58.80449299317162, "step": 2800 }, { "epoch": 2.89, "learning_rate": 1.3933044315992294e-05, "loss": 0.8884, "step": 3000 }, { "epoch": 2.89, "eval_exact_match": 40.772532188841204, "eval_f1": 58.85814483853365, "step": 3000 }, { "epoch": 3.08, "eval_exact_match": 40.02145922746781, "eval_f1": 59.12527092459649, "step": 3200 }, { "epoch": 3.28, "eval_exact_match": 40.933476394849784, "eval_f1": 59.19992976262888, "step": 3400 }, { "epoch": 3.37, "learning_rate": 7.91184971098266e-06, "loss": 0.6567, "step": 3500 }, { "epoch": 3.47, "eval_exact_match": 40.933476394849784, "eval_f1": 59.280000618875235, "step": 3600 }, { "epoch": 3.66, "eval_exact_match": 40.50429184549356, "eval_f1": 58.81358724565813, "step": 3800 }, { "epoch": 3.85, "learning_rate": 1.890655105973025e-06, "loss": 0.5809, "step": 4000 }, { "epoch": 3.85, "eval_exact_match": 40.50429184549356, "eval_f1": 58.87104735095327, "step": 4000 }, { "epoch": 4.0, "step": 4152, "total_flos": 241925105088000.0, "train_loss": 1.34779805898207, "train_runtime": 436.6525, "train_samples_per_second": 152.048, "train_steps_per_second": 9.509 } ], "max_steps": 4152, "num_train_epochs": 4, "total_flos": 241925105088000.0, "trial_name": null, "trial_params": null }