{ "best_metric": 0.06275933235883713, "best_model_checkpoint": "intent_classification_model/checkpoint-152", "epoch": 16.0, "eval_steps": 500, "global_step": 1216, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.9867549668874173, "eval_loss": 0.20886486768722534, "eval_runtime": 0.1475, "eval_samples_per_second": 2048.099, "eval_steps_per_second": 128.854, "step": 76 }, { "epoch": 2.0, "eval_accuracy": 0.9834437086092715, "eval_loss": 0.06275933235883713, "eval_runtime": 0.1586, "eval_samples_per_second": 1904.103, "eval_steps_per_second": 119.795, "step": 152 }, { "epoch": 3.0, "eval_accuracy": 0.9867549668874173, "eval_loss": 0.06509935110807419, "eval_runtime": 0.1445, "eval_samples_per_second": 2090.586, "eval_steps_per_second": 131.527, "step": 228 }, { "epoch": 4.0, "eval_accuracy": 0.9768211920529801, "eval_loss": 0.08112386614084244, "eval_runtime": 0.1335, "eval_samples_per_second": 2262.833, "eval_steps_per_second": 142.364, "step": 304 }, { "epoch": 5.0, "eval_accuracy": 0.9701986754966887, "eval_loss": 0.11257749050855637, "eval_runtime": 0.134, "eval_samples_per_second": 2253.71, "eval_steps_per_second": 141.79, "step": 380 }, { "epoch": 6.0, "eval_accuracy": 0.9735099337748344, "eval_loss": 0.11174333095550537, "eval_runtime": 0.1339, "eval_samples_per_second": 2255.512, "eval_steps_per_second": 141.903, "step": 456 }, { "epoch": 6.58, "learning_rate": 1.1776315789473684e-05, "loss": 0.1883, "step": 500 }, { "epoch": 7.0, "eval_accuracy": 0.9768211920529801, "eval_loss": 0.10020075738430023, "eval_runtime": 0.145, "eval_samples_per_second": 2083.04, "eval_steps_per_second": 131.052, "step": 532 }, { "epoch": 8.0, "eval_accuracy": 0.9735099337748344, "eval_loss": 0.116866335272789, "eval_runtime": 0.1348, "eval_samples_per_second": 2240.912, "eval_steps_per_second": 140.985, "step": 608 }, { "epoch": 9.0, "eval_accuracy": 0.9701986754966887, "eval_loss": 0.14152054488658905, "eval_runtime": 0.1308, "eval_samples_per_second": 2309.736, "eval_steps_per_second": 145.314, "step": 684 }, { "epoch": 10.0, "eval_accuracy": 0.9735099337748344, "eval_loss": 0.1344088315963745, "eval_runtime": 0.1195, "eval_samples_per_second": 2526.256, "eval_steps_per_second": 158.937, "step": 760 }, { "epoch": 11.0, "eval_accuracy": 0.9735099337748344, "eval_loss": 0.13409321010112762, "eval_runtime": 0.1399, "eval_samples_per_second": 2159.267, "eval_steps_per_second": 135.848, "step": 836 }, { "epoch": 12.0, "eval_accuracy": 0.9735099337748344, "eval_loss": 0.12705937027931213, "eval_runtime": 0.1366, "eval_samples_per_second": 2210.321, "eval_steps_per_second": 139.06, "step": 912 }, { "epoch": 13.0, "eval_accuracy": 0.9735099337748344, "eval_loss": 0.13874845206737518, "eval_runtime": 0.1374, "eval_samples_per_second": 2197.254, "eval_steps_per_second": 138.238, "step": 988 }, { "epoch": 13.16, "learning_rate": 3.5526315789473687e-06, "loss": 0.018, "step": 1000 }, { "epoch": 14.0, "eval_accuracy": 0.9735099337748344, "eval_loss": 0.13716736435890198, "eval_runtime": 0.1193, "eval_samples_per_second": 2530.546, "eval_steps_per_second": 159.207, "step": 1064 }, { "epoch": 15.0, "eval_accuracy": 0.9735099337748344, "eval_loss": 0.13588877022266388, "eval_runtime": 0.1396, "eval_samples_per_second": 2163.789, "eval_steps_per_second": 136.132, "step": 1140 }, { "epoch": 16.0, "eval_accuracy": 0.9735099337748344, "eval_loss": 0.13579562306404114, "eval_runtime": 0.1288, "eval_samples_per_second": 2345.226, "eval_steps_per_second": 147.547, "step": 1216 } ], "logging_steps": 500, "max_steps": 1216, "num_train_epochs": 16, "save_steps": 500, "total_flos": 62384098266840.0, "trial_name": null, "trial_params": null }