|
{ |
|
"best_metric": 0.8778576539129843, |
|
"best_model_checkpoint": "./fields_classification/checkpoint-4610", |
|
"epoch": 9.98916576381365, |
|
"eval_steps": 500, |
|
"global_step": 4610, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 3e-05, |
|
"loss": 0.1747, |
|
"step": 461 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.38636055803873764, |
|
"eval_f1": 0.5336014591030258, |
|
"eval_loss": 0.08355075865983963, |
|
"eval_precision": 0.8621731902674928, |
|
"eval_recall": 0.38636055803873764, |
|
"eval_roc_auc": 0.6919450088040092, |
|
"eval_runtime": 116.991, |
|
"eval_samples_per_second": 126.215, |
|
"eval_steps_per_second": 1.975, |
|
"step": 461 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0684, |
|
"step": 923 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.769944467018827, |
|
"eval_f1": 0.8073713737883038, |
|
"eval_loss": 0.05430687218904495, |
|
"eval_precision": 0.8486228260058222, |
|
"eval_recall": 0.769944467018827, |
|
"eval_roc_auc": 0.8822253826357849, |
|
"eval_runtime": 117.0652, |
|
"eval_samples_per_second": 126.135, |
|
"eval_steps_per_second": 1.973, |
|
"step": 923 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0498, |
|
"step": 1384 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.8040769334958688, |
|
"eval_f1": 0.8276895206243033, |
|
"eval_loss": 0.04519835114479065, |
|
"eval_precision": 0.8522743578705697, |
|
"eval_recall": 0.8044832723825004, |
|
"eval_roc_auc": 0.8994527969660029, |
|
"eval_runtime": 116.7477, |
|
"eval_samples_per_second": 126.478, |
|
"eval_steps_per_second": 1.979, |
|
"step": 1384 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0407, |
|
"step": 1846 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.8289990518759311, |
|
"eval_f1": 0.8456551724137932, |
|
"eval_loss": 0.039659492671489716, |
|
"eval_precision": 0.8614584796965014, |
|
"eval_recall": 0.8304212379791412, |
|
"eval_roc_auc": 0.9125396180414465, |
|
"eval_runtime": 117.5369, |
|
"eval_samples_per_second": 125.629, |
|
"eval_steps_per_second": 1.965, |
|
"step": 1846 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 3e-05, |
|
"loss": 0.035, |
|
"step": 2307 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.8405119869971557, |
|
"eval_f1": 0.8543429844097995, |
|
"eval_loss": 0.03649652376770973, |
|
"eval_precision": 0.8646230667868784, |
|
"eval_recall": 0.8443044832723825, |
|
"eval_roc_auc": 0.919508329947176, |
|
"eval_runtime": 117.0597, |
|
"eval_samples_per_second": 126.141, |
|
"eval_steps_per_second": 1.973, |
|
"step": 2307 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0303, |
|
"step": 2769 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.8518217526750643, |
|
"eval_f1": 0.8653773746363169, |
|
"eval_loss": 0.0338783822953701, |
|
"eval_precision": 0.8748702332341338, |
|
"eval_recall": 0.8560883109846946, |
|
"eval_roc_auc": 0.9255952864689151, |
|
"eval_runtime": 116.7614, |
|
"eval_samples_per_second": 126.463, |
|
"eval_steps_per_second": 1.978, |
|
"step": 2769 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0268, |
|
"step": 3230 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.8566300961668698, |
|
"eval_f1": 0.8697338868849113, |
|
"eval_loss": 0.03237078711390495, |
|
"eval_precision": 0.8740766073871409, |
|
"eval_recall": 0.865434105377218, |
|
"eval_roc_auc": 0.9302234863876474, |
|
"eval_runtime": 117.0283, |
|
"eval_samples_per_second": 126.175, |
|
"eval_steps_per_second": 1.974, |
|
"step": 3230 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0237, |
|
"step": 3692 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.8580522822700799, |
|
"eval_f1": 0.8707677634716261, |
|
"eval_loss": 0.03161860257387161, |
|
"eval_precision": 0.8759594298245614, |
|
"eval_recall": 0.8656372748205337, |
|
"eval_roc_auc": 0.9303670594609237, |
|
"eval_runtime": 116.6155, |
|
"eval_samples_per_second": 126.621, |
|
"eval_steps_per_second": 1.981, |
|
"step": 3692 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0211, |
|
"step": 4153 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.8651632127861303, |
|
"eval_f1": 0.8777002891648241, |
|
"eval_loss": 0.030687741935253143, |
|
"eval_precision": 0.8818101032196323, |
|
"eval_recall": 0.8736286062576188, |
|
"eval_roc_auc": 0.9344724366788568, |
|
"eval_runtime": 116.7518, |
|
"eval_samples_per_second": 126.473, |
|
"eval_steps_per_second": 1.979, |
|
"step": 4153 |
|
}, |
|
{ |
|
"epoch": 9.99, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0188, |
|
"step": 4610 |
|
}, |
|
{ |
|
"epoch": 9.99, |
|
"eval_accuracy": 0.8656372748205337, |
|
"eval_f1": 0.8778576539129843, |
|
"eval_loss": 0.03020327538251877, |
|
"eval_precision": 0.8833047651696949, |
|
"eval_recall": 0.8724773127454964, |
|
"eval_roc_auc": 0.9339333604225925, |
|
"eval_runtime": 117.271, |
|
"eval_samples_per_second": 125.914, |
|
"eval_steps_per_second": 1.97, |
|
"step": 4610 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 4610, |
|
"num_train_epochs": 10, |
|
"save_steps": 500, |
|
"total_flos": 1.5527107913529754e+17, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|