|
{ |
|
"best_metric": 0.8780487804878049, |
|
"best_model_checkpoint": "Cvt-finetuned-thyroid/checkpoint-33", |
|
"epoch": 30.0, |
|
"global_step": 90, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_f1": 0.19148936170212766, |
|
"eval_loss": 0.7407425045967102, |
|
"eval_runtime": 0.5779, |
|
"eval_samples_per_second": 173.027, |
|
"eval_steps_per_second": 6.921, |
|
"step": 3 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_f1": 0.3773584905660377, |
|
"eval_loss": 0.729247510433197, |
|
"eval_runtime": 0.5528, |
|
"eval_samples_per_second": 180.896, |
|
"eval_steps_per_second": 7.236, |
|
"step": 6 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_f1": 0.4786324786324786, |
|
"eval_loss": 0.7105527520179749, |
|
"eval_runtime": 0.558, |
|
"eval_samples_per_second": 179.203, |
|
"eval_steps_per_second": 7.168, |
|
"step": 9 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_f1": 0.6060606060606061, |
|
"eval_loss": 0.6890331506729126, |
|
"eval_runtime": 0.5504, |
|
"eval_samples_per_second": 181.671, |
|
"eval_steps_per_second": 7.267, |
|
"step": 12 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_f1": 0.7, |
|
"eval_loss": 0.6695859432220459, |
|
"eval_runtime": 0.5595, |
|
"eval_samples_per_second": 178.745, |
|
"eval_steps_per_second": 7.15, |
|
"step": 15 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_f1": 0.7761194029850746, |
|
"eval_loss": 0.6517141461372375, |
|
"eval_runtime": 0.5632, |
|
"eval_samples_per_second": 177.548, |
|
"eval_steps_per_second": 7.102, |
|
"step": 18 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_f1": 0.828125, |
|
"eval_loss": 0.6349117755889893, |
|
"eval_runtime": 0.5567, |
|
"eval_samples_per_second": 179.616, |
|
"eval_steps_per_second": 7.185, |
|
"step": 21 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_f1": 0.8503937007874015, |
|
"eval_loss": 0.618772029876709, |
|
"eval_runtime": 0.5546, |
|
"eval_samples_per_second": 180.325, |
|
"eval_steps_per_second": 7.213, |
|
"step": 24 |
|
}, |
|
{ |
|
"epoch": 8.33, |
|
"learning_rate": 8.024691358024692e-06, |
|
"loss": 0.634, |
|
"step": 25 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_f1": 0.8709677419354839, |
|
"eval_loss": 0.6039881706237793, |
|
"eval_runtime": 0.5519, |
|
"eval_samples_per_second": 181.185, |
|
"eval_steps_per_second": 7.247, |
|
"step": 27 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_f1": 0.8709677419354839, |
|
"eval_loss": 0.5912619829177856, |
|
"eval_runtime": 0.5573, |
|
"eval_samples_per_second": 179.441, |
|
"eval_steps_per_second": 7.178, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_f1": 0.8780487804878049, |
|
"eval_loss": 0.5805598497390747, |
|
"eval_runtime": 0.5574, |
|
"eval_samples_per_second": 179.394, |
|
"eval_steps_per_second": 7.176, |
|
"step": 33 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_f1": 0.8688524590163933, |
|
"eval_loss": 0.5723507404327393, |
|
"eval_runtime": 0.5544, |
|
"eval_samples_per_second": 180.362, |
|
"eval_steps_per_second": 7.214, |
|
"step": 36 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_f1": 0.8688524590163933, |
|
"eval_loss": 0.5652728080749512, |
|
"eval_runtime": 0.5588, |
|
"eval_samples_per_second": 178.951, |
|
"eval_steps_per_second": 7.158, |
|
"step": 39 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_f1": 0.8688524590163933, |
|
"eval_loss": 0.5592342019081116, |
|
"eval_runtime": 0.5516, |
|
"eval_samples_per_second": 181.294, |
|
"eval_steps_per_second": 7.252, |
|
"step": 42 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_f1": 0.8760330578512396, |
|
"eval_loss": 0.553566575050354, |
|
"eval_runtime": 0.558, |
|
"eval_samples_per_second": 179.226, |
|
"eval_steps_per_second": 7.169, |
|
"step": 45 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_f1": 0.8760330578512396, |
|
"eval_loss": 0.5487043857574463, |
|
"eval_runtime": 0.5688, |
|
"eval_samples_per_second": 175.802, |
|
"eval_steps_per_second": 7.032, |
|
"step": 48 |
|
}, |
|
{ |
|
"epoch": 16.67, |
|
"learning_rate": 4.938271604938272e-06, |
|
"loss": 0.5096, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_f1": 0.8760330578512396, |
|
"eval_loss": 0.5434445142745972, |
|
"eval_runtime": 0.5636, |
|
"eval_samples_per_second": 177.42, |
|
"eval_steps_per_second": 7.097, |
|
"step": 51 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_f1": 0.8760330578512396, |
|
"eval_loss": 0.5385234951972961, |
|
"eval_runtime": 0.561, |
|
"eval_samples_per_second": 178.247, |
|
"eval_steps_per_second": 7.13, |
|
"step": 54 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_f1": 0.8760330578512396, |
|
"eval_loss": 0.5339138507843018, |
|
"eval_runtime": 0.5531, |
|
"eval_samples_per_second": 180.806, |
|
"eval_steps_per_second": 7.232, |
|
"step": 57 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_f1": 0.8739495798319329, |
|
"eval_loss": 0.5293477177619934, |
|
"eval_runtime": 0.5612, |
|
"eval_samples_per_second": 178.191, |
|
"eval_steps_per_second": 7.128, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_f1": 0.8739495798319329, |
|
"eval_loss": 0.5248751640319824, |
|
"eval_runtime": 0.554, |
|
"eval_samples_per_second": 180.518, |
|
"eval_steps_per_second": 7.221, |
|
"step": 63 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_f1": 0.8739495798319329, |
|
"eval_loss": 0.5204405784606934, |
|
"eval_runtime": 0.564, |
|
"eval_samples_per_second": 177.317, |
|
"eval_steps_per_second": 7.093, |
|
"step": 66 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_f1": 0.8739495798319329, |
|
"eval_loss": 0.5157800912857056, |
|
"eval_runtime": 0.5507, |
|
"eval_samples_per_second": 181.589, |
|
"eval_steps_per_second": 7.264, |
|
"step": 69 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_f1": 0.8739495798319329, |
|
"eval_loss": 0.5112195014953613, |
|
"eval_runtime": 0.5502, |
|
"eval_samples_per_second": 181.737, |
|
"eval_steps_per_second": 7.269, |
|
"step": 72 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"learning_rate": 1.8518518518518519e-06, |
|
"loss": 0.4584, |
|
"step": 75 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_f1": 0.8739495798319329, |
|
"eval_loss": 0.5078128576278687, |
|
"eval_runtime": 0.5542, |
|
"eval_samples_per_second": 180.427, |
|
"eval_steps_per_second": 7.217, |
|
"step": 75 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_f1": 0.8739495798319329, |
|
"eval_loss": 0.5054234266281128, |
|
"eval_runtime": 0.5564, |
|
"eval_samples_per_second": 179.717, |
|
"eval_steps_per_second": 7.189, |
|
"step": 78 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_f1": 0.8739495798319329, |
|
"eval_loss": 0.503419041633606, |
|
"eval_runtime": 0.5536, |
|
"eval_samples_per_second": 180.639, |
|
"eval_steps_per_second": 7.226, |
|
"step": 81 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_f1": 0.8739495798319329, |
|
"eval_loss": 0.5020792484283447, |
|
"eval_runtime": 0.5563, |
|
"eval_samples_per_second": 179.771, |
|
"eval_steps_per_second": 7.191, |
|
"step": 84 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_f1": 0.8739495798319329, |
|
"eval_loss": 0.5012262463569641, |
|
"eval_runtime": 0.5542, |
|
"eval_samples_per_second": 180.449, |
|
"eval_steps_per_second": 7.218, |
|
"step": 87 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_f1": 0.8739495798319329, |
|
"eval_loss": 0.50089430809021, |
|
"eval_runtime": 0.553, |
|
"eval_samples_per_second": 180.845, |
|
"eval_steps_per_second": 7.234, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"step": 90, |
|
"total_flos": 2.7816295750742016e+17, |
|
"train_loss": 0.517905675040351, |
|
"train_runtime": 173.4592, |
|
"train_samples_per_second": 63.819, |
|
"train_steps_per_second": 0.519 |
|
} |
|
], |
|
"max_steps": 90, |
|
"num_train_epochs": 30, |
|
"total_flos": 2.7816295750742016e+17, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|