dinov2_Liveness_detection_v2.2.1 / trainer_state.json
nguyenkhoa's picture
End of training
1890f3d verified
raw
history blame
9.36 kB
{
"best_metric": 0.030054476112127304,
"best_model_checkpoint": "./dinov2_Liveness_detection_v2.2.1/checkpoint-960",
"epoch": 5.0,
"eval_steps": 64,
"global_step": 990,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.32323232323232326,
"grad_norm": 5.1993489265441895,
"learning_rate": 4.696969696969697e-05,
"loss": 0.4052,
"step": 64
},
{
"epoch": 0.32323232323232326,
"eval_accuracy": 0.9712097686781231,
"eval_f1": 0.9713372966580719,
"eval_loss": 0.07746175676584244,
"eval_precision": 0.9712492471516934,
"eval_recall": 0.9712097686781231,
"eval_runtime": 513.7785,
"eval_samples_per_second": 73.962,
"eval_steps_per_second": 9.245,
"step": 64
},
{
"epoch": 0.6464646464646465,
"grad_norm": 4.368253231048584,
"learning_rate": 4.3737373737373736e-05,
"loss": 0.0784,
"step": 128
},
{
"epoch": 0.6464646464646465,
"eval_accuracy": 0.9802889549724992,
"eval_f1": 0.980265299265069,
"eval_loss": 0.054525312036275864,
"eval_precision": 0.9803559157542755,
"eval_recall": 0.9802889549724992,
"eval_runtime": 493.8537,
"eval_samples_per_second": 76.946,
"eval_steps_per_second": 9.618,
"step": 128
},
{
"epoch": 0.9696969696969697,
"grad_norm": 6.4717583656311035,
"learning_rate": 4.0505050505050506e-05,
"loss": 0.0639,
"step": 192
},
{
"epoch": 0.9696969696969697,
"eval_accuracy": 0.9771046606489644,
"eval_f1": 0.9772131122819654,
"eval_loss": 0.0614825114607811,
"eval_precision": 0.9772293201056353,
"eval_recall": 0.9771046606489644,
"eval_runtime": 494.1919,
"eval_samples_per_second": 76.893,
"eval_steps_per_second": 9.612,
"step": 192
},
{
"epoch": 1.2929292929292928,
"grad_norm": 5.717361927032471,
"learning_rate": 3.7272727272727276e-05,
"loss": 0.0479,
"step": 256
},
{
"epoch": 1.2929292929292928,
"eval_accuracy": 0.9794994605121188,
"eval_f1": 0.9793994612943837,
"eval_loss": 0.057158615440130234,
"eval_precision": 0.9800037878399945,
"eval_recall": 0.9794994605121188,
"eval_runtime": 451.5225,
"eval_samples_per_second": 84.16,
"eval_steps_per_second": 10.52,
"step": 256
},
{
"epoch": 1.6161616161616161,
"grad_norm": 7.240455627441406,
"learning_rate": 3.4040404040404045e-05,
"loss": 0.0439,
"step": 320
},
{
"epoch": 1.6161616161616161,
"eval_accuracy": 0.984394326166478,
"eval_f1": 0.984415214874111,
"eval_loss": 0.042214084416627884,
"eval_precision": 0.9843782986693216,
"eval_recall": 0.984394326166478,
"eval_runtime": 528.4934,
"eval_samples_per_second": 71.903,
"eval_steps_per_second": 8.988,
"step": 320
},
{
"epoch": 1.9393939393939394,
"grad_norm": 3.2924530506134033,
"learning_rate": 3.080808080808081e-05,
"loss": 0.0392,
"step": 384
},
{
"epoch": 1.9393939393939394,
"eval_accuracy": 0.9802626384904866,
"eval_f1": 0.9801401584145893,
"eval_loss": 0.05642416328191757,
"eval_precision": 0.980989991407714,
"eval_recall": 0.9802626384904866,
"eval_runtime": 541.8272,
"eval_samples_per_second": 70.133,
"eval_steps_per_second": 8.767,
"step": 384
},
{
"epoch": 2.2626262626262625,
"grad_norm": 5.49556827545166,
"learning_rate": 2.7575757575757578e-05,
"loss": 0.0374,
"step": 448
},
{
"epoch": 2.2626262626262625,
"eval_accuracy": 0.9837100976341483,
"eval_f1": 0.9837088988305677,
"eval_loss": 0.04635660722851753,
"eval_precision": 0.983712570988981,
"eval_recall": 0.9837100976341483,
"eval_runtime": 523.4635,
"eval_samples_per_second": 72.593,
"eval_steps_per_second": 9.074,
"step": 448
},
{
"epoch": 2.5858585858585856,
"grad_norm": 7.576784133911133,
"learning_rate": 2.4343434343434344e-05,
"loss": 0.0273,
"step": 512
},
{
"epoch": 2.5858585858585856,
"eval_accuracy": 0.9861048974973026,
"eval_f1": 0.9861281800402698,
"eval_loss": 0.03779837116599083,
"eval_precision": 0.9860990328572948,
"eval_recall": 0.9861048974973026,
"eval_runtime": 526.8186,
"eval_samples_per_second": 72.131,
"eval_steps_per_second": 9.016,
"step": 512
},
{
"epoch": 2.909090909090909,
"grad_norm": 8.414101600646973,
"learning_rate": 2.111111111111111e-05,
"loss": 0.0271,
"step": 576
},
{
"epoch": 2.909090909090909,
"eval_accuracy": 0.9883417984683808,
"eval_f1": 0.9883335392334167,
"eval_loss": 0.03357573598623276,
"eval_precision": 0.988365298180521,
"eval_recall": 0.9883417984683808,
"eval_runtime": 528.7169,
"eval_samples_per_second": 71.872,
"eval_steps_per_second": 8.984,
"step": 576
},
{
"epoch": 3.2323232323232323,
"grad_norm": 4.41958475112915,
"learning_rate": 1.787878787878788e-05,
"loss": 0.021,
"step": 640
},
{
"epoch": 3.2323232323232323,
"eval_accuracy": 0.985894365641201,
"eval_f1": 0.9859268508760648,
"eval_loss": 0.04180537536740303,
"eval_precision": 0.9859071918052413,
"eval_recall": 0.985894365641201,
"eval_runtime": 523.9915,
"eval_samples_per_second": 72.52,
"eval_steps_per_second": 9.065,
"step": 640
},
{
"epoch": 3.5555555555555554,
"grad_norm": 10.126025199890137,
"learning_rate": 1.4646464646464647e-05,
"loss": 0.019,
"step": 704
},
{
"epoch": 3.5555555555555554,
"eval_accuracy": 0.9848417063606937,
"eval_f1": 0.9848982600089184,
"eval_loss": 0.04540397599339485,
"eval_precision": 0.9849383014159727,
"eval_recall": 0.9848417063606937,
"eval_runtime": 525.5117,
"eval_samples_per_second": 72.31,
"eval_steps_per_second": 9.039,
"step": 704
},
{
"epoch": 3.878787878787879,
"grad_norm": 3.757537603378296,
"learning_rate": 1.1414141414141415e-05,
"loss": 0.0177,
"step": 768
},
{
"epoch": 3.878787878787879,
"eval_accuracy": 0.9883154819863681,
"eval_f1": 0.9883223194841958,
"eval_loss": 0.03590450435876846,
"eval_precision": 0.9883066841617396,
"eval_recall": 0.9883154819863681,
"eval_runtime": 522.9339,
"eval_samples_per_second": 72.667,
"eval_steps_per_second": 9.083,
"step": 768
},
{
"epoch": 4.202020202020202,
"grad_norm": 4.959455966949463,
"learning_rate": 8.181818181818183e-06,
"loss": 0.0134,
"step": 832
},
{
"epoch": 4.202020202020202,
"eval_accuracy": 0.9874470380799495,
"eval_f1": 0.987400014046709,
"eval_loss": 0.04097573831677437,
"eval_precision": 0.9877259518894549,
"eval_recall": 0.9874470380799495,
"eval_runtime": 521.4997,
"eval_samples_per_second": 72.867,
"eval_steps_per_second": 9.108,
"step": 832
},
{
"epoch": 4.525252525252525,
"grad_norm": 3.8119397163391113,
"learning_rate": 4.949494949494949e-06,
"loss": 0.0102,
"step": 896
},
{
"epoch": 4.525252525252525,
"eval_accuracy": 0.9909997631516619,
"eval_f1": 0.9910005190250708,
"eval_loss": 0.031363558024168015,
"eval_precision": 0.9909983512838277,
"eval_recall": 0.9909997631516619,
"eval_runtime": 523.3329,
"eval_samples_per_second": 72.612,
"eval_steps_per_second": 9.076,
"step": 896
},
{
"epoch": 4.848484848484849,
"grad_norm": 3.6070823669433594,
"learning_rate": 1.7171717171717171e-06,
"loss": 0.0103,
"step": 960
},
{
"epoch": 4.848484848484849,
"eval_accuracy": 0.9909997631516619,
"eval_f1": 0.9909972985219008,
"eval_loss": 0.030054476112127304,
"eval_precision": 0.9910057473707247,
"eval_recall": 0.9909997631516619,
"eval_runtime": 534.5024,
"eval_samples_per_second": 71.094,
"eval_steps_per_second": 8.887,
"step": 960
},
{
"epoch": 5.0,
"step": 990,
"total_flos": 3.78521471397888e+18,
"train_loss": 0.055960290434986654,
"train_runtime": 18290.5686,
"train_samples_per_second": 41.551,
"train_steps_per_second": 0.054
}
],
"logging_steps": 64,
"max_steps": 990,
"num_input_tokens_seen": 0,
"num_train_epochs": 5,
"save_steps": 64,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 3.78521471397888e+18,
"train_batch_size": 768,
"trial_name": null,
"trial_params": null
}