{ "best_metric": 0.030054476112127304, "best_model_checkpoint": "./dinov2_Liveness_detection_v2.2.1/checkpoint-960", "epoch": 5.0, "eval_steps": 64, "global_step": 990, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.32323232323232326, "grad_norm": 5.1993489265441895, "learning_rate": 4.696969696969697e-05, "loss": 0.4052, "step": 64 }, { "epoch": 0.32323232323232326, "eval_accuracy": 0.9712097686781231, "eval_f1": 0.9713372966580719, "eval_loss": 0.07746175676584244, "eval_precision": 0.9712492471516934, "eval_recall": 0.9712097686781231, "eval_runtime": 513.7785, "eval_samples_per_second": 73.962, "eval_steps_per_second": 9.245, "step": 64 }, { "epoch": 0.6464646464646465, "grad_norm": 4.368253231048584, "learning_rate": 4.3737373737373736e-05, "loss": 0.0784, "step": 128 }, { "epoch": 0.6464646464646465, "eval_accuracy": 0.9802889549724992, "eval_f1": 0.980265299265069, "eval_loss": 0.054525312036275864, "eval_precision": 0.9803559157542755, "eval_recall": 0.9802889549724992, "eval_runtime": 493.8537, "eval_samples_per_second": 76.946, "eval_steps_per_second": 9.618, "step": 128 }, { "epoch": 0.9696969696969697, "grad_norm": 6.4717583656311035, "learning_rate": 4.0505050505050506e-05, "loss": 0.0639, "step": 192 }, { "epoch": 0.9696969696969697, "eval_accuracy": 0.9771046606489644, "eval_f1": 0.9772131122819654, "eval_loss": 0.0614825114607811, "eval_precision": 0.9772293201056353, "eval_recall": 0.9771046606489644, "eval_runtime": 494.1919, "eval_samples_per_second": 76.893, "eval_steps_per_second": 9.612, "step": 192 }, { "epoch": 1.2929292929292928, "grad_norm": 5.717361927032471, "learning_rate": 3.7272727272727276e-05, "loss": 0.0479, "step": 256 }, { "epoch": 1.2929292929292928, "eval_accuracy": 0.9794994605121188, "eval_f1": 0.9793994612943837, "eval_loss": 0.057158615440130234, "eval_precision": 0.9800037878399945, "eval_recall": 0.9794994605121188, "eval_runtime": 451.5225, "eval_samples_per_second": 84.16, "eval_steps_per_second": 10.52, "step": 256 }, { "epoch": 1.6161616161616161, "grad_norm": 7.240455627441406, "learning_rate": 3.4040404040404045e-05, "loss": 0.0439, "step": 320 }, { "epoch": 1.6161616161616161, "eval_accuracy": 0.984394326166478, "eval_f1": 0.984415214874111, "eval_loss": 0.042214084416627884, "eval_precision": 0.9843782986693216, "eval_recall": 0.984394326166478, "eval_runtime": 528.4934, "eval_samples_per_second": 71.903, "eval_steps_per_second": 8.988, "step": 320 }, { "epoch": 1.9393939393939394, "grad_norm": 3.2924530506134033, "learning_rate": 3.080808080808081e-05, "loss": 0.0392, "step": 384 }, { "epoch": 1.9393939393939394, "eval_accuracy": 0.9802626384904866, "eval_f1": 0.9801401584145893, "eval_loss": 0.05642416328191757, "eval_precision": 0.980989991407714, "eval_recall": 0.9802626384904866, "eval_runtime": 541.8272, "eval_samples_per_second": 70.133, "eval_steps_per_second": 8.767, "step": 384 }, { "epoch": 2.2626262626262625, "grad_norm": 5.49556827545166, "learning_rate": 2.7575757575757578e-05, "loss": 0.0374, "step": 448 }, { "epoch": 2.2626262626262625, "eval_accuracy": 0.9837100976341483, "eval_f1": 0.9837088988305677, "eval_loss": 0.04635660722851753, "eval_precision": 0.983712570988981, "eval_recall": 0.9837100976341483, "eval_runtime": 523.4635, "eval_samples_per_second": 72.593, "eval_steps_per_second": 9.074, "step": 448 }, { "epoch": 2.5858585858585856, "grad_norm": 7.576784133911133, "learning_rate": 2.4343434343434344e-05, "loss": 0.0273, "step": 512 }, { "epoch": 2.5858585858585856, "eval_accuracy": 0.9861048974973026, "eval_f1": 0.9861281800402698, "eval_loss": 0.03779837116599083, "eval_precision": 0.9860990328572948, "eval_recall": 0.9861048974973026, "eval_runtime": 526.8186, "eval_samples_per_second": 72.131, "eval_steps_per_second": 9.016, "step": 512 }, { "epoch": 2.909090909090909, "grad_norm": 8.414101600646973, "learning_rate": 2.111111111111111e-05, "loss": 0.0271, "step": 576 }, { "epoch": 2.909090909090909, "eval_accuracy": 0.9883417984683808, "eval_f1": 0.9883335392334167, "eval_loss": 0.03357573598623276, "eval_precision": 0.988365298180521, "eval_recall": 0.9883417984683808, "eval_runtime": 528.7169, "eval_samples_per_second": 71.872, "eval_steps_per_second": 8.984, "step": 576 }, { "epoch": 3.2323232323232323, "grad_norm": 4.41958475112915, "learning_rate": 1.787878787878788e-05, "loss": 0.021, "step": 640 }, { "epoch": 3.2323232323232323, "eval_accuracy": 0.985894365641201, "eval_f1": 0.9859268508760648, "eval_loss": 0.04180537536740303, "eval_precision": 0.9859071918052413, "eval_recall": 0.985894365641201, "eval_runtime": 523.9915, "eval_samples_per_second": 72.52, "eval_steps_per_second": 9.065, "step": 640 }, { "epoch": 3.5555555555555554, "grad_norm": 10.126025199890137, "learning_rate": 1.4646464646464647e-05, "loss": 0.019, "step": 704 }, { "epoch": 3.5555555555555554, "eval_accuracy": 0.9848417063606937, "eval_f1": 0.9848982600089184, "eval_loss": 0.04540397599339485, "eval_precision": 0.9849383014159727, "eval_recall": 0.9848417063606937, "eval_runtime": 525.5117, "eval_samples_per_second": 72.31, "eval_steps_per_second": 9.039, "step": 704 }, { "epoch": 3.878787878787879, "grad_norm": 3.757537603378296, "learning_rate": 1.1414141414141415e-05, "loss": 0.0177, "step": 768 }, { "epoch": 3.878787878787879, "eval_accuracy": 0.9883154819863681, "eval_f1": 0.9883223194841958, "eval_loss": 0.03590450435876846, "eval_precision": 0.9883066841617396, "eval_recall": 0.9883154819863681, "eval_runtime": 522.9339, "eval_samples_per_second": 72.667, "eval_steps_per_second": 9.083, "step": 768 }, { "epoch": 4.202020202020202, "grad_norm": 4.959455966949463, "learning_rate": 8.181818181818183e-06, "loss": 0.0134, "step": 832 }, { "epoch": 4.202020202020202, "eval_accuracy": 0.9874470380799495, "eval_f1": 0.987400014046709, "eval_loss": 0.04097573831677437, "eval_precision": 0.9877259518894549, "eval_recall": 0.9874470380799495, "eval_runtime": 521.4997, "eval_samples_per_second": 72.867, "eval_steps_per_second": 9.108, "step": 832 }, { "epoch": 4.525252525252525, "grad_norm": 3.8119397163391113, "learning_rate": 4.949494949494949e-06, "loss": 0.0102, "step": 896 }, { "epoch": 4.525252525252525, "eval_accuracy": 0.9909997631516619, "eval_f1": 0.9910005190250708, "eval_loss": 0.031363558024168015, "eval_precision": 0.9909983512838277, "eval_recall": 0.9909997631516619, "eval_runtime": 523.3329, "eval_samples_per_second": 72.612, "eval_steps_per_second": 9.076, "step": 896 }, { "epoch": 4.848484848484849, "grad_norm": 3.6070823669433594, "learning_rate": 1.7171717171717171e-06, "loss": 0.0103, "step": 960 }, { "epoch": 4.848484848484849, "eval_accuracy": 0.9909997631516619, "eval_f1": 0.9909972985219008, "eval_loss": 0.030054476112127304, "eval_precision": 0.9910057473707247, "eval_recall": 0.9909997631516619, "eval_runtime": 534.5024, "eval_samples_per_second": 71.094, "eval_steps_per_second": 8.887, "step": 960 }, { "epoch": 5.0, "step": 990, "total_flos": 3.78521471397888e+18, "train_loss": 0.055960290434986654, "train_runtime": 18290.5686, "train_samples_per_second": 41.551, "train_steps_per_second": 0.054 } ], "logging_steps": 64, "max_steps": 990, "num_input_tokens_seen": 0, "num_train_epochs": 5, "save_steps": 64, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 3.78521471397888e+18, "train_batch_size": 768, "trial_name": null, "trial_params": null }