| { | |
| "best_metric": 0.9174279061436503, | |
| "best_model_checkpoint": "DynamicFreightPackinglist_Jun24/checkpoint-3000", | |
| "epoch": 2.657218777679362, | |
| "global_step": 3000, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.09, | |
| "eval_accuracy": 0.8657594809519709, | |
| "eval_f1": 0.294485668558126, | |
| "eval_loss": 0.6096277832984924, | |
| "eval_precision": 0.3776119402985075, | |
| "eval_recall": 0.24135463868352014, | |
| "eval_runtime": 37.7163, | |
| "eval_samples_per_second": 10.181, | |
| "eval_steps_per_second": 5.091, | |
| "step": 100 | |
| }, | |
| { | |
| "epoch": 0.18, | |
| "eval_accuracy": 0.9066833175437086, | |
| "eval_f1": 0.42788946412963086, | |
| "eval_loss": 0.466012567281723, | |
| "eval_precision": 0.49051950053954063, | |
| "eval_recall": 0.37944192702122587, | |
| "eval_runtime": 37.9564, | |
| "eval_samples_per_second": 10.117, | |
| "eval_steps_per_second": 5.058, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 0.27, | |
| "eval_accuracy": 0.9190566416903511, | |
| "eval_f1": 0.45627078849540204, | |
| "eval_loss": 0.3901040554046631, | |
| "eval_precision": 0.5035267021736001, | |
| "eval_recall": 0.4171237777247794, | |
| "eval_runtime": 37.9745, | |
| "eval_samples_per_second": 10.112, | |
| "eval_steps_per_second": 5.056, | |
| "step": 300 | |
| }, | |
| { | |
| "epoch": 0.35, | |
| "eval_accuracy": 0.9322768638934343, | |
| "eval_f1": 0.5466886577010912, | |
| "eval_loss": 0.3380320370197296, | |
| "eval_precision": 0.5840336134453782, | |
| "eval_recall": 0.5138325781063677, | |
| "eval_runtime": 37.9718, | |
| "eval_samples_per_second": 10.113, | |
| "eval_steps_per_second": 5.056, | |
| "step": 400 | |
| }, | |
| { | |
| "epoch": 0.44, | |
| "learning_rate": 8.333333333333334e-06, | |
| "loss": 0.4269, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 0.44, | |
| "eval_accuracy": 0.9360233112278586, | |
| "eval_f1": 0.5705544933078396, | |
| "eval_loss": 0.2771761417388916, | |
| "eval_precision": 0.6128148959474261, | |
| "eval_recall": 0.5337467207250179, | |
| "eval_runtime": 38.0237, | |
| "eval_samples_per_second": 10.099, | |
| "eval_steps_per_second": 5.049, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 0.53, | |
| "eval_accuracy": 0.9542962133608934, | |
| "eval_f1": 0.6891029650944577, | |
| "eval_loss": 0.2250644564628601, | |
| "eval_precision": 0.7247368421052631, | |
| "eval_recall": 0.6568089673264965, | |
| "eval_runtime": 37.8718, | |
| "eval_samples_per_second": 10.139, | |
| "eval_steps_per_second": 5.07, | |
| "step": 600 | |
| }, | |
| { | |
| "epoch": 0.62, | |
| "eval_accuracy": 0.9598082278299314, | |
| "eval_f1": 0.730193368491241, | |
| "eval_loss": 0.2054944485425949, | |
| "eval_precision": 0.7425718160522747, | |
| "eval_recall": 0.7182208442642499, | |
| "eval_runtime": 37.7502, | |
| "eval_samples_per_second": 10.172, | |
| "eval_steps_per_second": 5.086, | |
| "step": 700 | |
| }, | |
| { | |
| "epoch": 0.71, | |
| "eval_accuracy": 0.9699853587115667, | |
| "eval_f1": 0.7988021024324654, | |
| "eval_loss": 0.16418181359767914, | |
| "eval_precision": 0.819332998996991, | |
| "eval_recall": 0.7792749821130456, | |
| "eval_runtime": 37.9005, | |
| "eval_samples_per_second": 10.132, | |
| "eval_steps_per_second": 5.066, | |
| "step": 800 | |
| }, | |
| { | |
| "epoch": 0.8, | |
| "eval_accuracy": 0.9699710045072202, | |
| "eval_f1": 0.7916867469879518, | |
| "eval_loss": 0.1568066030740738, | |
| "eval_precision": 0.7999756513270027, | |
| "eval_recall": 0.783567851180539, | |
| "eval_runtime": 37.6869, | |
| "eval_samples_per_second": 10.189, | |
| "eval_steps_per_second": 5.095, | |
| "step": 900 | |
| }, | |
| { | |
| "epoch": 0.89, | |
| "learning_rate": 6.666666666666667e-06, | |
| "loss": 0.2059, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 0.89, | |
| "eval_accuracy": 0.9699135876898344, | |
| "eval_f1": 0.8125, | |
| "eval_loss": 0.15771125257015228, | |
| "eval_precision": 0.828826593897296, | |
| "eval_recall": 0.7968041974719771, | |
| "eval_runtime": 37.8726, | |
| "eval_samples_per_second": 10.139, | |
| "eval_steps_per_second": 5.07, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 0.97, | |
| "eval_accuracy": 0.9756839778371085, | |
| "eval_f1": 0.844042306046341, | |
| "eval_loss": 0.1233619749546051, | |
| "eval_precision": 0.8660143018441852, | |
| "eval_recall": 0.8231576436918674, | |
| "eval_runtime": 37.8462, | |
| "eval_samples_per_second": 10.146, | |
| "eval_steps_per_second": 5.073, | |
| "step": 1100 | |
| }, | |
| { | |
| "epoch": 1.06, | |
| "eval_accuracy": 0.9739327649068412, | |
| "eval_f1": 0.8383422200678624, | |
| "eval_loss": 0.13158756494522095, | |
| "eval_precision": 0.852180339985218, | |
| "eval_recall": 0.8249463391366564, | |
| "eval_runtime": 37.9995, | |
| "eval_samples_per_second": 10.105, | |
| "eval_steps_per_second": 5.053, | |
| "step": 1200 | |
| }, | |
| { | |
| "epoch": 1.15, | |
| "eval_accuracy": 0.9773921281543364, | |
| "eval_f1": 0.8546778437251422, | |
| "eval_loss": 0.12233193963766098, | |
| "eval_precision": 0.8777177328138746, | |
| "eval_recall": 0.8328165990937276, | |
| "eval_runtime": 37.8677, | |
| "eval_samples_per_second": 10.141, | |
| "eval_steps_per_second": 5.07, | |
| "step": 1300 | |
| }, | |
| { | |
| "epoch": 1.24, | |
| "eval_accuracy": 0.9784830476846669, | |
| "eval_f1": 0.8620398310199154, | |
| "eval_loss": 0.1114952489733696, | |
| "eval_precision": 0.8726783968719453, | |
| "eval_recall": 0.8516575244455045, | |
| "eval_runtime": 37.8077, | |
| "eval_samples_per_second": 10.157, | |
| "eval_steps_per_second": 5.078, | |
| "step": 1400 | |
| }, | |
| { | |
| "epoch": 1.33, | |
| "learning_rate": 5e-06, | |
| "loss": 0.1384, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 1.33, | |
| "eval_accuracy": 0.9778801711021158, | |
| "eval_f1": 0.8650332474689989, | |
| "eval_loss": 0.10301075130701065, | |
| "eval_precision": 0.8691465029493198, | |
| "eval_recall": 0.8609587407584068, | |
| "eval_runtime": 37.7478, | |
| "eval_samples_per_second": 10.173, | |
| "eval_steps_per_second": 5.086, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 1.42, | |
| "eval_accuracy": 0.9811529296931071, | |
| "eval_f1": 0.8748258947495913, | |
| "eval_loss": 0.09539026767015457, | |
| "eval_precision": 0.8887658422542144, | |
| "eval_recall": 0.8613164798473647, | |
| "eval_runtime": 37.6325, | |
| "eval_samples_per_second": 10.204, | |
| "eval_steps_per_second": 5.102, | |
| "step": 1600 | |
| }, | |
| { | |
| "epoch": 1.51, | |
| "eval_accuracy": 0.9819711193408549, | |
| "eval_f1": 0.8838249516441005, | |
| "eval_loss": 0.09302261471748352, | |
| "eval_precision": 0.8961755332189262, | |
| "eval_recall": 0.8718101597901264, | |
| "eval_runtime": 37.72, | |
| "eval_samples_per_second": 10.18, | |
| "eval_steps_per_second": 5.09, | |
| "step": 1700 | |
| }, | |
| { | |
| "epoch": 1.59, | |
| "eval_accuracy": 0.9812821175322252, | |
| "eval_f1": 0.8815182901275221, | |
| "eval_loss": 0.09258309751749039, | |
| "eval_precision": 0.8851749428880606, | |
| "eval_recall": 0.8778917243024088, | |
| "eval_runtime": 37.682, | |
| "eval_samples_per_second": 10.191, | |
| "eval_steps_per_second": 5.095, | |
| "step": 1800 | |
| }, | |
| { | |
| "epoch": 1.68, | |
| "eval_accuracy": 0.9810380960583355, | |
| "eval_f1": 0.8837905834431532, | |
| "eval_loss": 0.0902891755104065, | |
| "eval_precision": 0.8879393355801637, | |
| "eval_recall": 0.8796804197471977, | |
| "eval_runtime": 37.6694, | |
| "eval_samples_per_second": 10.194, | |
| "eval_steps_per_second": 5.097, | |
| "step": 1900 | |
| }, | |
| { | |
| "epoch": 1.77, | |
| "learning_rate": 3.3333333333333333e-06, | |
| "loss": 0.0968, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 1.77, | |
| "eval_accuracy": 0.9826314127407918, | |
| "eval_f1": 0.8884760592077666, | |
| "eval_loss": 0.08607935905456543, | |
| "eval_precision": 0.8930249367546079, | |
| "eval_recall": 0.8839732888146912, | |
| "eval_runtime": 37.6927, | |
| "eval_samples_per_second": 10.188, | |
| "eval_steps_per_second": 5.094, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 1.86, | |
| "eval_accuracy": 0.9845692303275629, | |
| "eval_f1": 0.8967495219885278, | |
| "eval_loss": 0.07529100030660629, | |
| "eval_precision": 0.8986826347305389, | |
| "eval_recall": 0.8948247078464107, | |
| "eval_runtime": 37.5991, | |
| "eval_samples_per_second": 10.213, | |
| "eval_steps_per_second": 5.107, | |
| "step": 2100 | |
| }, | |
| { | |
| "epoch": 1.95, | |
| "eval_accuracy": 0.9830046220537996, | |
| "eval_f1": 0.8961644162982435, | |
| "eval_loss": 0.08021637052297592, | |
| "eval_precision": 0.8979885057471264, | |
| "eval_recall": 0.8943477223944669, | |
| "eval_runtime": 37.5671, | |
| "eval_samples_per_second": 10.222, | |
| "eval_steps_per_second": 5.111, | |
| "step": 2200 | |
| }, | |
| { | |
| "epoch": 2.04, | |
| "eval_accuracy": 0.9849137312318779, | |
| "eval_f1": 0.9005910800644815, | |
| "eval_loss": 0.07370590418577194, | |
| "eval_precision": 0.9018294870261868, | |
| "eval_recall": 0.899356069639876, | |
| "eval_runtime": 37.6512, | |
| "eval_samples_per_second": 10.199, | |
| "eval_steps_per_second": 5.099, | |
| "step": 2300 | |
| }, | |
| { | |
| "epoch": 2.13, | |
| "eval_accuracy": 0.9839807079493583, | |
| "eval_f1": 0.9032528103324563, | |
| "eval_loss": 0.07483410835266113, | |
| "eval_precision": 0.9058527224754138, | |
| "eval_recall": 0.9006677796327212, | |
| "eval_runtime": 37.6471, | |
| "eval_samples_per_second": 10.2, | |
| "eval_steps_per_second": 5.1, | |
| "step": 2400 | |
| }, | |
| { | |
| "epoch": 2.21, | |
| "learning_rate": 1.6666666666666667e-06, | |
| "loss": 0.0918, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 2.21, | |
| "eval_accuracy": 0.985301294749232, | |
| "eval_f1": 0.907269366092194, | |
| "eval_loss": 0.07416214793920517, | |
| "eval_precision": 0.9074317070261243, | |
| "eval_recall": 0.9071070832339614, | |
| "eval_runtime": 37.7271, | |
| "eval_samples_per_second": 10.178, | |
| "eval_steps_per_second": 5.089, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 2.3, | |
| "eval_accuracy": 0.986693652570838, | |
| "eval_f1": 0.9162969180956949, | |
| "eval_loss": 0.06871066987514496, | |
| "eval_precision": 0.9214905933429812, | |
| "eval_recall": 0.911161459575483, | |
| "eval_runtime": 37.5742, | |
| "eval_samples_per_second": 10.22, | |
| "eval_steps_per_second": 5.11, | |
| "step": 2600 | |
| }, | |
| { | |
| "epoch": 2.39, | |
| "eval_accuracy": 0.9862773806447909, | |
| "eval_f1": 0.9115873679183333, | |
| "eval_loss": 0.06786704063415527, | |
| "eval_precision": 0.9127316198445905, | |
| "eval_recall": 0.9104459813975674, | |
| "eval_runtime": 37.6479, | |
| "eval_samples_per_second": 10.2, | |
| "eval_steps_per_second": 5.1, | |
| "step": 2700 | |
| }, | |
| { | |
| "epoch": 2.48, | |
| "eval_accuracy": 0.9870381534751529, | |
| "eval_f1": 0.9173381080274545, | |
| "eval_loss": 0.06866415590047836, | |
| "eval_precision": 0.9182698052336002, | |
| "eval_recall": 0.9164082995468639, | |
| "eval_runtime": 37.6027, | |
| "eval_samples_per_second": 10.212, | |
| "eval_steps_per_second": 5.106, | |
| "step": 2800 | |
| }, | |
| { | |
| "epoch": 2.57, | |
| "eval_accuracy": 0.9870237992708064, | |
| "eval_f1": 0.9173084960296136, | |
| "eval_loss": 0.06812075525522232, | |
| "eval_precision": 0.918569891187373, | |
| "eval_recall": 0.916050560457906, | |
| "eval_runtime": 37.5601, | |
| "eval_samples_per_second": 10.224, | |
| "eval_steps_per_second": 5.112, | |
| "step": 2900 | |
| }, | |
| { | |
| "epoch": 2.66, | |
| "learning_rate": 0.0, | |
| "loss": 0.074, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 2.66, | |
| "eval_accuracy": 0.9870812160881922, | |
| "eval_f1": 0.9174279061436503, | |
| "eval_loss": 0.06755248457193375, | |
| "eval_precision": 0.9186894655028099, | |
| "eval_recall": 0.916169806820892, | |
| "eval_runtime": 37.5655, | |
| "eval_samples_per_second": 10.222, | |
| "eval_steps_per_second": 5.111, | |
| "step": 3000 | |
| } | |
| ], | |
| "max_steps": 3000, | |
| "num_train_epochs": 3, | |
| "total_flos": 1592999774208000.0, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |