|
{ |
|
"best_metric": 0.9796821008984106, |
|
"best_model_checkpoint": "test/checkpoint-1500", |
|
"epoch": 13.377926421404682, |
|
"global_step": 4000, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.03, |
|
"eval_accuracy": 0.8922687113634554, |
|
"eval_f1": 0.0, |
|
"eval_loss": 1.3138163089752197, |
|
"eval_precision": 0.0, |
|
"eval_recall": 0.0, |
|
"eval_runtime": 42.6447, |
|
"eval_samples_per_second": 10.06, |
|
"eval_steps_per_second": 1.688, |
|
"step": 10 |
|
}, |
|
{ |
|
"epoch": 0.07, |
|
"eval_accuracy": 0.8922687113634554, |
|
"eval_f1": 0.0, |
|
"eval_loss": 0.7134402394294739, |
|
"eval_precision": 0.0, |
|
"eval_recall": 0.0, |
|
"eval_runtime": 44.6528, |
|
"eval_samples_per_second": 9.607, |
|
"eval_steps_per_second": 1.612, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 0.1, |
|
"eval_accuracy": 0.8922687113634554, |
|
"eval_f1": 0.0, |
|
"eval_loss": 0.6043053865432739, |
|
"eval_precision": 0.0, |
|
"eval_recall": 0.0, |
|
"eval_runtime": 44.2765, |
|
"eval_samples_per_second": 9.689, |
|
"eval_steps_per_second": 1.626, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"eval_accuracy": 0.8922687113634554, |
|
"eval_f1": 0.0, |
|
"eval_loss": 0.5121276378631592, |
|
"eval_precision": 0.0, |
|
"eval_recall": 0.0, |
|
"eval_runtime": 45.3257, |
|
"eval_samples_per_second": 9.465, |
|
"eval_steps_per_second": 1.589, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 0.17, |
|
"eval_accuracy": 0.8922687113634554, |
|
"eval_f1": 0.0, |
|
"eval_loss": 0.4018501937389374, |
|
"eval_precision": 0.0, |
|
"eval_recall": 0.0, |
|
"eval_runtime": 44.7272, |
|
"eval_samples_per_second": 9.591, |
|
"eval_steps_per_second": 1.61, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"eval_accuracy": 0.908479477859436, |
|
"eval_f1": 0.0, |
|
"eval_loss": 0.3501987159252167, |
|
"eval_precision": 0.0, |
|
"eval_recall": 0.0, |
|
"eval_runtime": 44.7765, |
|
"eval_samples_per_second": 9.581, |
|
"eval_steps_per_second": 1.608, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 0.23, |
|
"eval_accuracy": 0.9237218434108938, |
|
"eval_f1": 0.0, |
|
"eval_loss": 0.29354768991470337, |
|
"eval_precision": 0.0, |
|
"eval_recall": 0.0, |
|
"eval_runtime": 44.776, |
|
"eval_samples_per_second": 9.581, |
|
"eval_steps_per_second": 1.608, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 0.27, |
|
"eval_accuracy": 0.9264413255153751, |
|
"eval_f1": 0.0008230452674897119, |
|
"eval_loss": 0.24890266358852386, |
|
"eval_precision": 0.001594896331738437, |
|
"eval_recall": 0.0005546311702717693, |
|
"eval_runtime": 44.807, |
|
"eval_samples_per_second": 9.574, |
|
"eval_steps_per_second": 1.607, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"eval_accuracy": 0.9392427900559815, |
|
"eval_f1": 0.013897161008536827, |
|
"eval_loss": 0.2203027307987213, |
|
"eval_precision": 0.02445842068483578, |
|
"eval_recall": 0.009706045479755962, |
|
"eval_runtime": 44.7926, |
|
"eval_samples_per_second": 9.577, |
|
"eval_steps_per_second": 1.607, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 0.33, |
|
"eval_accuracy": 0.935727361969701, |
|
"eval_f1": 0.00045840018336007336, |
|
"eval_loss": 0.19940191507339478, |
|
"eval_precision": 0.001321003963011889, |
|
"eval_recall": 0.00027731558513588466, |
|
"eval_runtime": 44.7253, |
|
"eval_samples_per_second": 9.592, |
|
"eval_steps_per_second": 1.61, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.37, |
|
"eval_accuracy": 0.943779682152238, |
|
"eval_f1": 0.07579030041233065, |
|
"eval_loss": 0.1813557893037796, |
|
"eval_precision": 0.12979152656355078, |
|
"eval_recall": 0.053521907931225736, |
|
"eval_runtime": 44.6764, |
|
"eval_samples_per_second": 9.602, |
|
"eval_steps_per_second": 1.612, |
|
"step": 110 |
|
}, |
|
{ |
|
"epoch": 0.4, |
|
"eval_accuracy": 0.9479053354912313, |
|
"eval_f1": 0.11372837688627163, |
|
"eval_loss": 0.16338485479354858, |
|
"eval_precision": 0.16903719912472648, |
|
"eval_recall": 0.08569051580698835, |
|
"eval_runtime": 44.7776, |
|
"eval_samples_per_second": 9.581, |
|
"eval_steps_per_second": 1.608, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 0.43, |
|
"eval_accuracy": 0.9628027911172429, |
|
"eval_f1": 0.33931930904737473, |
|
"eval_loss": 0.14094215631484985, |
|
"eval_precision": 0.4426595269968764, |
|
"eval_recall": 0.27509706045479754, |
|
"eval_runtime": 44.9683, |
|
"eval_samples_per_second": 9.54, |
|
"eval_steps_per_second": 1.601, |
|
"step": 130 |
|
}, |
|
{ |
|
"epoch": 0.47, |
|
"eval_accuracy": 0.9663580165026133, |
|
"eval_f1": 0.34743875278396436, |
|
"eval_loss": 0.12451943010091782, |
|
"eval_precision": 0.40746268656716417, |
|
"eval_recall": 0.30282861896838603, |
|
"eval_runtime": 44.682, |
|
"eval_samples_per_second": 9.601, |
|
"eval_steps_per_second": 1.611, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"eval_accuracy": 0.9711734896924995, |
|
"eval_f1": 0.47246835443037977, |
|
"eval_loss": 0.11197753250598907, |
|
"eval_precision": 0.5501105379513633, |
|
"eval_recall": 0.4140321686078758, |
|
"eval_runtime": 44.7253, |
|
"eval_samples_per_second": 9.592, |
|
"eval_steps_per_second": 1.61, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 0.54, |
|
"eval_accuracy": 0.9736674537688043, |
|
"eval_f1": 0.5392111368909513, |
|
"eval_loss": 0.09976229071617126, |
|
"eval_precision": 0.6096537250786989, |
|
"eval_recall": 0.48336106489184694, |
|
"eval_runtime": 44.7165, |
|
"eval_samples_per_second": 9.594, |
|
"eval_steps_per_second": 1.61, |
|
"step": 160 |
|
}, |
|
{ |
|
"epoch": 0.57, |
|
"eval_accuracy": 0.9746623862460534, |
|
"eval_f1": 0.5685945368533496, |
|
"eval_loss": 0.09186050295829773, |
|
"eval_precision": 0.6321683067526298, |
|
"eval_recall": 0.5166389351081531, |
|
"eval_runtime": 44.7738, |
|
"eval_samples_per_second": 9.582, |
|
"eval_steps_per_second": 1.608, |
|
"step": 170 |
|
}, |
|
{ |
|
"epoch": 0.6, |
|
"eval_accuracy": 0.9771696160887214, |
|
"eval_f1": 0.5888754534461911, |
|
"eval_loss": 0.0845290869474411, |
|
"eval_precision": 0.6471760797342193, |
|
"eval_recall": 0.5402107598447032, |
|
"eval_runtime": 44.7399, |
|
"eval_samples_per_second": 9.589, |
|
"eval_steps_per_second": 1.609, |
|
"step": 180 |
|
}, |
|
{ |
|
"epoch": 0.64, |
|
"eval_accuracy": 0.980194210819559, |
|
"eval_f1": 0.6471658078205517, |
|
"eval_loss": 0.07714465260505676, |
|
"eval_precision": 0.7135695187165776, |
|
"eval_recall": 0.5920687742651137, |
|
"eval_runtime": 44.734, |
|
"eval_samples_per_second": 9.59, |
|
"eval_steps_per_second": 1.61, |
|
"step": 190 |
|
}, |
|
{ |
|
"epoch": 0.67, |
|
"eval_accuracy": 0.9795839855668462, |
|
"eval_f1": 0.7072773084333779, |
|
"eval_loss": 0.07666940242052078, |
|
"eval_precision": 0.7596306908627826, |
|
"eval_recall": 0.6616749861342207, |
|
"eval_runtime": 44.7886, |
|
"eval_samples_per_second": 9.578, |
|
"eval_steps_per_second": 1.608, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 0.7, |
|
"eval_accuracy": 0.9832586028494866, |
|
"eval_f1": 0.7367480643240022, |
|
"eval_loss": 0.06706634908914566, |
|
"eval_precision": 0.7954983922829582, |
|
"eval_recall": 0.6860787576261785, |
|
"eval_runtime": 44.9641, |
|
"eval_samples_per_second": 9.541, |
|
"eval_steps_per_second": 1.601, |
|
"step": 210 |
|
}, |
|
{ |
|
"epoch": 0.74, |
|
"eval_accuracy": 0.9847576344485421, |
|
"eval_f1": 0.7383826191913097, |
|
"eval_loss": 0.06665363162755966, |
|
"eval_precision": 0.8097286565188617, |
|
"eval_recall": 0.6785912368275097, |
|
"eval_runtime": 44.8134, |
|
"eval_samples_per_second": 9.573, |
|
"eval_steps_per_second": 1.607, |
|
"step": 220 |
|
}, |
|
{ |
|
"epoch": 0.77, |
|
"eval_accuracy": 0.9845321164203656, |
|
"eval_f1": 0.752096513167574, |
|
"eval_loss": 0.06071800738573074, |
|
"eval_precision": 0.8010028204324663, |
|
"eval_recall": 0.7088186356073212, |
|
"eval_runtime": 44.7268, |
|
"eval_samples_per_second": 9.592, |
|
"eval_steps_per_second": 1.61, |
|
"step": 230 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"eval_accuracy": 0.986482184075774, |
|
"eval_f1": 0.7756542193472508, |
|
"eval_loss": 0.057662855833768845, |
|
"eval_precision": 0.8254067584480601, |
|
"eval_recall": 0.7315585135884637, |
|
"eval_runtime": 44.6791, |
|
"eval_samples_per_second": 9.602, |
|
"eval_steps_per_second": 1.611, |
|
"step": 240 |
|
}, |
|
{ |
|
"epoch": 0.84, |
|
"eval_accuracy": 0.9871454723939402, |
|
"eval_f1": 0.7851227662356531, |
|
"eval_loss": 0.054133981466293335, |
|
"eval_precision": 0.8245346353371986, |
|
"eval_recall": 0.7493067110371603, |
|
"eval_runtime": 44.7641, |
|
"eval_samples_per_second": 9.584, |
|
"eval_steps_per_second": 1.608, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 0.87, |
|
"eval_accuracy": 0.9884985805629991, |
|
"eval_f1": 0.8150755242704208, |
|
"eval_loss": 0.05026474595069885, |
|
"eval_precision": 0.8649237472766884, |
|
"eval_recall": 0.7706600110926234, |
|
"eval_runtime": 44.9736, |
|
"eval_samples_per_second": 9.539, |
|
"eval_steps_per_second": 1.601, |
|
"step": 260 |
|
}, |
|
{ |
|
"epoch": 0.9, |
|
"eval_accuracy": 0.9881934679366426, |
|
"eval_f1": 0.801503541997976, |
|
"eval_loss": 0.04910367354750633, |
|
"eval_precision": 0.8372093023255814, |
|
"eval_recall": 0.7687188019966722, |
|
"eval_runtime": 44.8146, |
|
"eval_samples_per_second": 9.573, |
|
"eval_steps_per_second": 1.607, |
|
"step": 270 |
|
}, |
|
{ |
|
"epoch": 0.94, |
|
"eval_accuracy": 0.987875089543923, |
|
"eval_f1": 0.8106457242582897, |
|
"eval_loss": 0.04733191058039665, |
|
"eval_precision": 0.8522935779816514, |
|
"eval_recall": 0.7728785357737105, |
|
"eval_runtime": 44.8863, |
|
"eval_samples_per_second": 9.557, |
|
"eval_steps_per_second": 1.604, |
|
"step": 280 |
|
}, |
|
{ |
|
"epoch": 0.97, |
|
"eval_accuracy": 0.9887904274229923, |
|
"eval_f1": 0.8112208387004436, |
|
"eval_loss": 0.046026937663555145, |
|
"eval_precision": 0.8382135462880804, |
|
"eval_recall": 0.785912368275097, |
|
"eval_runtime": 44.8674, |
|
"eval_samples_per_second": 9.562, |
|
"eval_steps_per_second": 1.605, |
|
"step": 290 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.9894404499747951, |
|
"eval_f1": 0.8500071766901106, |
|
"eval_loss": 0.0429680198431015, |
|
"eval_precision": 0.880987801249628, |
|
"eval_recall": 0.8211314475873545, |
|
"eval_runtime": 45.1867, |
|
"eval_samples_per_second": 9.494, |
|
"eval_steps_per_second": 1.593, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 1.04, |
|
"eval_accuracy": 0.9901170040593245, |
|
"eval_f1": 0.8402282453637661, |
|
"eval_loss": 0.04167770594358444, |
|
"eval_precision": 0.8651586368977673, |
|
"eval_recall": 0.8166943982251803, |
|
"eval_runtime": 44.8739, |
|
"eval_samples_per_second": 9.56, |
|
"eval_steps_per_second": 1.604, |
|
"step": 310 |
|
}, |
|
{ |
|
"epoch": 1.07, |
|
"eval_accuracy": 0.9908333554429439, |
|
"eval_f1": 0.8512689635616051, |
|
"eval_loss": 0.039857033640146255, |
|
"eval_precision": 0.8709022338265158, |
|
"eval_recall": 0.8325013865779257, |
|
"eval_runtime": 44.8161, |
|
"eval_samples_per_second": 9.572, |
|
"eval_steps_per_second": 1.607, |
|
"step": 320 |
|
}, |
|
{ |
|
"epoch": 1.1, |
|
"eval_accuracy": 0.9919211482847364, |
|
"eval_f1": 0.8664764621968616, |
|
"eval_loss": 0.03763346001505852, |
|
"eval_precision": 0.8921856639247944, |
|
"eval_recall": 0.8422074320576817, |
|
"eval_runtime": 45.0124, |
|
"eval_samples_per_second": 9.531, |
|
"eval_steps_per_second": 1.6, |
|
"step": 330 |
|
}, |
|
{ |
|
"epoch": 1.14, |
|
"eval_accuracy": 0.992106869013823, |
|
"eval_f1": 0.8503758332151468, |
|
"eval_loss": 0.035481277853250504, |
|
"eval_precision": 0.8702467343976777, |
|
"eval_recall": 0.8313921242373822, |
|
"eval_runtime": 44.8357, |
|
"eval_samples_per_second": 9.568, |
|
"eval_steps_per_second": 1.606, |
|
"step": 340 |
|
}, |
|
{ |
|
"epoch": 1.17, |
|
"eval_accuracy": 0.9925048420047227, |
|
"eval_f1": 0.8676303854875284, |
|
"eval_loss": 0.03401191905140877, |
|
"eval_precision": 0.8872463768115942, |
|
"eval_recall": 0.8488630061009429, |
|
"eval_runtime": 44.9137, |
|
"eval_samples_per_second": 9.552, |
|
"eval_steps_per_second": 1.603, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 1.2, |
|
"eval_accuracy": 0.9926905627338092, |
|
"eval_f1": 0.8718825708992448, |
|
"eval_loss": 0.032262638211250305, |
|
"eval_precision": 0.8968044561712107, |
|
"eval_recall": 0.8483083749306711, |
|
"eval_runtime": 44.876, |
|
"eval_samples_per_second": 9.56, |
|
"eval_steps_per_second": 1.604, |
|
"step": 360 |
|
}, |
|
{ |
|
"epoch": 1.24, |
|
"eval_accuracy": 0.9930487384256188, |
|
"eval_f1": 0.8813077469793889, |
|
"eval_loss": 0.03254028782248497, |
|
"eval_precision": 0.9040536599591718, |
|
"eval_recall": 0.8596783139212424, |
|
"eval_runtime": 44.7683, |
|
"eval_samples_per_second": 9.583, |
|
"eval_steps_per_second": 1.608, |
|
"step": 370 |
|
}, |
|
{ |
|
"epoch": 1.27, |
|
"eval_accuracy": 0.9927038285001725, |
|
"eval_f1": 0.8627060830017056, |
|
"eval_loss": 0.030650299042463303, |
|
"eval_precision": 0.8848396501457726, |
|
"eval_recall": 0.8416528008874099, |
|
"eval_runtime": 44.7059, |
|
"eval_samples_per_second": 9.596, |
|
"eval_steps_per_second": 1.611, |
|
"step": 380 |
|
}, |
|
{ |
|
"epoch": 1.3, |
|
"eval_accuracy": 0.9934467114165185, |
|
"eval_f1": 0.8900583131844688, |
|
"eval_loss": 0.029178058728575706, |
|
"eval_precision": 0.9135766423357664, |
|
"eval_recall": 0.867720465890183, |
|
"eval_runtime": 44.67, |
|
"eval_samples_per_second": 9.604, |
|
"eval_steps_per_second": 1.612, |
|
"step": 390 |
|
}, |
|
{ |
|
"epoch": 1.34, |
|
"eval_accuracy": 0.993300787986522, |
|
"eval_f1": 0.8887311950042579, |
|
"eval_loss": 0.02753848023712635, |
|
"eval_precision": 0.9101744186046512, |
|
"eval_recall": 0.8682750970604548, |
|
"eval_runtime": 44.9312, |
|
"eval_samples_per_second": 9.548, |
|
"eval_steps_per_second": 1.602, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 1.37, |
|
"eval_accuracy": 0.9936456979119683, |
|
"eval_f1": 0.894469525959368, |
|
"eval_loss": 0.027282511815428734, |
|
"eval_precision": 0.9103963239517519, |
|
"eval_recall": 0.8790904048807543, |
|
"eval_runtime": 44.6914, |
|
"eval_samples_per_second": 9.599, |
|
"eval_steps_per_second": 1.611, |
|
"step": 410 |
|
}, |
|
{ |
|
"epoch": 1.4, |
|
"eval_accuracy": 0.9922925897429095, |
|
"eval_f1": 0.8725379853685987, |
|
"eval_loss": 0.02893451787531376, |
|
"eval_precision": 0.8854940034266133, |
|
"eval_recall": 0.8599556295063783, |
|
"eval_runtime": 44.7493, |
|
"eval_samples_per_second": 9.587, |
|
"eval_steps_per_second": 1.609, |
|
"step": 420 |
|
}, |
|
{ |
|
"epoch": 1.44, |
|
"eval_accuracy": 0.9938712159401448, |
|
"eval_f1": 0.8959954719117023, |
|
"eval_loss": 0.024990031495690346, |
|
"eval_precision": 0.9147645189251662, |
|
"eval_recall": 0.8779811425402108, |
|
"eval_runtime": 44.6669, |
|
"eval_samples_per_second": 9.604, |
|
"eval_steps_per_second": 1.612, |
|
"step": 430 |
|
}, |
|
{ |
|
"epoch": 1.47, |
|
"eval_accuracy": 0.9938181528746916, |
|
"eval_f1": 0.8929327126534067, |
|
"eval_loss": 0.026491543278098106, |
|
"eval_precision": 0.9086993970714901, |
|
"eval_recall": 0.8777038269550749, |
|
"eval_runtime": 44.7596, |
|
"eval_samples_per_second": 9.585, |
|
"eval_steps_per_second": 1.609, |
|
"step": 440 |
|
}, |
|
{ |
|
"epoch": 1.51, |
|
"eval_accuracy": 0.9945610357910376, |
|
"eval_f1": 0.9141895681435781, |
|
"eval_loss": 0.0247773639857769, |
|
"eval_precision": 0.9245604083947816, |
|
"eval_recall": 0.9040488075429839, |
|
"eval_runtime": 44.7459, |
|
"eval_samples_per_second": 9.587, |
|
"eval_steps_per_second": 1.609, |
|
"step": 450 |
|
}, |
|
{ |
|
"epoch": 1.54, |
|
"eval_accuracy": 0.9943753150619511, |
|
"eval_f1": 0.9076814658210007, |
|
"eval_loss": 0.0243705864995718, |
|
"eval_precision": 0.9229005445686443, |
|
"eval_recall": 0.8929561841375485, |
|
"eval_runtime": 44.7374, |
|
"eval_samples_per_second": 9.589, |
|
"eval_steps_per_second": 1.609, |
|
"step": 460 |
|
}, |
|
{ |
|
"epoch": 1.57, |
|
"eval_accuracy": 0.994534504258311, |
|
"eval_f1": 0.9149444678757205, |
|
"eval_loss": 0.023830989375710487, |
|
"eval_precision": 0.9278585685771314, |
|
"eval_recall": 0.9023849140321686, |
|
"eval_runtime": 44.7741, |
|
"eval_samples_per_second": 9.581, |
|
"eval_steps_per_second": 1.608, |
|
"step": 470 |
|
}, |
|
{ |
|
"epoch": 1.61, |
|
"eval_accuracy": 0.9947069592210342, |
|
"eval_f1": 0.9177099451399635, |
|
"eval_loss": 0.022406980395317078, |
|
"eval_precision": 0.931201827005424, |
|
"eval_recall": 0.9046034387132557, |
|
"eval_runtime": 44.7025, |
|
"eval_samples_per_second": 9.597, |
|
"eval_steps_per_second": 1.611, |
|
"step": 480 |
|
}, |
|
{ |
|
"epoch": 1.64, |
|
"eval_accuracy": 0.9947069592210342, |
|
"eval_f1": 0.9264129826524903, |
|
"eval_loss": 0.023025579750537872, |
|
"eval_precision": 0.9347826086956522, |
|
"eval_recall": 0.918191902384914, |
|
"eval_runtime": 45.0649, |
|
"eval_samples_per_second": 9.52, |
|
"eval_steps_per_second": 1.598, |
|
"step": 490 |
|
}, |
|
{ |
|
"epoch": 1.67, |
|
"learning_rate": 9.5e-06, |
|
"loss": 0.1784, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.67, |
|
"eval_accuracy": 0.9953702475392003, |
|
"eval_f1": 0.9400780379041248, |
|
"eval_loss": 0.022061465308070183, |
|
"eval_precision": 0.9448179271708683, |
|
"eval_recall": 0.9353854686633388, |
|
"eval_runtime": 44.7675, |
|
"eval_samples_per_second": 9.583, |
|
"eval_steps_per_second": 1.608, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.71, |
|
"eval_accuracy": 0.9954100448382903, |
|
"eval_f1": 0.9358616843279419, |
|
"eval_loss": 0.02172040194272995, |
|
"eval_precision": 0.9411104879416713, |
|
"eval_recall": 0.9306711037160288, |
|
"eval_runtime": 44.9669, |
|
"eval_samples_per_second": 9.54, |
|
"eval_steps_per_second": 1.601, |
|
"step": 510 |
|
}, |
|
{ |
|
"epoch": 1.74, |
|
"eval_accuracy": 0.9952243241092038, |
|
"eval_f1": 0.9297780259667735, |
|
"eval_loss": 0.021418150514364243, |
|
"eval_precision": 0.9361821759910036, |
|
"eval_recall": 0.9234608985024958, |
|
"eval_runtime": 44.7829, |
|
"eval_samples_per_second": 9.58, |
|
"eval_steps_per_second": 1.608, |
|
"step": 520 |
|
}, |
|
{ |
|
"epoch": 1.77, |
|
"eval_accuracy": 0.9950651349128439, |
|
"eval_f1": 0.9294002516426674, |
|
"eval_loss": 0.02137417532503605, |
|
"eval_precision": 0.937129968987877, |
|
"eval_recall": 0.9217970049916805, |
|
"eval_runtime": 44.837, |
|
"eval_samples_per_second": 9.568, |
|
"eval_steps_per_second": 1.606, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 1.81, |
|
"eval_accuracy": 0.9954100448382903, |
|
"eval_f1": 0.9379098646574578, |
|
"eval_loss": 0.02044159732758999, |
|
"eval_precision": 0.94383600112328, |
|
"eval_recall": 0.9320576816417082, |
|
"eval_runtime": 44.8548, |
|
"eval_samples_per_second": 9.564, |
|
"eval_steps_per_second": 1.605, |
|
"step": 540 |
|
}, |
|
{ |
|
"epoch": 1.84, |
|
"eval_accuracy": 0.9959274097264599, |
|
"eval_f1": 0.9561111111111111, |
|
"eval_loss": 0.020166810601949692, |
|
"eval_precision": 0.9577072899276572, |
|
"eval_recall": 0.954520244037715, |
|
"eval_runtime": 44.8166, |
|
"eval_samples_per_second": 9.572, |
|
"eval_steps_per_second": 1.607, |
|
"step": 550 |
|
}, |
|
{ |
|
"epoch": 1.87, |
|
"eval_accuracy": 0.9952375898755671, |
|
"eval_f1": 0.9289403881055422, |
|
"eval_loss": 0.020729683339595795, |
|
"eval_precision": 0.935338768625246, |
|
"eval_recall": 0.9226289517470881, |
|
"eval_runtime": 44.8369, |
|
"eval_samples_per_second": 9.568, |
|
"eval_steps_per_second": 1.606, |
|
"step": 560 |
|
}, |
|
{ |
|
"epoch": 1.91, |
|
"eval_accuracy": 0.9960600673900931, |
|
"eval_f1": 0.9606211869107044, |
|
"eval_loss": 0.019887683913111687, |
|
"eval_precision": 0.9606211869107044, |
|
"eval_recall": 0.9606211869107044, |
|
"eval_runtime": 44.8366, |
|
"eval_samples_per_second": 9.568, |
|
"eval_steps_per_second": 1.606, |
|
"step": 570 |
|
}, |
|
{ |
|
"epoch": 1.94, |
|
"eval_accuracy": 0.9956753601655568, |
|
"eval_f1": 0.9422407794015311, |
|
"eval_loss": 0.021609965711832047, |
|
"eval_precision": 0.945794914780665, |
|
"eval_recall": 0.9387132556849695, |
|
"eval_runtime": 44.9147, |
|
"eval_samples_per_second": 9.551, |
|
"eval_steps_per_second": 1.603, |
|
"step": 580 |
|
}, |
|
{ |
|
"epoch": 1.97, |
|
"eval_accuracy": 0.9960468016237298, |
|
"eval_f1": 0.9564975677553856, |
|
"eval_loss": 0.019716205075383186, |
|
"eval_precision": 0.9587628865979382, |
|
"eval_recall": 0.9542429284525791, |
|
"eval_runtime": 45.3593, |
|
"eval_samples_per_second": 9.458, |
|
"eval_steps_per_second": 1.587, |
|
"step": 590 |
|
}, |
|
{ |
|
"epoch": 2.01, |
|
"eval_accuracy": 0.9957549547637367, |
|
"eval_f1": 0.9439577249339453, |
|
"eval_loss": 0.020143885165452957, |
|
"eval_precision": 0.9467224546722455, |
|
"eval_recall": 0.9412090959511925, |
|
"eval_runtime": 45.0377, |
|
"eval_samples_per_second": 9.525, |
|
"eval_steps_per_second": 1.599, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 2.04, |
|
"eval_accuracy": 0.9955029052028336, |
|
"eval_f1": 0.9359207036158034, |
|
"eval_loss": 0.019947798922657967, |
|
"eval_precision": 0.9423671633398931, |
|
"eval_recall": 0.9295618413754853, |
|
"eval_runtime": 45.1113, |
|
"eval_samples_per_second": 9.51, |
|
"eval_steps_per_second": 1.596, |
|
"step": 610 |
|
}, |
|
{ |
|
"epoch": 2.07, |
|
"eval_accuracy": 0.9961131304555464, |
|
"eval_f1": 0.9537564227190668, |
|
"eval_loss": 0.01930239051580429, |
|
"eval_precision": 0.9552155771905424, |
|
"eval_recall": 0.9523017193566279, |
|
"eval_runtime": 45.0399, |
|
"eval_samples_per_second": 9.525, |
|
"eval_steps_per_second": 1.599, |
|
"step": 620 |
|
}, |
|
{ |
|
"epoch": 2.11, |
|
"eval_accuracy": 0.9959141439600966, |
|
"eval_f1": 0.9510664993726474, |
|
"eval_loss": 0.020125582814216614, |
|
"eval_precision": 0.9562657695542472, |
|
"eval_recall": 0.9459234608985025, |
|
"eval_runtime": 44.9443, |
|
"eval_samples_per_second": 9.545, |
|
"eval_steps_per_second": 1.602, |
|
"step": 630 |
|
}, |
|
{ |
|
"epoch": 2.14, |
|
"eval_accuracy": 0.9965376349791727, |
|
"eval_f1": 0.9709141274238227, |
|
"eval_loss": 0.01933199167251587, |
|
"eval_precision": 0.9698395130049806, |
|
"eval_recall": 0.9719911259012757, |
|
"eval_runtime": 44.9595, |
|
"eval_samples_per_second": 9.542, |
|
"eval_steps_per_second": 1.601, |
|
"step": 640 |
|
}, |
|
{ |
|
"epoch": 2.17, |
|
"eval_accuracy": 0.9962988511846329, |
|
"eval_f1": 0.9642262895174709, |
|
"eval_loss": 0.0191953107714653, |
|
"eval_precision": 0.9642262895174709, |
|
"eval_recall": 0.9642262895174709, |
|
"eval_runtime": 44.8109, |
|
"eval_samples_per_second": 9.574, |
|
"eval_steps_per_second": 1.607, |
|
"step": 650 |
|
}, |
|
{ |
|
"epoch": 2.21, |
|
"eval_accuracy": 0.9957814862964633, |
|
"eval_f1": 0.947662247034194, |
|
"eval_loss": 0.019274834543466568, |
|
"eval_precision": 0.9539196403484125, |
|
"eval_recall": 0.9414864115363284, |
|
"eval_runtime": 45.2879, |
|
"eval_samples_per_second": 9.473, |
|
"eval_steps_per_second": 1.59, |
|
"step": 660 |
|
}, |
|
{ |
|
"epoch": 2.24, |
|
"eval_accuracy": 0.9965906980446261, |
|
"eval_f1": 0.9721568084222192, |
|
"eval_loss": 0.018348801881074905, |
|
"eval_precision": 0.9712150567395517, |
|
"eval_recall": 0.9731003882418192, |
|
"eval_runtime": 44.979, |
|
"eval_samples_per_second": 9.538, |
|
"eval_steps_per_second": 1.601, |
|
"step": 670 |
|
}, |
|
{ |
|
"epoch": 2.27, |
|
"eval_accuracy": 0.9968029503064392, |
|
"eval_f1": 0.975387168141593, |
|
"eval_loss": 0.018433524295687675, |
|
"eval_precision": 0.9726971869829013, |
|
"eval_recall": 0.9780920687742651, |
|
"eval_runtime": 44.9845, |
|
"eval_samples_per_second": 9.537, |
|
"eval_steps_per_second": 1.601, |
|
"step": 680 |
|
}, |
|
{ |
|
"epoch": 2.31, |
|
"eval_accuracy": 0.9967631530073492, |
|
"eval_f1": 0.9695880564003317, |
|
"eval_loss": 0.018039193004369736, |
|
"eval_precision": 0.9666482910694597, |
|
"eval_recall": 0.9725457570715474, |
|
"eval_runtime": 44.9711, |
|
"eval_samples_per_second": 9.539, |
|
"eval_steps_per_second": 1.601, |
|
"step": 690 |
|
}, |
|
{ |
|
"epoch": 2.34, |
|
"eval_accuracy": 0.9968029503064392, |
|
"eval_f1": 0.9738625363020329, |
|
"eval_loss": 0.01683180034160614, |
|
"eval_precision": 0.9713103448275862, |
|
"eval_recall": 0.9764281752634498, |
|
"eval_runtime": 44.9102, |
|
"eval_samples_per_second": 9.552, |
|
"eval_steps_per_second": 1.603, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 2.37, |
|
"eval_accuracy": 0.9969223422037091, |
|
"eval_f1": 0.9755152856550007, |
|
"eval_loss": 0.01656004600226879, |
|
"eval_precision": 0.9732266077836047, |
|
"eval_recall": 0.9778147531891292, |
|
"eval_runtime": 44.9636, |
|
"eval_samples_per_second": 9.541, |
|
"eval_steps_per_second": 1.601, |
|
"step": 710 |
|
}, |
|
{ |
|
"epoch": 2.41, |
|
"eval_accuracy": 0.9967498872409859, |
|
"eval_f1": 0.973655019412091, |
|
"eval_loss": 0.016868896782398224, |
|
"eval_precision": 0.973655019412091, |
|
"eval_recall": 0.973655019412091, |
|
"eval_runtime": 44.8793, |
|
"eval_samples_per_second": 9.559, |
|
"eval_steps_per_second": 1.604, |
|
"step": 720 |
|
}, |
|
{ |
|
"epoch": 2.44, |
|
"eval_accuracy": 0.9968427476055292, |
|
"eval_f1": 0.975765129483451, |
|
"eval_loss": 0.01695641689002514, |
|
"eval_precision": 0.9745504840940525, |
|
"eval_recall": 0.9769828064337216, |
|
"eval_runtime": 44.9769, |
|
"eval_samples_per_second": 9.538, |
|
"eval_steps_per_second": 1.601, |
|
"step": 730 |
|
}, |
|
{ |
|
"epoch": 2.47, |
|
"eval_accuracy": 0.9966968241755326, |
|
"eval_f1": 0.9696128763701957, |
|
"eval_loss": 0.017096424475312233, |
|
"eval_precision": 0.9702860316578729, |
|
"eval_recall": 0.968940654464781, |
|
"eval_runtime": 45.2584, |
|
"eval_samples_per_second": 9.479, |
|
"eval_steps_per_second": 1.591, |
|
"step": 740 |
|
}, |
|
{ |
|
"epoch": 2.51, |
|
"eval_accuracy": 0.9968294818391659, |
|
"eval_f1": 0.9747992245915259, |
|
"eval_loss": 0.016900014132261276, |
|
"eval_precision": 0.9734513274336283, |
|
"eval_recall": 0.9761508596783139, |
|
"eval_runtime": 44.9939, |
|
"eval_samples_per_second": 9.535, |
|
"eval_steps_per_second": 1.6, |
|
"step": 750 |
|
}, |
|
{ |
|
"epoch": 2.54, |
|
"eval_accuracy": 0.9969090764373458, |
|
"eval_f1": 0.9747992245915259, |
|
"eval_loss": 0.01711142621934414, |
|
"eval_precision": 0.9734513274336283, |
|
"eval_recall": 0.9761508596783139, |
|
"eval_runtime": 44.9916, |
|
"eval_samples_per_second": 9.535, |
|
"eval_steps_per_second": 1.6, |
|
"step": 760 |
|
}, |
|
{ |
|
"epoch": 2.58, |
|
"eval_accuracy": 0.9968029503064392, |
|
"eval_f1": 0.9726957726957727, |
|
"eval_loss": 0.017322950065135956, |
|
"eval_precision": 0.972291493488501, |
|
"eval_recall": 0.9731003882418192, |
|
"eval_runtime": 44.9667, |
|
"eval_samples_per_second": 9.54, |
|
"eval_steps_per_second": 1.601, |
|
"step": 770 |
|
}, |
|
{ |
|
"epoch": 2.61, |
|
"eval_accuracy": 0.9970019368018891, |
|
"eval_f1": 0.9776853776853778, |
|
"eval_loss": 0.015976430848240852, |
|
"eval_precision": 0.9772790246605708, |
|
"eval_recall": 0.9780920687742651, |
|
"eval_runtime": 44.9823, |
|
"eval_samples_per_second": 9.537, |
|
"eval_steps_per_second": 1.601, |
|
"step": 780 |
|
}, |
|
{ |
|
"epoch": 2.64, |
|
"eval_accuracy": 0.9968427476055292, |
|
"eval_f1": 0.9725685785536159, |
|
"eval_loss": 0.016221042722463608, |
|
"eval_precision": 0.9717607973421927, |
|
"eval_recall": 0.9733777038269551, |
|
"eval_runtime": 45.0356, |
|
"eval_samples_per_second": 9.526, |
|
"eval_steps_per_second": 1.599, |
|
"step": 790 |
|
}, |
|
{ |
|
"epoch": 2.68, |
|
"eval_accuracy": 0.9967764187737126, |
|
"eval_f1": 0.9714760454167821, |
|
"eval_loss": 0.016350209712982178, |
|
"eval_precision": 0.9701327433628318, |
|
"eval_recall": 0.9728230726566833, |
|
"eval_runtime": 44.9594, |
|
"eval_samples_per_second": 9.542, |
|
"eval_steps_per_second": 1.601, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 2.71, |
|
"eval_accuracy": 0.9969223422037091, |
|
"eval_f1": 0.9753325942350333, |
|
"eval_loss": 0.0164735559374094, |
|
"eval_precision": 0.974792243767313, |
|
"eval_recall": 0.9758735440931781, |
|
"eval_runtime": 44.8809, |
|
"eval_samples_per_second": 9.559, |
|
"eval_steps_per_second": 1.604, |
|
"step": 810 |
|
}, |
|
{ |
|
"epoch": 2.74, |
|
"eval_accuracy": 0.9968692791382558, |
|
"eval_f1": 0.9754541672444876, |
|
"eval_loss": 0.01638418808579445, |
|
"eval_precision": 0.9755894590846047, |
|
"eval_recall": 0.9753189129229063, |
|
"eval_runtime": 45.2809, |
|
"eval_samples_per_second": 9.474, |
|
"eval_steps_per_second": 1.59, |
|
"step": 820 |
|
}, |
|
{ |
|
"epoch": 2.78, |
|
"eval_accuracy": 0.9951712610437505, |
|
"eval_f1": 0.9239864864864865, |
|
"eval_loss": 0.0193793848156929, |
|
"eval_precision": 0.9382504288164666, |
|
"eval_recall": 0.9101497504159733, |
|
"eval_runtime": 44.9984, |
|
"eval_samples_per_second": 9.534, |
|
"eval_steps_per_second": 1.6, |
|
"step": 830 |
|
}, |
|
{ |
|
"epoch": 2.81, |
|
"eval_accuracy": 0.9971213286991589, |
|
"eval_f1": 0.979071379071379, |
|
"eval_loss": 0.015317755751311779, |
|
"eval_precision": 0.9786644499861458, |
|
"eval_recall": 0.9794786466999446, |
|
"eval_runtime": 44.8121, |
|
"eval_samples_per_second": 9.573, |
|
"eval_steps_per_second": 1.607, |
|
"step": 840 |
|
}, |
|
{ |
|
"epoch": 2.84, |
|
"eval_accuracy": 0.9968825449046191, |
|
"eval_f1": 0.9747712780704185, |
|
"eval_loss": 0.016130488365888596, |
|
"eval_precision": 0.9745011086474501, |
|
"eval_recall": 0.9750415973377704, |
|
"eval_runtime": 44.9246, |
|
"eval_samples_per_second": 9.549, |
|
"eval_steps_per_second": 1.603, |
|
"step": 850 |
|
}, |
|
{ |
|
"epoch": 2.88, |
|
"eval_accuracy": 0.9965111034464461, |
|
"eval_f1": 0.9585304759254106, |
|
"eval_loss": 0.017094574868679047, |
|
"eval_precision": 0.9620111731843576, |
|
"eval_recall": 0.9550748752079867, |
|
"eval_runtime": 44.9689, |
|
"eval_samples_per_second": 9.54, |
|
"eval_steps_per_second": 1.601, |
|
"step": 860 |
|
}, |
|
{ |
|
"epoch": 2.91, |
|
"eval_accuracy": 0.997041734100979, |
|
"eval_f1": 0.9767634854771784, |
|
"eval_loss": 0.016324549913406372, |
|
"eval_precision": 0.9743377483443708, |
|
"eval_recall": 0.9792013311148087, |
|
"eval_runtime": 44.9212, |
|
"eval_samples_per_second": 9.55, |
|
"eval_steps_per_second": 1.603, |
|
"step": 870 |
|
}, |
|
{ |
|
"epoch": 2.94, |
|
"eval_accuracy": 0.9970284683346157, |
|
"eval_f1": 0.9753394292047659, |
|
"eval_loss": 0.016577888280153275, |
|
"eval_precision": 0.9745293466223699, |
|
"eval_recall": 0.9761508596783139, |
|
"eval_runtime": 45.0626, |
|
"eval_samples_per_second": 9.52, |
|
"eval_steps_per_second": 1.598, |
|
"step": 880 |
|
}, |
|
{ |
|
"epoch": 2.98, |
|
"eval_accuracy": 0.9968560133718924, |
|
"eval_f1": 0.9743589743589743, |
|
"eval_loss": 0.01666262373328209, |
|
"eval_precision": 0.973954003879191, |
|
"eval_recall": 0.9747642817526345, |
|
"eval_runtime": 44.929, |
|
"eval_samples_per_second": 9.548, |
|
"eval_steps_per_second": 1.603, |
|
"step": 890 |
|
}, |
|
{ |
|
"epoch": 3.01, |
|
"eval_accuracy": 0.9966570268764426, |
|
"eval_f1": 0.9715396362626684, |
|
"eval_loss": 0.01778605580329895, |
|
"eval_precision": 0.9727550736725049, |
|
"eval_recall": 0.9703272323904604, |
|
"eval_runtime": 44.9166, |
|
"eval_samples_per_second": 9.551, |
|
"eval_steps_per_second": 1.603, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 3.04, |
|
"eval_accuracy": 0.9970815314000689, |
|
"eval_f1": 0.9786407766990292, |
|
"eval_loss": 0.016635755077004433, |
|
"eval_precision": 0.978912319644839, |
|
"eval_recall": 0.978369384359401, |
|
"eval_runtime": 45.1716, |
|
"eval_samples_per_second": 9.497, |
|
"eval_steps_per_second": 1.594, |
|
"step": 910 |
|
}, |
|
{ |
|
"epoch": 3.08, |
|
"eval_accuracy": 0.9971478602318856, |
|
"eval_f1": 0.9811529933481152, |
|
"eval_loss": 0.01662967912852764, |
|
"eval_precision": 0.9806094182825484, |
|
"eval_recall": 0.9816971713810316, |
|
"eval_runtime": 44.9112, |
|
"eval_samples_per_second": 9.552, |
|
"eval_steps_per_second": 1.603, |
|
"step": 920 |
|
}, |
|
{ |
|
"epoch": 3.11, |
|
"eval_accuracy": 0.9969488737364357, |
|
"eval_f1": 0.9753052164261932, |
|
"eval_loss": 0.016620052978396416, |
|
"eval_precision": 0.975846751804553, |
|
"eval_recall": 0.9747642817526345, |
|
"eval_runtime": 44.9363, |
|
"eval_samples_per_second": 9.547, |
|
"eval_steps_per_second": 1.602, |
|
"step": 930 |
|
}, |
|
{ |
|
"epoch": 3.14, |
|
"eval_accuracy": 0.9972407205964289, |
|
"eval_f1": 0.9815508392287419, |
|
"eval_loss": 0.015619627200067043, |
|
"eval_precision": 0.9819594782126007, |
|
"eval_recall": 0.9811425402107599, |
|
"eval_runtime": 44.9174, |
|
"eval_samples_per_second": 9.551, |
|
"eval_steps_per_second": 1.603, |
|
"step": 940 |
|
}, |
|
{ |
|
"epoch": 3.18, |
|
"eval_accuracy": 0.9970947971664323, |
|
"eval_f1": 0.9779442363712026, |
|
"eval_loss": 0.015341303311288357, |
|
"eval_precision": 0.9783513738551207, |
|
"eval_recall": 0.9775374376039934, |
|
"eval_runtime": 45.0123, |
|
"eval_samples_per_second": 9.531, |
|
"eval_steps_per_second": 1.6, |
|
"step": 950 |
|
}, |
|
{ |
|
"epoch": 3.21, |
|
"eval_accuracy": 0.9968692791382558, |
|
"eval_f1": 0.9764281752634498, |
|
"eval_loss": 0.01650950312614441, |
|
"eval_precision": 0.9764281752634498, |
|
"eval_recall": 0.9764281752634498, |
|
"eval_runtime": 44.93, |
|
"eval_samples_per_second": 9.548, |
|
"eval_steps_per_second": 1.602, |
|
"step": 960 |
|
}, |
|
{ |
|
"epoch": 3.24, |
|
"eval_accuracy": 0.9968692791382558, |
|
"eval_f1": 0.9774144381321879, |
|
"eval_loss": 0.01659621112048626, |
|
"eval_precision": 0.9767377457767932, |
|
"eval_recall": 0.9780920687742651, |
|
"eval_runtime": 44.9897, |
|
"eval_samples_per_second": 9.536, |
|
"eval_steps_per_second": 1.6, |
|
"step": 970 |
|
}, |
|
{ |
|
"epoch": 3.28, |
|
"eval_accuracy": 0.9967498872409859, |
|
"eval_f1": 0.9746572496884087, |
|
"eval_loss": 0.016826625913381577, |
|
"eval_precision": 0.9734439834024896, |
|
"eval_recall": 0.9758735440931781, |
|
"eval_runtime": 45.2137, |
|
"eval_samples_per_second": 9.488, |
|
"eval_steps_per_second": 1.592, |
|
"step": 980 |
|
}, |
|
{ |
|
"epoch": 3.31, |
|
"eval_accuracy": 0.9968958106709824, |
|
"eval_f1": 0.978146611341632, |
|
"eval_loss": 0.016263196244835854, |
|
"eval_precision": 0.9757174392935982, |
|
"eval_recall": 0.9805879090404881, |
|
"eval_runtime": 44.9271, |
|
"eval_samples_per_second": 9.549, |
|
"eval_steps_per_second": 1.603, |
|
"step": 990 |
|
}, |
|
{ |
|
"epoch": 3.34, |
|
"learning_rate": 9e-06, |
|
"loss": 0.0154, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 3.34, |
|
"eval_accuracy": 0.9968294818391659, |
|
"eval_f1": 0.9775809576529201, |
|
"eval_loss": 0.016901057213544846, |
|
"eval_precision": 0.9756906077348066, |
|
"eval_recall": 0.9794786466999446, |
|
"eval_runtime": 44.996, |
|
"eval_samples_per_second": 9.534, |
|
"eval_steps_per_second": 1.6, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 3.38, |
|
"eval_accuracy": 0.997041734100979, |
|
"eval_f1": 0.9803269603768356, |
|
"eval_loss": 0.01609906367957592, |
|
"eval_precision": 0.9795127353266888, |
|
"eval_recall": 0.9811425402107599, |
|
"eval_runtime": 45.3202, |
|
"eval_samples_per_second": 9.466, |
|
"eval_steps_per_second": 1.589, |
|
"step": 1010 |
|
}, |
|
{ |
|
"epoch": 3.41, |
|
"eval_accuracy": 0.9968692791382558, |
|
"eval_f1": 0.977993079584775, |
|
"eval_loss": 0.016519052907824516, |
|
"eval_precision": 0.9762365294280188, |
|
"eval_recall": 0.9797559622850804, |
|
"eval_runtime": 45.0574, |
|
"eval_samples_per_second": 9.521, |
|
"eval_steps_per_second": 1.598, |
|
"step": 1020 |
|
}, |
|
{ |
|
"epoch": 3.44, |
|
"eval_accuracy": 0.9967233557082593, |
|
"eval_f1": 0.9722530521642619, |
|
"eval_loss": 0.01666153408586979, |
|
"eval_precision": 0.9727928928373126, |
|
"eval_recall": 0.9717138103161398, |
|
"eval_runtime": 45.0201, |
|
"eval_samples_per_second": 9.529, |
|
"eval_steps_per_second": 1.599, |
|
"step": 1030 |
|
}, |
|
{ |
|
"epoch": 3.48, |
|
"eval_accuracy": 0.9969090764373458, |
|
"eval_f1": 0.9761640798226164, |
|
"eval_loss": 0.015780288726091385, |
|
"eval_precision": 0.9756232686980609, |
|
"eval_recall": 0.9767054908485857, |
|
"eval_runtime": 45.2347, |
|
"eval_samples_per_second": 9.484, |
|
"eval_steps_per_second": 1.592, |
|
"step": 1040 |
|
}, |
|
{ |
|
"epoch": 3.51, |
|
"eval_accuracy": 0.9968958106709824, |
|
"eval_f1": 0.9766284054764209, |
|
"eval_loss": 0.015381171368062496, |
|
"eval_precision": 0.9740689655172414, |
|
"eval_recall": 0.9792013311148087, |
|
"eval_runtime": 45.2769, |
|
"eval_samples_per_second": 9.475, |
|
"eval_steps_per_second": 1.59, |
|
"step": 1050 |
|
}, |
|
{ |
|
"epoch": 3.55, |
|
"eval_accuracy": 0.9959804727919132, |
|
"eval_f1": 0.9448555074689375, |
|
"eval_loss": 0.01652899943292141, |
|
"eval_precision": 0.9513635085746416, |
|
"eval_recall": 0.9384359400998337, |
|
"eval_runtime": 45.1375, |
|
"eval_samples_per_second": 9.504, |
|
"eval_steps_per_second": 1.595, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 3.58, |
|
"eval_accuracy": 0.9968825449046191, |
|
"eval_f1": 0.9749619587771476, |
|
"eval_loss": 0.015719007700681686, |
|
"eval_precision": 0.9726745790781121, |
|
"eval_recall": 0.9772601220188575, |
|
"eval_runtime": 45.0215, |
|
"eval_samples_per_second": 9.529, |
|
"eval_steps_per_second": 1.599, |
|
"step": 1070 |
|
}, |
|
{ |
|
"epoch": 3.61, |
|
"eval_accuracy": 0.9968692791382558, |
|
"eval_f1": 0.9782458085076902, |
|
"eval_loss": 0.01600920408964157, |
|
"eval_precision": 0.977568540570479, |
|
"eval_recall": 0.9789240155296728, |
|
"eval_runtime": 45.1658, |
|
"eval_samples_per_second": 9.498, |
|
"eval_steps_per_second": 1.594, |
|
"step": 1080 |
|
}, |
|
{ |
|
"epoch": 3.65, |
|
"eval_accuracy": 0.99580801782919, |
|
"eval_f1": 0.9429732380552053, |
|
"eval_loss": 0.01786983013153076, |
|
"eval_precision": 0.9529878221467006, |
|
"eval_recall": 0.9331669439822518, |
|
"eval_runtime": 45.14, |
|
"eval_samples_per_second": 9.504, |
|
"eval_steps_per_second": 1.595, |
|
"step": 1090 |
|
}, |
|
{ |
|
"epoch": 3.68, |
|
"eval_accuracy": 0.9968692791382558, |
|
"eval_f1": 0.977439446366782, |
|
"eval_loss": 0.015765171498060226, |
|
"eval_precision": 0.9756838905775076, |
|
"eval_recall": 0.9792013311148087, |
|
"eval_runtime": 45.1016, |
|
"eval_samples_per_second": 9.512, |
|
"eval_steps_per_second": 1.596, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 3.71, |
|
"eval_accuracy": 0.9968958106709824, |
|
"eval_f1": 0.977703919124775, |
|
"eval_loss": 0.015863990411162376, |
|
"eval_precision": 0.9764868603042877, |
|
"eval_recall": 0.9789240155296728, |
|
"eval_runtime": 45.1212, |
|
"eval_samples_per_second": 9.508, |
|
"eval_steps_per_second": 1.596, |
|
"step": 1110 |
|
}, |
|
{ |
|
"epoch": 3.75, |
|
"eval_accuracy": 0.9969621395027991, |
|
"eval_f1": 0.975609756097561, |
|
"eval_loss": 0.01584913209080696, |
|
"eval_precision": 0.9750692520775623, |
|
"eval_recall": 0.9761508596783139, |
|
"eval_runtime": 45.0612, |
|
"eval_samples_per_second": 9.52, |
|
"eval_steps_per_second": 1.598, |
|
"step": 1120 |
|
}, |
|
{ |
|
"epoch": 3.78, |
|
"eval_accuracy": 0.9969488737364357, |
|
"eval_f1": 0.9744869661674986, |
|
"eval_loss": 0.01588474027812481, |
|
"eval_precision": 0.9744869661674986, |
|
"eval_recall": 0.9744869661674986, |
|
"eval_runtime": 45.3578, |
|
"eval_samples_per_second": 9.458, |
|
"eval_steps_per_second": 1.587, |
|
"step": 1130 |
|
}, |
|
{ |
|
"epoch": 3.81, |
|
"eval_accuracy": 0.9968958106709824, |
|
"eval_f1": 0.9752846431546792, |
|
"eval_loss": 0.016261184588074684, |
|
"eval_precision": 0.9766407119021134, |
|
"eval_recall": 0.9739323349972269, |
|
"eval_runtime": 45.1022, |
|
"eval_samples_per_second": 9.512, |
|
"eval_steps_per_second": 1.596, |
|
"step": 1140 |
|
}, |
|
{ |
|
"epoch": 3.85, |
|
"eval_accuracy": 0.9967100899418959, |
|
"eval_f1": 0.9723145071982281, |
|
"eval_loss": 0.016805831342935562, |
|
"eval_precision": 0.970702045328911, |
|
"eval_recall": 0.9739323349972269, |
|
"eval_runtime": 45.1109, |
|
"eval_samples_per_second": 9.51, |
|
"eval_steps_per_second": 1.596, |
|
"step": 1150 |
|
}, |
|
{ |
|
"epoch": 3.88, |
|
"eval_accuracy": 0.9970152025682524, |
|
"eval_f1": 0.9805771365149833, |
|
"eval_loss": 0.01488415990024805, |
|
"eval_precision": 0.9811215991116047, |
|
"eval_recall": 0.9800332778702163, |
|
"eval_runtime": 45.1408, |
|
"eval_samples_per_second": 9.504, |
|
"eval_steps_per_second": 1.595, |
|
"step": 1160 |
|
}, |
|
{ |
|
"epoch": 3.91, |
|
"eval_accuracy": 0.9970152025682524, |
|
"eval_f1": 0.9792531120331951, |
|
"eval_loss": 0.014714999124407768, |
|
"eval_precision": 0.9768211920529801, |
|
"eval_recall": 0.9816971713810316, |
|
"eval_runtime": 45.0991, |
|
"eval_samples_per_second": 9.512, |
|
"eval_steps_per_second": 1.596, |
|
"step": 1170 |
|
}, |
|
{ |
|
"epoch": 3.95, |
|
"eval_accuracy": 0.9969754052691624, |
|
"eval_f1": 0.9757986447241046, |
|
"eval_loss": 0.01566295139491558, |
|
"eval_precision": 0.9732413793103448, |
|
"eval_recall": 0.978369384359401, |
|
"eval_runtime": 45.1028, |
|
"eval_samples_per_second": 9.512, |
|
"eval_steps_per_second": 1.596, |
|
"step": 1180 |
|
}, |
|
{ |
|
"epoch": 3.98, |
|
"eval_accuracy": 0.9969886710355257, |
|
"eval_f1": 0.9786880708552449, |
|
"eval_loss": 0.015323741361498833, |
|
"eval_precision": 0.9767955801104973, |
|
"eval_recall": 0.9805879090404881, |
|
"eval_runtime": 45.1524, |
|
"eval_samples_per_second": 9.501, |
|
"eval_steps_per_second": 1.595, |
|
"step": 1190 |
|
}, |
|
{ |
|
"epoch": 4.01, |
|
"eval_accuracy": 0.9968692791382558, |
|
"eval_f1": 0.9747642817526345, |
|
"eval_loss": 0.015690365806221962, |
|
"eval_precision": 0.9747642817526345, |
|
"eval_recall": 0.9747642817526345, |
|
"eval_runtime": 45.1208, |
|
"eval_samples_per_second": 9.508, |
|
"eval_steps_per_second": 1.596, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 4.05, |
|
"eval_accuracy": 0.9970549998673424, |
|
"eval_f1": 0.9797783933518006, |
|
"eval_loss": 0.015430403873324394, |
|
"eval_precision": 0.978693967902601, |
|
"eval_recall": 0.980865224625624, |
|
"eval_runtime": 45.032, |
|
"eval_samples_per_second": 9.527, |
|
"eval_steps_per_second": 1.599, |
|
"step": 1210 |
|
}, |
|
{ |
|
"epoch": 4.08, |
|
"eval_accuracy": 0.997041734100979, |
|
"eval_f1": 0.9780052566053397, |
|
"eval_loss": 0.0156533382833004, |
|
"eval_precision": 0.9757107369583218, |
|
"eval_recall": 0.9803105934553522, |
|
"eval_runtime": 45.2988, |
|
"eval_samples_per_second": 9.47, |
|
"eval_steps_per_second": 1.589, |
|
"step": 1220 |
|
}, |
|
{ |
|
"epoch": 4.11, |
|
"eval_accuracy": 0.9968958106709824, |
|
"eval_f1": 0.9735493698933665, |
|
"eval_loss": 0.016326196491718292, |
|
"eval_precision": 0.9723374827109267, |
|
"eval_recall": 0.9747642817526345, |
|
"eval_runtime": 45.0756, |
|
"eval_samples_per_second": 9.517, |
|
"eval_steps_per_second": 1.597, |
|
"step": 1230 |
|
}, |
|
{ |
|
"epoch": 4.15, |
|
"eval_accuracy": 0.997041734100979, |
|
"eval_f1": 0.9778699861687413, |
|
"eval_loss": 0.015600275248289108, |
|
"eval_precision": 0.9754415011037527, |
|
"eval_recall": 0.9803105934553522, |
|
"eval_runtime": 44.9579, |
|
"eval_samples_per_second": 9.542, |
|
"eval_steps_per_second": 1.601, |
|
"step": 1240 |
|
}, |
|
{ |
|
"epoch": 4.18, |
|
"eval_accuracy": 0.9970152025682524, |
|
"eval_f1": 0.9774331995015921, |
|
"eval_loss": 0.015862880274653435, |
|
"eval_precision": 0.9759469173348079, |
|
"eval_recall": 0.9789240155296728, |
|
"eval_runtime": 45.0784, |
|
"eval_samples_per_second": 9.517, |
|
"eval_steps_per_second": 1.597, |
|
"step": 1250 |
|
}, |
|
{ |
|
"epoch": 4.21, |
|
"eval_accuracy": 0.9970284683346157, |
|
"eval_f1": 0.9802076124567475, |
|
"eval_loss": 0.01617247611284256, |
|
"eval_precision": 0.9784470848300636, |
|
"eval_recall": 0.9819744869661675, |
|
"eval_runtime": 45.0516, |
|
"eval_samples_per_second": 9.522, |
|
"eval_steps_per_second": 1.598, |
|
"step": 1260 |
|
}, |
|
{ |
|
"epoch": 4.25, |
|
"eval_accuracy": 0.9970815314000689, |
|
"eval_f1": 0.978146611341632, |
|
"eval_loss": 0.016013789921998978, |
|
"eval_precision": 0.9757174392935982, |
|
"eval_recall": 0.9805879090404881, |
|
"eval_runtime": 45.1173, |
|
"eval_samples_per_second": 9.509, |
|
"eval_steps_per_second": 1.596, |
|
"step": 1270 |
|
}, |
|
{ |
|
"epoch": 4.28, |
|
"eval_accuracy": 0.9968560133718924, |
|
"eval_f1": 0.9744157101369105, |
|
"eval_loss": 0.01655399613082409, |
|
"eval_precision": 0.9718620689655172, |
|
"eval_recall": 0.9769828064337216, |
|
"eval_runtime": 45.0171, |
|
"eval_samples_per_second": 9.53, |
|
"eval_steps_per_second": 1.599, |
|
"step": 1280 |
|
}, |
|
{ |
|
"epoch": 4.31, |
|
"eval_accuracy": 0.9971080629327956, |
|
"eval_f1": 0.9793600221637346, |
|
"eval_loss": 0.015200940892100334, |
|
"eval_precision": 0.9784112925546637, |
|
"eval_recall": 0.9803105934553522, |
|
"eval_runtime": 45.0877, |
|
"eval_samples_per_second": 9.515, |
|
"eval_steps_per_second": 1.597, |
|
"step": 1290 |
|
}, |
|
{ |
|
"epoch": 4.35, |
|
"eval_accuracy": 0.9968294818391659, |
|
"eval_f1": 0.9751175006911805, |
|
"eval_loss": 0.016674669459462166, |
|
"eval_precision": 0.9721609702315325, |
|
"eval_recall": 0.9780920687742651, |
|
"eval_runtime": 45.3184, |
|
"eval_samples_per_second": 9.466, |
|
"eval_steps_per_second": 1.589, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 4.38, |
|
"eval_accuracy": 0.9968294818391659, |
|
"eval_f1": 0.9766413268832067, |
|
"eval_loss": 0.01657554879784584, |
|
"eval_precision": 0.9735464315238358, |
|
"eval_recall": 0.9797559622850804, |
|
"eval_runtime": 45.1144, |
|
"eval_samples_per_second": 9.509, |
|
"eval_steps_per_second": 1.596, |
|
"step": 1310 |
|
}, |
|
{ |
|
"epoch": 4.41, |
|
"eval_accuracy": 0.9968958106709824, |
|
"eval_f1": 0.9781586950511474, |
|
"eval_loss": 0.016078708693385124, |
|
"eval_precision": 0.9751929437706726, |
|
"eval_recall": 0.9811425402107599, |
|
"eval_runtime": 45.1076, |
|
"eval_samples_per_second": 9.511, |
|
"eval_steps_per_second": 1.596, |
|
"step": 1320 |
|
}, |
|
{ |
|
"epoch": 4.45, |
|
"eval_accuracy": 0.9967764187737126, |
|
"eval_f1": 0.9739251040221916, |
|
"eval_loss": 0.015717538073658943, |
|
"eval_precision": 0.9741953385127636, |
|
"eval_recall": 0.973655019412091, |
|
"eval_runtime": 45.0205, |
|
"eval_samples_per_second": 9.529, |
|
"eval_steps_per_second": 1.599, |
|
"step": 1330 |
|
}, |
|
{ |
|
"epoch": 4.48, |
|
"eval_accuracy": 0.9968692791382558, |
|
"eval_f1": 0.9795127353266887, |
|
"eval_loss": 0.015196431428194046, |
|
"eval_precision": 0.9778883360972913, |
|
"eval_recall": 0.9811425402107599, |
|
"eval_runtime": 45.4378, |
|
"eval_samples_per_second": 9.441, |
|
"eval_steps_per_second": 1.585, |
|
"step": 1340 |
|
}, |
|
{ |
|
"epoch": 4.52, |
|
"eval_accuracy": 0.9967233557082593, |
|
"eval_f1": 0.971064654575661, |
|
"eval_loss": 0.015703538432717323, |
|
"eval_precision": 0.9695880564003317, |
|
"eval_recall": 0.9725457570715474, |
|
"eval_runtime": 45.4022, |
|
"eval_samples_per_second": 9.449, |
|
"eval_steps_per_second": 1.586, |
|
"step": 1350 |
|
}, |
|
{ |
|
"epoch": 4.55, |
|
"eval_accuracy": 0.9968162160728026, |
|
"eval_f1": 0.9755828390122776, |
|
"eval_loss": 0.015339327044785023, |
|
"eval_precision": 0.9706286027998902, |
|
"eval_recall": 0.9805879090404881, |
|
"eval_runtime": 45.4342, |
|
"eval_samples_per_second": 9.442, |
|
"eval_steps_per_second": 1.585, |
|
"step": 1360 |
|
}, |
|
{ |
|
"epoch": 4.58, |
|
"eval_accuracy": 0.9968692791382558, |
|
"eval_f1": 0.9758587391364325, |
|
"eval_loss": 0.015390865504741669, |
|
"eval_precision": 0.9709031018391435, |
|
"eval_recall": 0.980865224625624, |
|
"eval_runtime": 45.7337, |
|
"eval_samples_per_second": 9.38, |
|
"eval_steps_per_second": 1.574, |
|
"step": 1370 |
|
}, |
|
{ |
|
"epoch": 4.62, |
|
"eval_accuracy": 0.9969886710355257, |
|
"eval_f1": 0.9785822854774078, |
|
"eval_loss": 0.015035979449748993, |
|
"eval_precision": 0.97521343982374, |
|
"eval_recall": 0.9819744869661675, |
|
"eval_runtime": 45.4663, |
|
"eval_samples_per_second": 9.436, |
|
"eval_steps_per_second": 1.584, |
|
"step": 1380 |
|
}, |
|
{ |
|
"epoch": 4.65, |
|
"eval_accuracy": 0.9970682656337057, |
|
"eval_f1": 0.9809234171965718, |
|
"eval_loss": 0.014896390959620476, |
|
"eval_precision": 0.9779492833517089, |
|
"eval_recall": 0.9839156960621187, |
|
"eval_runtime": 45.0989, |
|
"eval_samples_per_second": 9.512, |
|
"eval_steps_per_second": 1.596, |
|
"step": 1390 |
|
}, |
|
{ |
|
"epoch": 4.68, |
|
"eval_accuracy": 0.9968560133718924, |
|
"eval_f1": 0.9768339768339769, |
|
"eval_loss": 0.015806537121534348, |
|
"eval_precision": 0.9714755896873286, |
|
"eval_recall": 0.9822518025513034, |
|
"eval_runtime": 45.0416, |
|
"eval_samples_per_second": 9.525, |
|
"eval_steps_per_second": 1.599, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 4.72, |
|
"eval_accuracy": 0.997041734100979, |
|
"eval_f1": 0.9778761061946902, |
|
"eval_loss": 0.015140415169298649, |
|
"eval_precision": 0.9751792608935466, |
|
"eval_recall": 0.9805879090404881, |
|
"eval_runtime": 45.6611, |
|
"eval_samples_per_second": 9.395, |
|
"eval_steps_per_second": 1.577, |
|
"step": 1410 |
|
}, |
|
{ |
|
"epoch": 4.75, |
|
"eval_accuracy": 0.9970549998673424, |
|
"eval_f1": 0.9795353982300885, |
|
"eval_loss": 0.015615841373801231, |
|
"eval_precision": 0.9768339768339769, |
|
"eval_recall": 0.9822518025513034, |
|
"eval_runtime": 45.3516, |
|
"eval_samples_per_second": 9.459, |
|
"eval_steps_per_second": 1.588, |
|
"step": 1420 |
|
}, |
|
{ |
|
"epoch": 4.78, |
|
"eval_accuracy": 0.9971876575309756, |
|
"eval_f1": 0.9802240354031254, |
|
"eval_loss": 0.015609286725521088, |
|
"eval_precision": 0.9776551724137931, |
|
"eval_recall": 0.9828064337215752, |
|
"eval_runtime": 45.8817, |
|
"eval_samples_per_second": 9.35, |
|
"eval_steps_per_second": 1.569, |
|
"step": 1430 |
|
}, |
|
{ |
|
"epoch": 4.82, |
|
"eval_accuracy": 0.997041734100979, |
|
"eval_f1": 0.980777209238003, |
|
"eval_loss": 0.015975775197148323, |
|
"eval_precision": 0.9782068965517241, |
|
"eval_recall": 0.9833610648918469, |
|
"eval_runtime": 45.1602, |
|
"eval_samples_per_second": 9.5, |
|
"eval_steps_per_second": 1.594, |
|
"step": 1440 |
|
}, |
|
{ |
|
"epoch": 4.85, |
|
"eval_accuracy": 0.9970682656337057, |
|
"eval_f1": 0.9810642709053213, |
|
"eval_loss": 0.015114562585949898, |
|
"eval_precision": 0.9779553596031965, |
|
"eval_recall": 0.9841930116472546, |
|
"eval_runtime": 45.0898, |
|
"eval_samples_per_second": 9.514, |
|
"eval_steps_per_second": 1.597, |
|
"step": 1450 |
|
}, |
|
{ |
|
"epoch": 4.88, |
|
"eval_accuracy": 0.9970549998673424, |
|
"eval_f1": 0.9806576402321082, |
|
"eval_loss": 0.01497586164623499, |
|
"eval_precision": 0.977147577092511, |
|
"eval_recall": 0.9841930116472546, |
|
"eval_runtime": 47.111, |
|
"eval_samples_per_second": 9.106, |
|
"eval_steps_per_second": 1.528, |
|
"step": 1460 |
|
}, |
|
{ |
|
"epoch": 4.92, |
|
"eval_accuracy": 0.9970284683346157, |
|
"eval_f1": 0.9779005524861878, |
|
"eval_loss": 0.014804758131504059, |
|
"eval_precision": 0.9741331865712713, |
|
"eval_recall": 0.9816971713810316, |
|
"eval_runtime": 45.7757, |
|
"eval_samples_per_second": 9.372, |
|
"eval_steps_per_second": 1.573, |
|
"step": 1470 |
|
}, |
|
{ |
|
"epoch": 4.95, |
|
"eval_accuracy": 0.9969621395027991, |
|
"eval_f1": 0.9767634854771784, |
|
"eval_loss": 0.015325279906392097, |
|
"eval_precision": 0.9743377483443708, |
|
"eval_recall": 0.9792013311148087, |
|
"eval_runtime": 45.788, |
|
"eval_samples_per_second": 9.369, |
|
"eval_steps_per_second": 1.572, |
|
"step": 1480 |
|
}, |
|
{ |
|
"epoch": 4.98, |
|
"eval_accuracy": 0.9970947971664323, |
|
"eval_f1": 0.9820143884892086, |
|
"eval_loss": 0.014990455470979214, |
|
"eval_precision": 0.9798453892876864, |
|
"eval_recall": 0.9841930116472546, |
|
"eval_runtime": 45.1213, |
|
"eval_samples_per_second": 9.508, |
|
"eval_steps_per_second": 1.596, |
|
"step": 1490 |
|
}, |
|
{ |
|
"epoch": 5.02, |
|
"learning_rate": 8.5e-06, |
|
"loss": 0.0081, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 5.02, |
|
"eval_accuracy": 0.9970947971664323, |
|
"eval_f1": 0.9796821008984106, |
|
"eval_loss": 0.01517151016741991, |
|
"eval_precision": 0.9765775695783963, |
|
"eval_recall": 0.9828064337215752, |
|
"eval_runtime": 45.193, |
|
"eval_samples_per_second": 9.493, |
|
"eval_steps_per_second": 1.593, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 5.05, |
|
"eval_accuracy": 0.9967366214746226, |
|
"eval_f1": 0.9682408174537421, |
|
"eval_loss": 0.01580970361828804, |
|
"eval_precision": 0.9642464246424642, |
|
"eval_recall": 0.9722684414864116, |
|
"eval_runtime": 45.4381, |
|
"eval_samples_per_second": 9.441, |
|
"eval_steps_per_second": 1.585, |
|
"step": 1510 |
|
}, |
|
{ |
|
"epoch": 5.08, |
|
"eval_accuracy": 0.9966702926428059, |
|
"eval_f1": 0.9666759233546237, |
|
"eval_loss": 0.01570785790681839, |
|
"eval_precision": 0.9680200222469411, |
|
"eval_recall": 0.9653355518580145, |
|
"eval_runtime": 45.4491, |
|
"eval_samples_per_second": 9.439, |
|
"eval_steps_per_second": 1.584, |
|
"step": 1520 |
|
}, |
|
{ |
|
"epoch": 5.12, |
|
"eval_accuracy": 0.9969886710355257, |
|
"eval_f1": 0.9800388134183532, |
|
"eval_loss": 0.015114962123334408, |
|
"eval_precision": 0.9797671840354767, |
|
"eval_recall": 0.9803105934553522, |
|
"eval_runtime": 45.1961, |
|
"eval_samples_per_second": 9.492, |
|
"eval_steps_per_second": 1.593, |
|
"step": 1530 |
|
}, |
|
{ |
|
"epoch": 5.15, |
|
"eval_accuracy": 0.9970815314000689, |
|
"eval_f1": 0.9818835569077582, |
|
"eval_loss": 0.01481586042791605, |
|
"eval_precision": 0.9793103448275862, |
|
"eval_recall": 0.9844703272323905, |
|
"eval_runtime": 45.6531, |
|
"eval_samples_per_second": 9.397, |
|
"eval_steps_per_second": 1.577, |
|
"step": 1540 |
|
}, |
|
{ |
|
"epoch": 5.18, |
|
"eval_accuracy": 0.9971478602318856, |
|
"eval_f1": 0.9807878369039392, |
|
"eval_loss": 0.014275978319346905, |
|
"eval_precision": 0.9776798015982364, |
|
"eval_recall": 0.9839156960621187, |
|
"eval_runtime": 45.7198, |
|
"eval_samples_per_second": 9.383, |
|
"eval_steps_per_second": 1.575, |
|
"step": 1550 |
|
}, |
|
{ |
|
"epoch": 5.22, |
|
"eval_accuracy": 0.9970682656337057, |
|
"eval_f1": 0.9792703150912107, |
|
"eval_loss": 0.01468308549374342, |
|
"eval_precision": 0.9760330578512396, |
|
"eval_recall": 0.9825291181364393, |
|
"eval_runtime": 45.5952, |
|
"eval_samples_per_second": 9.409, |
|
"eval_steps_per_second": 1.579, |
|
"step": 1560 |
|
}, |
|
{ |
|
"epoch": 5.25, |
|
"eval_accuracy": 0.9970947971664323, |
|
"eval_f1": 0.9810695039380959, |
|
"eval_loss": 0.014422405511140823, |
|
"eval_precision": 0.977692095841366, |
|
"eval_recall": 0.9844703272323905, |
|
"eval_runtime": 45.732, |
|
"eval_samples_per_second": 9.381, |
|
"eval_steps_per_second": 1.574, |
|
"step": 1570 |
|
}, |
|
{ |
|
"epoch": 5.28, |
|
"eval_accuracy": 0.9970947971664323, |
|
"eval_f1": 0.9809075816270061, |
|
"eval_loss": 0.01434118952602148, |
|
"eval_precision": 0.9787410270568746, |
|
"eval_recall": 0.983083749306711, |
|
"eval_runtime": 45.5148, |
|
"eval_samples_per_second": 9.425, |
|
"eval_steps_per_second": 1.582, |
|
"step": 1580 |
|
}, |
|
{ |
|
"epoch": 5.32, |
|
"eval_accuracy": 0.9970019368018891, |
|
"eval_f1": 0.9791350006908941, |
|
"eval_loss": 0.014856048859655857, |
|
"eval_precision": 0.9757642522721014, |
|
"eval_recall": 0.9825291181364393, |
|
"eval_runtime": 46.2893, |
|
"eval_samples_per_second": 9.268, |
|
"eval_steps_per_second": 1.555, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 5.35, |
|
"eval_accuracy": 0.9970549998673424, |
|
"eval_f1": 0.9803541781959049, |
|
"eval_loss": 0.015461008064448833, |
|
"eval_precision": 0.9781888459414688, |
|
"eval_recall": 0.9825291181364393, |
|
"eval_runtime": 45.2253, |
|
"eval_samples_per_second": 9.486, |
|
"eval_steps_per_second": 1.592, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 5.38, |
|
"eval_accuracy": 0.9970549998673424, |
|
"eval_f1": 0.9800884955752212, |
|
"eval_loss": 0.01574764773249626, |
|
"eval_precision": 0.9773855488141202, |
|
"eval_recall": 0.9828064337215752, |
|
"eval_runtime": 45.056, |
|
"eval_samples_per_second": 9.521, |
|
"eval_steps_per_second": 1.598, |
|
"step": 1610 |
|
}, |
|
{ |
|
"epoch": 5.42, |
|
"eval_accuracy": 0.997041734100979, |
|
"eval_f1": 0.9792645839093173, |
|
"eval_loss": 0.015540325082838535, |
|
"eval_precision": 0.976295479603087, |
|
"eval_recall": 0.9822518025513034, |
|
"eval_runtime": 45.1752, |
|
"eval_samples_per_second": 9.496, |
|
"eval_steps_per_second": 1.594, |
|
"step": 1620 |
|
}, |
|
{ |
|
"epoch": 5.45, |
|
"eval_accuracy": 0.9969621395027991, |
|
"eval_f1": 0.9781526548672567, |
|
"eval_loss": 0.015259744599461555, |
|
"eval_precision": 0.9754550468836183, |
|
"eval_recall": 0.980865224625624, |
|
"eval_runtime": 45.477, |
|
"eval_samples_per_second": 9.433, |
|
"eval_steps_per_second": 1.583, |
|
"step": 1630 |
|
}, |
|
{ |
|
"epoch": 5.48, |
|
"eval_accuracy": 0.997041734100979, |
|
"eval_f1": 0.9809075816270061, |
|
"eval_loss": 0.01531192846596241, |
|
"eval_precision": 0.9787410270568746, |
|
"eval_recall": 0.983083749306711, |
|
"eval_runtime": 45.3307, |
|
"eval_samples_per_second": 9.464, |
|
"eval_steps_per_second": 1.588, |
|
"step": 1640 |
|
}, |
|
{ |
|
"epoch": 5.52, |
|
"eval_accuracy": 0.9970152025682524, |
|
"eval_f1": 0.9804790253357331, |
|
"eval_loss": 0.015362209640443325, |
|
"eval_precision": 0.9789881116947746, |
|
"eval_recall": 0.9819744869661675, |
|
"eval_runtime": 45.5289, |
|
"eval_samples_per_second": 9.423, |
|
"eval_steps_per_second": 1.581, |
|
"step": 1650 |
|
}, |
|
{ |
|
"epoch": 5.55, |
|
"eval_accuracy": 0.9968825449046191, |
|
"eval_f1": 0.9736151402127364, |
|
"eval_loss": 0.016267232596874237, |
|
"eval_precision": 0.9699972474538948, |
|
"eval_recall": 0.9772601220188575, |
|
"eval_runtime": 45.4269, |
|
"eval_samples_per_second": 9.444, |
|
"eval_steps_per_second": 1.585, |
|
"step": 1660 |
|
}, |
|
{ |
|
"epoch": 5.59, |
|
"eval_accuracy": 0.9970152025682524, |
|
"eval_f1": 0.9776181265542968, |
|
"eval_loss": 0.01579289324581623, |
|
"eval_precision": 0.9741189427312775, |
|
"eval_recall": 0.9811425402107599, |
|
"eval_runtime": 46.1943, |
|
"eval_samples_per_second": 9.287, |
|
"eval_steps_per_second": 1.559, |
|
"step": 1670 |
|
}, |
|
{ |
|
"epoch": 5.62, |
|
"eval_accuracy": 0.9970284683346157, |
|
"eval_f1": 0.9785407725321887, |
|
"eval_loss": 0.01532789133489132, |
|
"eval_precision": 0.9770528061929776, |
|
"eval_recall": 0.9800332778702163, |
|
"eval_runtime": 46.2745, |
|
"eval_samples_per_second": 9.271, |
|
"eval_steps_per_second": 1.556, |
|
"step": 1680 |
|
}, |
|
{ |
|
"epoch": 5.65, |
|
"eval_accuracy": 0.9970549998673424, |
|
"eval_f1": 0.979665237238899, |
|
"eval_loss": 0.01536885742098093, |
|
"eval_precision": 0.9773668230747999, |
|
"eval_recall": 0.9819744869661675, |
|
"eval_runtime": 45.136, |
|
"eval_samples_per_second": 9.505, |
|
"eval_steps_per_second": 1.595, |
|
"step": 1690 |
|
}, |
|
{ |
|
"epoch": 5.69, |
|
"eval_accuracy": 0.9969488737364357, |
|
"eval_f1": 0.9772445179975174, |
|
"eval_loss": 0.01578596606850624, |
|
"eval_precision": 0.9720164609053498, |
|
"eval_recall": 0.9825291181364393, |
|
"eval_runtime": 45.0296, |
|
"eval_samples_per_second": 9.527, |
|
"eval_steps_per_second": 1.599, |
|
"step": 1700 |
|
}, |
|
{ |
|
"epoch": 5.72, |
|
"eval_accuracy": 0.9968560133718924, |
|
"eval_f1": 0.9757040309221425, |
|
"eval_loss": 0.01535722240805626, |
|
"eval_precision": 0.971412864211105, |
|
"eval_recall": 0.9800332778702163, |
|
"eval_runtime": 45.2636, |
|
"eval_samples_per_second": 9.478, |
|
"eval_steps_per_second": 1.591, |
|
"step": 1710 |
|
}, |
|
{ |
|
"epoch": 5.75, |
|
"eval_accuracy": 0.9970947971664323, |
|
"eval_f1": 0.9769496204278812, |
|
"eval_loss": 0.01525976974517107, |
|
"eval_precision": 0.9725199230557846, |
|
"eval_recall": 0.9814198557958957, |
|
"eval_runtime": 45.5287, |
|
"eval_samples_per_second": 9.423, |
|
"eval_steps_per_second": 1.581, |
|
"step": 1720 |
|
}, |
|
{ |
|
"epoch": 5.79, |
|
"eval_accuracy": 0.9970682656337057, |
|
"eval_f1": 0.9776181265542968, |
|
"eval_loss": 0.014473304152488708, |
|
"eval_precision": 0.9741189427312775, |
|
"eval_recall": 0.9811425402107599, |
|
"eval_runtime": 45.6773, |
|
"eval_samples_per_second": 9.392, |
|
"eval_steps_per_second": 1.576, |
|
"step": 1730 |
|
}, |
|
{ |
|
"epoch": 5.82, |
|
"eval_accuracy": 0.9971345944655223, |
|
"eval_f1": 0.9802349689011749, |
|
"eval_loss": 0.013995842076838017, |
|
"eval_precision": 0.9771286855883163, |
|
"eval_recall": 0.9833610648918469, |
|
"eval_runtime": 45.5912, |
|
"eval_samples_per_second": 9.41, |
|
"eval_steps_per_second": 1.579, |
|
"step": 1740 |
|
}, |
|
{ |
|
"epoch": 5.85, |
|
"eval_accuracy": 0.9970947971664323, |
|
"eval_f1": 0.9808864265927978, |
|
"eval_loss": 0.014489100314676762, |
|
"eval_precision": 0.9798007747648035, |
|
"eval_recall": 0.9819744869661675, |
|
"eval_runtime": 45.3576, |
|
"eval_samples_per_second": 9.458, |
|
"eval_steps_per_second": 1.587, |
|
"step": 1750 |
|
}, |
|
{ |
|
"epoch": 5.89, |
|
"eval_accuracy": 0.9972274548300656, |
|
"eval_f1": 0.9808864265927978, |
|
"eval_loss": 0.014342778362333775, |
|
"eval_precision": 0.9798007747648035, |
|
"eval_recall": 0.9819744869661675, |
|
"eval_runtime": 45.5077, |
|
"eval_samples_per_second": 9.427, |
|
"eval_steps_per_second": 1.582, |
|
"step": 1760 |
|
}, |
|
{ |
|
"epoch": 5.92, |
|
"eval_accuracy": 0.9972805178955189, |
|
"eval_f1": 0.9800774764803543, |
|
"eval_loss": 0.014782003127038479, |
|
"eval_precision": 0.9779127553837659, |
|
"eval_recall": 0.9822518025513034, |
|
"eval_runtime": 45.3932, |
|
"eval_samples_per_second": 9.451, |
|
"eval_steps_per_second": 1.586, |
|
"step": 1770 |
|
}, |
|
{ |
|
"epoch": 5.95, |
|
"eval_accuracy": 0.9972009232973389, |
|
"eval_f1": 0.978852798894264, |
|
"eval_loss": 0.014779850840568542, |
|
"eval_precision": 0.9757508955635161, |
|
"eval_recall": 0.9819744869661675, |
|
"eval_runtime": 45.6592, |
|
"eval_samples_per_second": 9.396, |
|
"eval_steps_per_second": 1.577, |
|
"step": 1780 |
|
}, |
|
{ |
|
"epoch": 5.99, |
|
"eval_accuracy": 0.9971213286991589, |
|
"eval_f1": 0.9799141155284665, |
|
"eval_loss": 0.015209286473691463, |
|
"eval_precision": 0.9789648491558262, |
|
"eval_recall": 0.980865224625624, |
|
"eval_runtime": 46.4662, |
|
"eval_samples_per_second": 9.233, |
|
"eval_steps_per_second": 1.55, |
|
"step": 1790 |
|
}, |
|
{ |
|
"epoch": 6.02, |
|
"eval_accuracy": 0.9971876575309756, |
|
"eval_f1": 0.981011781011781, |
|
"eval_loss": 0.015130845829844475, |
|
"eval_precision": 0.9806040454419507, |
|
"eval_recall": 0.9814198557958957, |
|
"eval_runtime": 45.3314, |
|
"eval_samples_per_second": 9.464, |
|
"eval_steps_per_second": 1.588, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 6.05, |
|
"eval_accuracy": 0.9971213286991589, |
|
"eval_f1": 0.9795297372060858, |
|
"eval_loss": 0.015158111229538918, |
|
"eval_precision": 0.9770971302428256, |
|
"eval_recall": 0.9819744869661675, |
|
"eval_runtime": 45.4446, |
|
"eval_samples_per_second": 9.44, |
|
"eval_steps_per_second": 1.584, |
|
"step": 1810 |
|
}, |
|
{ |
|
"epoch": 6.09, |
|
"eval_accuracy": 0.9970947971664323, |
|
"eval_f1": 0.9782638792745397, |
|
"eval_loss": 0.015132046304643154, |
|
"eval_precision": 0.9767763339784352, |
|
"eval_recall": 0.9797559622850804, |
|
"eval_runtime": 45.4433, |
|
"eval_samples_per_second": 9.44, |
|
"eval_steps_per_second": 1.584, |
|
"step": 1820 |
|
}, |
|
{ |
|
"epoch": 6.12, |
|
"eval_accuracy": 0.9968825449046191, |
|
"eval_f1": 0.9705516383243468, |
|
"eval_loss": 0.01593286544084549, |
|
"eval_precision": 0.967741935483871, |
|
"eval_recall": 0.9733777038269551, |
|
"eval_runtime": 45.4009, |
|
"eval_samples_per_second": 9.449, |
|
"eval_steps_per_second": 1.586, |
|
"step": 1830 |
|
}, |
|
{ |
|
"epoch": 6.15, |
|
"eval_accuracy": 0.9969356079700724, |
|
"eval_f1": 0.9730774540936076, |
|
"eval_loss": 0.014840428717434406, |
|
"eval_precision": 0.9689304371734946, |
|
"eval_recall": 0.9772601220188575, |
|
"eval_runtime": 45.3952, |
|
"eval_samples_per_second": 9.45, |
|
"eval_steps_per_second": 1.586, |
|
"step": 1840 |
|
}, |
|
{ |
|
"epoch": 6.19, |
|
"eval_accuracy": 0.9966570268764426, |
|
"eval_f1": 0.9764868603042877, |
|
"eval_loss": 0.016662631183862686, |
|
"eval_precision": 0.9740618101545254, |
|
"eval_recall": 0.9789240155296728, |
|
"eval_runtime": 45.439, |
|
"eval_samples_per_second": 9.441, |
|
"eval_steps_per_second": 1.585, |
|
"step": 1850 |
|
}, |
|
{ |
|
"epoch": 6.22, |
|
"eval_accuracy": 0.9965376349791727, |
|
"eval_f1": 0.9750761561894212, |
|
"eval_loss": 0.01773080602288246, |
|
"eval_precision": 0.9737278761061947, |
|
"eval_recall": 0.9764281752634498, |
|
"eval_runtime": 45.6526, |
|
"eval_samples_per_second": 9.397, |
|
"eval_steps_per_second": 1.577, |
|
"step": 1860 |
|
}, |
|
{ |
|
"epoch": 6.25, |
|
"eval_accuracy": 0.9964182430819029, |
|
"eval_f1": 0.9697221070095395, |
|
"eval_loss": 0.018397442996501923, |
|
"eval_precision": 0.9669148056244831, |
|
"eval_recall": 0.9725457570715474, |
|
"eval_runtime": 45.4014, |
|
"eval_samples_per_second": 9.449, |
|
"eval_steps_per_second": 1.586, |
|
"step": 1870 |
|
}, |
|
{ |
|
"epoch": 6.29, |
|
"eval_accuracy": 0.9966968241755326, |
|
"eval_f1": 0.9773292784075199, |
|
"eval_loss": 0.0170457661151886, |
|
"eval_precision": 0.9743660418963617, |
|
"eval_recall": 0.9803105934553522, |
|
"eval_runtime": 45.6124, |
|
"eval_samples_per_second": 9.405, |
|
"eval_steps_per_second": 1.579, |
|
"step": 1880 |
|
}, |
|
{ |
|
"epoch": 6.32, |
|
"eval_accuracy": 0.9968029503064392, |
|
"eval_f1": 0.9793046357615895, |
|
"eval_loss": 0.01652824692428112, |
|
"eval_precision": 0.9744645799011532, |
|
"eval_recall": 0.9841930116472546, |
|
"eval_runtime": 45.4345, |
|
"eval_samples_per_second": 9.442, |
|
"eval_steps_per_second": 1.585, |
|
"step": 1890 |
|
}, |
|
{ |
|
"epoch": 6.35, |
|
"eval_accuracy": 0.9967233557082593, |
|
"eval_f1": 0.978476821192053, |
|
"eval_loss": 0.016787514090538025, |
|
"eval_precision": 0.9736408566721582, |
|
"eval_recall": 0.9833610648918469, |
|
"eval_runtime": 45.5818, |
|
"eval_samples_per_second": 9.412, |
|
"eval_steps_per_second": 1.58, |
|
"step": 1900 |
|
}, |
|
{ |
|
"epoch": 6.39, |
|
"eval_accuracy": 0.9965641665118994, |
|
"eval_f1": 0.975320557010892, |
|
"eval_loss": 0.01782037876546383, |
|
"eval_precision": 0.9698382231971483, |
|
"eval_recall": 0.980865224625624, |
|
"eval_runtime": 45.9556, |
|
"eval_samples_per_second": 9.335, |
|
"eval_steps_per_second": 1.567, |
|
"step": 1910 |
|
}, |
|
{ |
|
"epoch": 6.42, |
|
"eval_accuracy": 0.9966702926428059, |
|
"eval_f1": 0.9768211920529801, |
|
"eval_loss": 0.017588861286640167, |
|
"eval_precision": 0.9719934102141681, |
|
"eval_recall": 0.9816971713810316, |
|
"eval_runtime": 45.1589, |
|
"eval_samples_per_second": 9.5, |
|
"eval_steps_per_second": 1.594, |
|
"step": 1920 |
|
}, |
|
{ |
|
"epoch": 6.45, |
|
"eval_accuracy": 0.9969488737364357, |
|
"eval_f1": 0.9810799613313078, |
|
"eval_loss": 0.016702750697731972, |
|
"eval_precision": 0.9771664374140303, |
|
"eval_recall": 0.9850249584026622, |
|
"eval_runtime": 45.117, |
|
"eval_samples_per_second": 9.509, |
|
"eval_steps_per_second": 1.596, |
|
"step": 1930 |
|
}, |
|
{ |
|
"epoch": 6.49, |
|
"eval_accuracy": 0.9968029503064392, |
|
"eval_f1": 0.9783179118906229, |
|
"eval_loss": 0.016243569552898407, |
|
"eval_precision": 0.9744154057771665, |
|
"eval_recall": 0.9822518025513034, |
|
"eval_runtime": 45.1078, |
|
"eval_samples_per_second": 9.511, |
|
"eval_steps_per_second": 1.596, |
|
"step": 1940 |
|
}, |
|
{ |
|
"epoch": 6.52, |
|
"eval_accuracy": 0.9968692791382558, |
|
"eval_f1": 0.9773418071290412, |
|
"eval_loss": 0.01623663119971752, |
|
"eval_precision": 0.9738436123348018, |
|
"eval_recall": 0.980865224625624, |
|
"eval_runtime": 45.7949, |
|
"eval_samples_per_second": 9.368, |
|
"eval_steps_per_second": 1.572, |
|
"step": 1950 |
|
}, |
|
{ |
|
"epoch": 6.56, |
|
"eval_accuracy": 0.9967896845400759, |
|
"eval_f1": 0.9769496204278812, |
|
"eval_loss": 0.016976099461317062, |
|
"eval_precision": 0.9725199230557846, |
|
"eval_recall": 0.9814198557958957, |
|
"eval_runtime": 45.3661, |
|
"eval_samples_per_second": 9.456, |
|
"eval_steps_per_second": 1.587, |
|
"step": 1960 |
|
}, |
|
{ |
|
"epoch": 6.59, |
|
"eval_accuracy": 0.9967233557082593, |
|
"eval_f1": 0.9759933774834438, |
|
"eval_loss": 0.017524730414152145, |
|
"eval_precision": 0.971169686985173, |
|
"eval_recall": 0.980865224625624, |
|
"eval_runtime": 45.7337, |
|
"eval_samples_per_second": 9.38, |
|
"eval_steps_per_second": 1.574, |
|
"step": 1970 |
|
}, |
|
{ |
|
"epoch": 6.62, |
|
"eval_accuracy": 0.9968029503064392, |
|
"eval_f1": 0.9794397681799365, |
|
"eval_loss": 0.016901282593607903, |
|
"eval_precision": 0.9747322164240593, |
|
"eval_recall": 0.9841930116472546, |
|
"eval_runtime": 45.4807, |
|
"eval_samples_per_second": 9.433, |
|
"eval_steps_per_second": 1.583, |
|
"step": 1980 |
|
}, |
|
{ |
|
"epoch": 6.66, |
|
"eval_accuracy": 0.9967896845400759, |
|
"eval_f1": 0.9788761562888305, |
|
"eval_loss": 0.01667814515531063, |
|
"eval_precision": 0.9747044267253231, |
|
"eval_recall": 0.983083749306711, |
|
"eval_runtime": 45.6668, |
|
"eval_samples_per_second": 9.394, |
|
"eval_steps_per_second": 1.577, |
|
"step": 1990 |
|
}, |
|
{ |
|
"epoch": 6.69, |
|
"learning_rate": 8.000000000000001e-06, |
|
"loss": 0.0064, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 6.69, |
|
"eval_accuracy": 0.9967100899418959, |
|
"eval_f1": 0.9776428374275461, |
|
"eval_loss": 0.016720809042453766, |
|
"eval_precision": 0.9730769230769231, |
|
"eval_recall": 0.9822518025513034, |
|
"eval_runtime": 45.4912, |
|
"eval_samples_per_second": 9.43, |
|
"eval_steps_per_second": 1.583, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 6.72, |
|
"eval_accuracy": 0.9966172295773527, |
|
"eval_f1": 0.9770781552057443, |
|
"eval_loss": 0.017004678025841713, |
|
"eval_precision": 0.9730473047304731, |
|
"eval_recall": 0.9811425402107599, |
|
"eval_runtime": 45.7222, |
|
"eval_samples_per_second": 9.383, |
|
"eval_steps_per_second": 1.575, |
|
"step": 2010 |
|
}, |
|
{ |
|
"epoch": 6.76, |
|
"eval_accuracy": 0.9966172295773527, |
|
"eval_f1": 0.9774892970584174, |
|
"eval_loss": 0.016945617273449898, |
|
"eval_precision": 0.9735900962861073, |
|
"eval_recall": 0.9814198557958957, |
|
"eval_runtime": 45.3731, |
|
"eval_samples_per_second": 9.455, |
|
"eval_steps_per_second": 1.587, |
|
"step": 2020 |
|
}, |
|
{ |
|
"epoch": 6.79, |
|
"eval_accuracy": 0.9967100899418959, |
|
"eval_f1": 0.9788994621431527, |
|
"eval_loss": 0.016928063705563545, |
|
"eval_precision": 0.9736625514403292, |
|
"eval_recall": 0.9841930116472546, |
|
"eval_runtime": 45.8513, |
|
"eval_samples_per_second": 9.356, |
|
"eval_steps_per_second": 1.57, |
|
"step": 2030 |
|
}, |
|
{ |
|
"epoch": 6.82, |
|
"eval_accuracy": 0.9967896845400759, |
|
"eval_f1": 0.9779675020655467, |
|
"eval_loss": 0.01666436158120632, |
|
"eval_precision": 0.9712800875273523, |
|
"eval_recall": 0.9847476428175264, |
|
"eval_runtime": 45.4258, |
|
"eval_samples_per_second": 9.444, |
|
"eval_steps_per_second": 1.585, |
|
"step": 2040 |
|
}, |
|
{ |
|
"epoch": 6.86, |
|
"eval_accuracy": 0.9968560133718924, |
|
"eval_f1": 0.9770130763936682, |
|
"eval_loss": 0.016234010457992554, |
|
"eval_precision": 0.969937141295436, |
|
"eval_recall": 0.9841930116472546, |
|
"eval_runtime": 45.6745, |
|
"eval_samples_per_second": 9.393, |
|
"eval_steps_per_second": 1.576, |
|
"step": 2050 |
|
}, |
|
{ |
|
"epoch": 6.89, |
|
"eval_accuracy": 0.9968029503064392, |
|
"eval_f1": 0.9758986365514392, |
|
"eval_loss": 0.015693064779043198, |
|
"eval_precision": 0.9693570451436389, |
|
"eval_recall": 0.9825291181364393, |
|
"eval_runtime": 46.507, |
|
"eval_samples_per_second": 9.224, |
|
"eval_steps_per_second": 1.548, |
|
"step": 2060 |
|
}, |
|
{ |
|
"epoch": 6.92, |
|
"eval_accuracy": 0.9968825449046191, |
|
"eval_f1": 0.978476821192053, |
|
"eval_loss": 0.015247814357280731, |
|
"eval_precision": 0.9736408566721582, |
|
"eval_recall": 0.9833610648918469, |
|
"eval_runtime": 45.4327, |
|
"eval_samples_per_second": 9.443, |
|
"eval_steps_per_second": 1.585, |
|
"step": 2070 |
|
}, |
|
{ |
|
"epoch": 6.96, |
|
"eval_accuracy": 0.9968692791382558, |
|
"eval_f1": 0.9795636564484949, |
|
"eval_loss": 0.01587117277085781, |
|
"eval_precision": 0.9755225522552256, |
|
"eval_recall": 0.9836383804769828, |
|
"eval_runtime": 45.1551, |
|
"eval_samples_per_second": 9.501, |
|
"eval_steps_per_second": 1.595, |
|
"step": 2080 |
|
}, |
|
{ |
|
"epoch": 6.99, |
|
"eval_accuracy": 0.9967100899418959, |
|
"eval_f1": 0.9783776339347198, |
|
"eval_loss": 0.017061389982700348, |
|
"eval_precision": 0.9718194254445964, |
|
"eval_recall": 0.9850249584026622, |
|
"eval_runtime": 45.1957, |
|
"eval_samples_per_second": 9.492, |
|
"eval_steps_per_second": 1.593, |
|
"step": 2090 |
|
}, |
|
{ |
|
"epoch": 7.02, |
|
"eval_accuracy": 0.9965906980446261, |
|
"eval_f1": 0.9775821757667446, |
|
"eval_loss": 0.018233157694339752, |
|
"eval_precision": 0.9697135061391542, |
|
"eval_recall": 0.985579589572934, |
|
"eval_runtime": 45.2503, |
|
"eval_samples_per_second": 9.481, |
|
"eval_steps_per_second": 1.591, |
|
"step": 2100 |
|
}, |
|
{ |
|
"epoch": 7.06, |
|
"eval_accuracy": 0.9970019368018891, |
|
"eval_f1": 0.9790113228389947, |
|
"eval_loss": 0.01590120792388916, |
|
"eval_precision": 0.974972497249725, |
|
"eval_recall": 0.983083749306711, |
|
"eval_runtime": 45.4565, |
|
"eval_samples_per_second": 9.438, |
|
"eval_steps_per_second": 1.584, |
|
"step": 2110 |
|
}, |
|
{ |
|
"epoch": 7.09, |
|
"eval_accuracy": 0.9968692791382558, |
|
"eval_f1": 0.9770971302428255, |
|
"eval_loss": 0.015739668160676956, |
|
"eval_precision": 0.972267984623833, |
|
"eval_recall": 0.9819744869661675, |
|
"eval_runtime": 46.0012, |
|
"eval_samples_per_second": 9.326, |
|
"eval_steps_per_second": 1.565, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 7.12, |
|
"eval_accuracy": 0.9969223422037091, |
|
"eval_f1": 0.9790113228389947, |
|
"eval_loss": 0.015736253932118416, |
|
"eval_precision": 0.974972497249725, |
|
"eval_recall": 0.983083749306711, |
|
"eval_runtime": 45.4255, |
|
"eval_samples_per_second": 9.444, |
|
"eval_steps_per_second": 1.585, |
|
"step": 2130 |
|
}, |
|
{ |
|
"epoch": 7.16, |
|
"eval_accuracy": 0.9968825449046191, |
|
"eval_f1": 0.9784827586206897, |
|
"eval_loss": 0.016040045768022537, |
|
"eval_precision": 0.9733809001097695, |
|
"eval_recall": 0.9836383804769828, |
|
"eval_runtime": 45.5296, |
|
"eval_samples_per_second": 9.422, |
|
"eval_steps_per_second": 1.581, |
|
"step": 2140 |
|
}, |
|
{ |
|
"epoch": 7.19, |
|
"eval_accuracy": 0.9969223422037091, |
|
"eval_f1": 0.9786413118368471, |
|
"eval_loss": 0.01620173640549183, |
|
"eval_precision": 0.9726102437688304, |
|
"eval_recall": 0.9847476428175264, |
|
"eval_runtime": 45.6034, |
|
"eval_samples_per_second": 9.407, |
|
"eval_steps_per_second": 1.579, |
|
"step": 2150 |
|
}, |
|
{ |
|
"epoch": 7.22, |
|
"eval_accuracy": 0.9969886710355257, |
|
"eval_f1": 0.9798565121412803, |
|
"eval_loss": 0.0158588457852602, |
|
"eval_precision": 0.9750137287204832, |
|
"eval_recall": 0.9847476428175264, |
|
"eval_runtime": 45.789, |
|
"eval_samples_per_second": 9.369, |
|
"eval_steps_per_second": 1.572, |
|
"step": 2160 |
|
}, |
|
{ |
|
"epoch": 7.26, |
|
"eval_accuracy": 0.9969488737364357, |
|
"eval_f1": 0.9791522849647936, |
|
"eval_loss": 0.015738798305392265, |
|
"eval_precision": 0.9749793786087435, |
|
"eval_recall": 0.9833610648918469, |
|
"eval_runtime": 45.511, |
|
"eval_samples_per_second": 9.426, |
|
"eval_steps_per_second": 1.582, |
|
"step": 2170 |
|
}, |
|
{ |
|
"epoch": 7.29, |
|
"eval_accuracy": 0.9970549998673424, |
|
"eval_f1": 0.9794113582976371, |
|
"eval_loss": 0.015642931684851646, |
|
"eval_precision": 0.976039658496282, |
|
"eval_recall": 0.9828064337215752, |
|
"eval_runtime": 45.1132, |
|
"eval_samples_per_second": 9.509, |
|
"eval_steps_per_second": 1.596, |
|
"step": 2180 |
|
}, |
|
{ |
|
"epoch": 7.32, |
|
"eval_accuracy": 0.9971611259982489, |
|
"eval_f1": 0.9811998894111142, |
|
"eval_loss": 0.015118683688342571, |
|
"eval_precision": 0.9782249173098125, |
|
"eval_recall": 0.9841930116472546, |
|
"eval_runtime": 45.0629, |
|
"eval_samples_per_second": 9.52, |
|
"eval_steps_per_second": 1.598, |
|
"step": 2190 |
|
}, |
|
{ |
|
"epoch": 7.36, |
|
"eval_accuracy": 0.9973601124936987, |
|
"eval_f1": 0.982160143825197, |
|
"eval_loss": 0.015025600790977478, |
|
"eval_precision": 0.9795862068965517, |
|
"eval_recall": 0.9847476428175264, |
|
"eval_runtime": 45.3715, |
|
"eval_samples_per_second": 9.455, |
|
"eval_steps_per_second": 1.587, |
|
"step": 2200 |
|
}, |
|
{ |
|
"epoch": 7.39, |
|
"eval_accuracy": 0.9972539863627922, |
|
"eval_f1": 0.9786821705426357, |
|
"eval_loss": 0.014340460300445557, |
|
"eval_precision": 0.9770591487009398, |
|
"eval_recall": 0.9803105934553522, |
|
"eval_runtime": 45.1287, |
|
"eval_samples_per_second": 9.506, |
|
"eval_steps_per_second": 1.595, |
|
"step": 2210 |
|
}, |
|
{ |
|
"epoch": 7.42, |
|
"eval_accuracy": 0.9973335809609721, |
|
"eval_f1": 0.9813097051086805, |
|
"eval_loss": 0.0135923121124506, |
|
"eval_precision": 0.979817528338402, |
|
"eval_recall": 0.9828064337215752, |
|
"eval_runtime": 45.1943, |
|
"eval_samples_per_second": 9.492, |
|
"eval_steps_per_second": 1.593, |
|
"step": 2220 |
|
}, |
|
{ |
|
"epoch": 7.46, |
|
"eval_accuracy": 0.9972009232973389, |
|
"eval_f1": 0.978570441034149, |
|
"eval_loss": 0.014164491556584835, |
|
"eval_precision": 0.9757375241246209, |
|
"eval_recall": 0.9814198557958957, |
|
"eval_runtime": 45.309, |
|
"eval_samples_per_second": 9.468, |
|
"eval_steps_per_second": 1.589, |
|
"step": 2230 |
|
}, |
|
{ |
|
"epoch": 7.49, |
|
"eval_accuracy": 0.9972672521291555, |
|
"eval_f1": 0.9806308799114555, |
|
"eval_loss": 0.01402602344751358, |
|
"eval_precision": 0.9784649364991718, |
|
"eval_recall": 0.9828064337215752, |
|
"eval_runtime": 45.5204, |
|
"eval_samples_per_second": 9.424, |
|
"eval_steps_per_second": 1.582, |
|
"step": 2240 |
|
}, |
|
{ |
|
"epoch": 7.53, |
|
"eval_accuracy": 0.9972539863627922, |
|
"eval_f1": 0.9809181415929205, |
|
"eval_loss": 0.014084520749747753, |
|
"eval_precision": 0.9782129067843354, |
|
"eval_recall": 0.9836383804769828, |
|
"eval_runtime": 45.1882, |
|
"eval_samples_per_second": 9.494, |
|
"eval_steps_per_second": 1.593, |
|
"step": 2250 |
|
}, |
|
{ |
|
"epoch": 7.56, |
|
"eval_accuracy": 0.9972937836618821, |
|
"eval_f1": 0.9835111542192047, |
|
"eval_loss": 0.014140544459223747, |
|
"eval_precision": 0.9828302409304902, |
|
"eval_recall": 0.9841930116472546, |
|
"eval_runtime": 45.1162, |
|
"eval_samples_per_second": 9.509, |
|
"eval_steps_per_second": 1.596, |
|
"step": 2260 |
|
}, |
|
{ |
|
"epoch": 7.59, |
|
"eval_accuracy": 0.9971213286991589, |
|
"eval_f1": 0.980484429065744, |
|
"eval_loss": 0.015128599479794502, |
|
"eval_precision": 0.9787234042553191, |
|
"eval_recall": 0.9822518025513034, |
|
"eval_runtime": 45.1622, |
|
"eval_samples_per_second": 9.499, |
|
"eval_steps_per_second": 1.594, |
|
"step": 2270 |
|
}, |
|
{ |
|
"epoch": 7.63, |
|
"eval_accuracy": 0.9971743917646122, |
|
"eval_f1": 0.9838017444275232, |
|
"eval_loss": 0.014916467480361462, |
|
"eval_precision": 0.9823057782692839, |
|
"eval_recall": 0.9853022739877981, |
|
"eval_runtime": 45.3078, |
|
"eval_samples_per_second": 9.469, |
|
"eval_steps_per_second": 1.589, |
|
"step": 2280 |
|
}, |
|
{ |
|
"epoch": 7.66, |
|
"eval_accuracy": 0.9971876575309756, |
|
"eval_f1": 0.9826989619377162, |
|
"eval_loss": 0.014806441031396389, |
|
"eval_precision": 0.980933959657364, |
|
"eval_recall": 0.9844703272323905, |
|
"eval_runtime": 45.215, |
|
"eval_samples_per_second": 9.488, |
|
"eval_steps_per_second": 1.592, |
|
"step": 2290 |
|
}, |
|
{ |
|
"epoch": 7.69, |
|
"eval_accuracy": 0.9973335809609721, |
|
"eval_f1": 0.9828444936358606, |
|
"eval_loss": 0.014511052519083023, |
|
"eval_precision": 0.9806736609607951, |
|
"eval_recall": 0.9850249584026622, |
|
"eval_runtime": 45.1721, |
|
"eval_samples_per_second": 9.497, |
|
"eval_steps_per_second": 1.594, |
|
"step": 2300 |
|
}, |
|
{ |
|
"epoch": 7.73, |
|
"eval_accuracy": 0.9973070494282454, |
|
"eval_f1": 0.9824124082537044, |
|
"eval_loss": 0.014819289557635784, |
|
"eval_precision": 0.9811894882434301, |
|
"eval_recall": 0.9836383804769828, |
|
"eval_runtime": 45.484, |
|
"eval_samples_per_second": 9.432, |
|
"eval_steps_per_second": 1.583, |
|
"step": 2310 |
|
}, |
|
{ |
|
"epoch": 7.76, |
|
"eval_accuracy": 0.9971611259982489, |
|
"eval_f1": 0.9818935729094679, |
|
"eval_loss": 0.015233664773404598, |
|
"eval_precision": 0.9787820336180766, |
|
"eval_recall": 0.9850249584026622, |
|
"eval_runtime": 45.245, |
|
"eval_samples_per_second": 9.482, |
|
"eval_steps_per_second": 1.591, |
|
"step": 2320 |
|
}, |
|
{ |
|
"epoch": 7.79, |
|
"eval_accuracy": 0.9970549998673424, |
|
"eval_f1": 0.9814865985078752, |
|
"eval_loss": 0.01592710055410862, |
|
"eval_precision": 0.9779735682819384, |
|
"eval_recall": 0.9850249584026622, |
|
"eval_runtime": 45.1068, |
|
"eval_samples_per_second": 9.511, |
|
"eval_steps_per_second": 1.596, |
|
"step": 2330 |
|
}, |
|
{ |
|
"epoch": 7.83, |
|
"eval_accuracy": 0.9970019368018891, |
|
"eval_f1": 0.9807984528249758, |
|
"eval_loss": 0.01635568030178547, |
|
"eval_precision": 0.9771538673272777, |
|
"eval_recall": 0.9844703272323905, |
|
"eval_runtime": 45.3054, |
|
"eval_samples_per_second": 9.469, |
|
"eval_steps_per_second": 1.589, |
|
"step": 2340 |
|
}, |
|
{ |
|
"epoch": 7.86, |
|
"eval_accuracy": 0.9971213286991589, |
|
"eval_f1": 0.9810747340792927, |
|
"eval_loss": 0.015507887117564678, |
|
"eval_precision": 0.9774291219377924, |
|
"eval_recall": 0.9847476428175264, |
|
"eval_runtime": 45.3049, |
|
"eval_samples_per_second": 9.469, |
|
"eval_steps_per_second": 1.589, |
|
"step": 2350 |
|
}, |
|
{ |
|
"epoch": 7.89, |
|
"eval_accuracy": 0.9971743917646122, |
|
"eval_f1": 0.9814814814814814, |
|
"eval_loss": 0.01488608680665493, |
|
"eval_precision": 0.978236914600551, |
|
"eval_recall": 0.9847476428175264, |
|
"eval_runtime": 45.3669, |
|
"eval_samples_per_second": 9.456, |
|
"eval_steps_per_second": 1.587, |
|
"step": 2360 |
|
}, |
|
{ |
|
"epoch": 7.93, |
|
"eval_accuracy": 0.9969090764373458, |
|
"eval_f1": 0.9790055248618784, |
|
"eval_loss": 0.016140291467308998, |
|
"eval_precision": 0.9752339020363237, |
|
"eval_recall": 0.9828064337215752, |
|
"eval_runtime": 45.5755, |
|
"eval_samples_per_second": 9.413, |
|
"eval_steps_per_second": 1.58, |
|
"step": 2370 |
|
}, |
|
{ |
|
"epoch": 7.96, |
|
"eval_accuracy": 0.9968427476055292, |
|
"eval_f1": 0.980511402902557, |
|
"eval_loss": 0.01678432524204254, |
|
"eval_precision": 0.9774042435932764, |
|
"eval_recall": 0.9836383804769828, |
|
"eval_runtime": 45.3412, |
|
"eval_samples_per_second": 9.462, |
|
"eval_steps_per_second": 1.588, |
|
"step": 2380 |
|
}, |
|
{ |
|
"epoch": 7.99, |
|
"eval_accuracy": 0.9968162160728026, |
|
"eval_f1": 0.9803704727674868, |
|
"eval_loss": 0.016629330813884735, |
|
"eval_precision": 0.9773980154355016, |
|
"eval_recall": 0.9833610648918469, |
|
"eval_runtime": 45.5099, |
|
"eval_samples_per_second": 9.427, |
|
"eval_steps_per_second": 1.582, |
|
"step": 2390 |
|
}, |
|
{ |
|
"epoch": 8.03, |
|
"eval_accuracy": 0.9968560133718924, |
|
"eval_f1": 0.9798119469026549, |
|
"eval_loss": 0.01662250980734825, |
|
"eval_precision": 0.9771097628240485, |
|
"eval_recall": 0.9825291181364393, |
|
"eval_runtime": 45.337, |
|
"eval_samples_per_second": 9.462, |
|
"eval_steps_per_second": 1.588, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 8.06, |
|
"eval_accuracy": 0.9970019368018891, |
|
"eval_f1": 0.9813355454168395, |
|
"eval_loss": 0.0163425225764513, |
|
"eval_precision": 0.978494623655914, |
|
"eval_recall": 0.9841930116472546, |
|
"eval_runtime": 45.4794, |
|
"eval_samples_per_second": 9.433, |
|
"eval_steps_per_second": 1.583, |
|
"step": 2410 |
|
}, |
|
{ |
|
"epoch": 8.09, |
|
"eval_accuracy": 0.9970947971664323, |
|
"eval_f1": 0.9811842833425568, |
|
"eval_loss": 0.016381612047553062, |
|
"eval_precision": 0.9790171176145775, |
|
"eval_recall": 0.9833610648918469, |
|
"eval_runtime": 45.1726, |
|
"eval_samples_per_second": 9.497, |
|
"eval_steps_per_second": 1.594, |
|
"step": 2420 |
|
}, |
|
{ |
|
"epoch": 8.13, |
|
"eval_accuracy": 0.9971213286991589, |
|
"eval_f1": 0.9817528338401991, |
|
"eval_loss": 0.016340401023626328, |
|
"eval_precision": 0.9787761852260198, |
|
"eval_recall": 0.9847476428175264, |
|
"eval_runtime": 45.3524, |
|
"eval_samples_per_second": 9.459, |
|
"eval_steps_per_second": 1.588, |
|
"step": 2430 |
|
}, |
|
{ |
|
"epoch": 8.16, |
|
"eval_accuracy": 0.9970019368018891, |
|
"eval_f1": 0.980771890994605, |
|
"eval_loss": 0.016326354816555977, |
|
"eval_precision": 0.9784708804857852, |
|
"eval_recall": 0.983083749306711, |
|
"eval_runtime": 45.2927, |
|
"eval_samples_per_second": 9.472, |
|
"eval_steps_per_second": 1.59, |
|
"step": 2440 |
|
}, |
|
{ |
|
"epoch": 8.19, |
|
"eval_accuracy": 0.9970682656337057, |
|
"eval_f1": 0.9817275747508305, |
|
"eval_loss": 0.015510362572968006, |
|
"eval_precision": 0.9800995024875622, |
|
"eval_recall": 0.9833610648918469, |
|
"eval_runtime": 45.5096, |
|
"eval_samples_per_second": 9.427, |
|
"eval_steps_per_second": 1.582, |
|
"step": 2450 |
|
}, |
|
{ |
|
"epoch": 8.23, |
|
"eval_accuracy": 0.9971345944655223, |
|
"eval_f1": 0.9824464409122322, |
|
"eval_loss": 0.015236412174999714, |
|
"eval_precision": 0.9793331496279967, |
|
"eval_recall": 0.985579589572934, |
|
"eval_runtime": 45.3704, |
|
"eval_samples_per_second": 9.455, |
|
"eval_steps_per_second": 1.587, |
|
"step": 2460 |
|
}, |
|
{ |
|
"epoch": 8.26, |
|
"eval_accuracy": 0.9971345944655223, |
|
"eval_f1": 0.9814865985078752, |
|
"eval_loss": 0.015579747967422009, |
|
"eval_precision": 0.9779735682819384, |
|
"eval_recall": 0.9850249584026622, |
|
"eval_runtime": 45.2219, |
|
"eval_samples_per_second": 9.487, |
|
"eval_steps_per_second": 1.592, |
|
"step": 2470 |
|
}, |
|
{ |
|
"epoch": 8.29, |
|
"eval_accuracy": 0.9972009232973389, |
|
"eval_f1": 0.9789590254706533, |
|
"eval_loss": 0.014976629987359047, |
|
"eval_precision": 0.9773355444997236, |
|
"eval_recall": 0.9805879090404881, |
|
"eval_runtime": 45.5521, |
|
"eval_samples_per_second": 9.418, |
|
"eval_steps_per_second": 1.581, |
|
"step": 2480 |
|
}, |
|
{ |
|
"epoch": 8.33, |
|
"eval_accuracy": 0.9973335809609721, |
|
"eval_f1": 0.9824318716281643, |
|
"eval_loss": 0.014180959202349186, |
|
"eval_precision": 0.9801269666022633, |
|
"eval_recall": 0.9847476428175264, |
|
"eval_runtime": 45.6388, |
|
"eval_samples_per_second": 9.4, |
|
"eval_steps_per_second": 1.578, |
|
"step": 2490 |
|
}, |
|
{ |
|
"epoch": 8.36, |
|
"learning_rate": 7.500000000000001e-06, |
|
"loss": 0.0051, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 8.36, |
|
"eval_accuracy": 0.9972274548300656, |
|
"eval_f1": 0.9791522849647936, |
|
"eval_loss": 0.014656171202659607, |
|
"eval_precision": 0.9749793786087435, |
|
"eval_recall": 0.9833610648918469, |
|
"eval_runtime": 45.2727, |
|
"eval_samples_per_second": 9.476, |
|
"eval_steps_per_second": 1.59, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 8.39, |
|
"eval_accuracy": 0.9971213286991589, |
|
"eval_f1": 0.9780477702609416, |
|
"eval_loss": 0.014881155453622341, |
|
"eval_precision": 0.9738795710750618, |
|
"eval_recall": 0.9822518025513034, |
|
"eval_runtime": 45.7124, |
|
"eval_samples_per_second": 9.385, |
|
"eval_steps_per_second": 1.575, |
|
"step": 2510 |
|
}, |
|
{ |
|
"epoch": 8.43, |
|
"eval_accuracy": 0.9972141890637022, |
|
"eval_f1": 0.9806629834254144, |
|
"eval_loss": 0.014929546974599361, |
|
"eval_precision": 0.976884975233902, |
|
"eval_recall": 0.9844703272323905, |
|
"eval_runtime": 45.3886, |
|
"eval_samples_per_second": 9.452, |
|
"eval_steps_per_second": 1.586, |
|
"step": 2520 |
|
}, |
|
{ |
|
"epoch": 8.46, |
|
"eval_accuracy": 0.9972009232973389, |
|
"eval_f1": 0.9802404311178665, |
|
"eval_loss": 0.014953644014894962, |
|
"eval_precision": 0.976865877168824, |
|
"eval_recall": 0.9836383804769828, |
|
"eval_runtime": 45.8505, |
|
"eval_samples_per_second": 9.356, |
|
"eval_steps_per_second": 1.57, |
|
"step": 2530 |
|
}, |
|
{ |
|
"epoch": 8.49, |
|
"eval_accuracy": 0.9971345944655223, |
|
"eval_f1": 0.9813252178724583, |
|
"eval_loss": 0.014914426021277905, |
|
"eval_precision": 0.979022909191278, |
|
"eval_recall": 0.9836383804769828, |
|
"eval_runtime": 45.5694, |
|
"eval_samples_per_second": 9.414, |
|
"eval_steps_per_second": 1.58, |
|
"step": 2540 |
|
}, |
|
{ |
|
"epoch": 8.53, |
|
"eval_accuracy": 0.9972672521291555, |
|
"eval_f1": 0.9826941713969264, |
|
"eval_loss": 0.014766544103622437, |
|
"eval_precision": 0.9811998894111141, |
|
"eval_recall": 0.9841930116472546, |
|
"eval_runtime": 45.2509, |
|
"eval_samples_per_second": 9.48, |
|
"eval_steps_per_second": 1.591, |
|
"step": 2550 |
|
}, |
|
{ |
|
"epoch": 8.56, |
|
"eval_accuracy": 0.9972407205964289, |
|
"eval_f1": 0.9839468585662884, |
|
"eval_loss": 0.015172240324318409, |
|
"eval_precision": 0.9820441988950276, |
|
"eval_recall": 0.9858569051580699, |
|
"eval_runtime": 45.7001, |
|
"eval_samples_per_second": 9.387, |
|
"eval_steps_per_second": 1.575, |
|
"step": 2560 |
|
}, |
|
{ |
|
"epoch": 8.6, |
|
"eval_accuracy": 0.9971345944655223, |
|
"eval_f1": 0.9829993089149965, |
|
"eval_loss": 0.015841683372855186, |
|
"eval_precision": 0.9798842656379168, |
|
"eval_recall": 0.9861342207432058, |
|
"eval_runtime": 45.6884, |
|
"eval_samples_per_second": 9.39, |
|
"eval_steps_per_second": 1.576, |
|
"step": 2570 |
|
}, |
|
{ |
|
"epoch": 8.63, |
|
"eval_accuracy": 0.997041734100979, |
|
"eval_f1": 0.9813407049067036, |
|
"eval_loss": 0.016232503578066826, |
|
"eval_precision": 0.9782309176081565, |
|
"eval_recall": 0.9844703272323905, |
|
"eval_runtime": 45.3554, |
|
"eval_samples_per_second": 9.459, |
|
"eval_steps_per_second": 1.587, |
|
"step": 2580 |
|
}, |
|
{ |
|
"epoch": 8.66, |
|
"eval_accuracy": 0.9969621395027991, |
|
"eval_f1": 0.9763714246234628, |
|
"eval_loss": 0.015989486128091812, |
|
"eval_precision": 0.9730101900302947, |
|
"eval_recall": 0.9797559622850804, |
|
"eval_runtime": 45.3338, |
|
"eval_samples_per_second": 9.463, |
|
"eval_steps_per_second": 1.588, |
|
"step": 2590 |
|
}, |
|
{ |
|
"epoch": 8.7, |
|
"eval_accuracy": 0.9969223422037091, |
|
"eval_f1": 0.9746922970543493, |
|
"eval_loss": 0.015164612792432308, |
|
"eval_precision": 0.9721379310344828, |
|
"eval_recall": 0.9772601220188575, |
|
"eval_runtime": 45.3618, |
|
"eval_samples_per_second": 9.457, |
|
"eval_steps_per_second": 1.587, |
|
"step": 2600 |
|
}, |
|
{ |
|
"epoch": 8.73, |
|
"eval_accuracy": 0.9970284683346157, |
|
"eval_f1": 0.9752111895859299, |
|
"eval_loss": 0.015361527912318707, |
|
"eval_precision": 0.9739972337482711, |
|
"eval_recall": 0.9764281752634498, |
|
"eval_runtime": 45.7043, |
|
"eval_samples_per_second": 9.386, |
|
"eval_steps_per_second": 1.575, |
|
"step": 2610 |
|
}, |
|
{ |
|
"epoch": 8.76, |
|
"eval_accuracy": 0.9970947971664323, |
|
"eval_f1": 0.9776057506220625, |
|
"eval_loss": 0.015215002000331879, |
|
"eval_precision": 0.9746416758544653, |
|
"eval_recall": 0.9805879090404881, |
|
"eval_runtime": 45.5622, |
|
"eval_samples_per_second": 9.416, |
|
"eval_steps_per_second": 1.58, |
|
"step": 2620 |
|
}, |
|
{ |
|
"epoch": 8.8, |
|
"eval_accuracy": 0.9970815314000689, |
|
"eval_f1": 0.9777470628887354, |
|
"eval_loss": 0.014545532874763012, |
|
"eval_precision": 0.974648663543676, |
|
"eval_recall": 0.980865224625624, |
|
"eval_runtime": 45.4027, |
|
"eval_samples_per_second": 9.449, |
|
"eval_steps_per_second": 1.586, |
|
"step": 2630 |
|
}, |
|
{ |
|
"epoch": 8.83, |
|
"eval_accuracy": 0.9971611259982489, |
|
"eval_f1": 0.9813355454168395, |
|
"eval_loss": 0.014298198744654655, |
|
"eval_precision": 0.978494623655914, |
|
"eval_recall": 0.9841930116472546, |
|
"eval_runtime": 45.6015, |
|
"eval_samples_per_second": 9.408, |
|
"eval_steps_per_second": 1.579, |
|
"step": 2640 |
|
}, |
|
{ |
|
"epoch": 8.86, |
|
"eval_accuracy": 0.9971213286991589, |
|
"eval_f1": 0.9804952275556785, |
|
"eval_loss": 0.014669723808765411, |
|
"eval_precision": 0.978194866133039, |
|
"eval_recall": 0.9828064337215752, |
|
"eval_runtime": 45.6583, |
|
"eval_samples_per_second": 9.396, |
|
"eval_steps_per_second": 1.577, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 8.9, |
|
"eval_accuracy": 0.9970549998673424, |
|
"eval_f1": 0.9749550297495504, |
|
"eval_loss": 0.014710523188114166, |
|
"eval_precision": 0.9729356531344933, |
|
"eval_recall": 0.9769828064337216, |
|
"eval_runtime": 45.2863, |
|
"eval_samples_per_second": 9.473, |
|
"eval_steps_per_second": 1.59, |
|
"step": 2660 |
|
}, |
|
{ |
|
"epoch": 8.93, |
|
"eval_accuracy": 0.9972141890637022, |
|
"eval_f1": 0.9820094104622197, |
|
"eval_loss": 0.014592879451811314, |
|
"eval_precision": 0.980110497237569, |
|
"eval_recall": 0.9839156960621187, |
|
"eval_runtime": 45.3618, |
|
"eval_samples_per_second": 9.457, |
|
"eval_steps_per_second": 1.587, |
|
"step": 2670 |
|
}, |
|
{ |
|
"epoch": 8.96, |
|
"eval_accuracy": 0.9971876575309756, |
|
"eval_f1": 0.9817477876106194, |
|
"eval_loss": 0.014163294807076454, |
|
"eval_precision": 0.9790402647545504, |
|
"eval_recall": 0.9844703272323905, |
|
"eval_runtime": 45.3659, |
|
"eval_samples_per_second": 9.456, |
|
"eval_steps_per_second": 1.587, |
|
"step": 2680 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.9971345944655223, |
|
"eval_f1": 0.9792932081722805, |
|
"eval_loss": 0.01418287307024002, |
|
"eval_precision": 0.9749862561847169, |
|
"eval_recall": 0.9836383804769828, |
|
"eval_runtime": 45.6259, |
|
"eval_samples_per_second": 9.403, |
|
"eval_steps_per_second": 1.578, |
|
"step": 2690 |
|
}, |
|
{ |
|
"epoch": 9.03, |
|
"eval_accuracy": 0.9971478602318856, |
|
"eval_f1": 0.9809286898839138, |
|
"eval_loss": 0.014496715739369392, |
|
"eval_precision": 0.9776859504132231, |
|
"eval_recall": 0.9841930116472546, |
|
"eval_runtime": 45.371, |
|
"eval_samples_per_second": 9.455, |
|
"eval_steps_per_second": 1.587, |
|
"step": 2700 |
|
}, |
|
{ |
|
"epoch": 9.06, |
|
"eval_accuracy": 0.9970947971664323, |
|
"eval_f1": 0.9802295036637633, |
|
"eval_loss": 0.014654590748250484, |
|
"eval_precision": 0.9773917838433968, |
|
"eval_recall": 0.983083749306711, |
|
"eval_runtime": 45.386, |
|
"eval_samples_per_second": 9.452, |
|
"eval_steps_per_second": 1.586, |
|
"step": 2710 |
|
}, |
|
{ |
|
"epoch": 9.1, |
|
"eval_accuracy": 0.9970682656337057, |
|
"eval_f1": 0.9795410561238596, |
|
"eval_loss": 0.014612732455134392, |
|
"eval_precision": 0.9765711135611908, |
|
"eval_recall": 0.9825291181364393, |
|
"eval_runtime": 45.3853, |
|
"eval_samples_per_second": 9.452, |
|
"eval_steps_per_second": 1.586, |
|
"step": 2720 |
|
}, |
|
{ |
|
"epoch": 9.13, |
|
"eval_accuracy": 0.9970947971664323, |
|
"eval_f1": 0.9796989366109652, |
|
"eval_loss": 0.014642550610005856, |
|
"eval_precision": 0.9757909215955983, |
|
"eval_recall": 0.9836383804769828, |
|
"eval_runtime": 45.583, |
|
"eval_samples_per_second": 9.411, |
|
"eval_steps_per_second": 1.58, |
|
"step": 2730 |
|
}, |
|
{ |
|
"epoch": 9.16, |
|
"eval_accuracy": 0.9970815314000689, |
|
"eval_f1": 0.9792817679558011, |
|
"eval_loss": 0.014756478369235992, |
|
"eval_precision": 0.9755090809025867, |
|
"eval_recall": 0.983083749306711, |
|
"eval_runtime": 45.3958, |
|
"eval_samples_per_second": 9.45, |
|
"eval_steps_per_second": 1.586, |
|
"step": 2740 |
|
}, |
|
{ |
|
"epoch": 9.2, |
|
"eval_accuracy": 0.9971611259982489, |
|
"eval_f1": 0.9781526548672567, |
|
"eval_loss": 0.014514540322124958, |
|
"eval_precision": 0.9754550468836183, |
|
"eval_recall": 0.980865224625624, |
|
"eval_runtime": 45.3479, |
|
"eval_samples_per_second": 9.46, |
|
"eval_steps_per_second": 1.588, |
|
"step": 2750 |
|
}, |
|
{ |
|
"epoch": 9.23, |
|
"eval_accuracy": 0.9971876575309756, |
|
"eval_f1": 0.9780234968901176, |
|
"eval_loss": 0.014607676304876804, |
|
"eval_precision": 0.974924221548636, |
|
"eval_recall": 0.9811425402107599, |
|
"eval_runtime": 45.3679, |
|
"eval_samples_per_second": 9.456, |
|
"eval_steps_per_second": 1.587, |
|
"step": 2760 |
|
}, |
|
{ |
|
"epoch": 9.26, |
|
"eval_accuracy": 0.9971213286991589, |
|
"eval_f1": 0.9799585348997927, |
|
"eval_loss": 0.014230134896934032, |
|
"eval_precision": 0.9768531275833563, |
|
"eval_recall": 0.983083749306711, |
|
"eval_runtime": 45.6606, |
|
"eval_samples_per_second": 9.395, |
|
"eval_steps_per_second": 1.577, |
|
"step": 2770 |
|
}, |
|
{ |
|
"epoch": 9.3, |
|
"eval_accuracy": 0.9970815314000689, |
|
"eval_f1": 0.9814814814814814, |
|
"eval_loss": 0.014004090800881386, |
|
"eval_precision": 0.978236914600551, |
|
"eval_recall": 0.9847476428175264, |
|
"eval_runtime": 45.4655, |
|
"eval_samples_per_second": 9.436, |
|
"eval_steps_per_second": 1.584, |
|
"step": 2780 |
|
}, |
|
{ |
|
"epoch": 9.33, |
|
"eval_accuracy": 0.9971080629327956, |
|
"eval_f1": 0.980359612724758, |
|
"eval_loss": 0.013850794173777103, |
|
"eval_precision": 0.977924944812362, |
|
"eval_recall": 0.9828064337215752, |
|
"eval_runtime": 45.4768, |
|
"eval_samples_per_second": 9.433, |
|
"eval_steps_per_second": 1.583, |
|
"step": 2790 |
|
}, |
|
{ |
|
"epoch": 9.36, |
|
"eval_accuracy": 0.9970549998673424, |
|
"eval_f1": 0.9795070617557464, |
|
"eval_loss": 0.014602423645555973, |
|
"eval_precision": 0.9781526548672567, |
|
"eval_recall": 0.980865224625624, |
|
"eval_runtime": 46.0797, |
|
"eval_samples_per_second": 9.31, |
|
"eval_steps_per_second": 1.563, |
|
"step": 2800 |
|
}, |
|
{ |
|
"epoch": 9.4, |
|
"eval_accuracy": 0.9971345944655223, |
|
"eval_f1": 0.9811738648947951, |
|
"eval_loss": 0.01487213745713234, |
|
"eval_precision": 0.9795467108899945, |
|
"eval_recall": 0.9828064337215752, |
|
"eval_runtime": 45.4621, |
|
"eval_samples_per_second": 9.436, |
|
"eval_steps_per_second": 1.584, |
|
"step": 2810 |
|
}, |
|
{ |
|
"epoch": 9.43, |
|
"eval_accuracy": 0.9971345944655223, |
|
"eval_f1": 0.9789648491558263, |
|
"eval_loss": 0.01481552142649889, |
|
"eval_precision": 0.9770718232044199, |
|
"eval_recall": 0.980865224625624, |
|
"eval_runtime": 45.388, |
|
"eval_samples_per_second": 9.452, |
|
"eval_steps_per_second": 1.586, |
|
"step": 2820 |
|
}, |
|
{ |
|
"epoch": 9.46, |
|
"eval_accuracy": 0.9973601124936987, |
|
"eval_f1": 0.9822763777346994, |
|
"eval_loss": 0.01404637098312378, |
|
"eval_precision": 0.9809181415929203, |
|
"eval_recall": 0.9836383804769828, |
|
"eval_runtime": 45.4647, |
|
"eval_samples_per_second": 9.436, |
|
"eval_steps_per_second": 1.584, |
|
"step": 2830 |
|
}, |
|
{ |
|
"epoch": 9.5, |
|
"eval_accuracy": 0.9969488737364357, |
|
"eval_f1": 0.9712539925010416, |
|
"eval_loss": 0.014825278893113136, |
|
"eval_precision": 0.972739916550765, |
|
"eval_recall": 0.9697726012201886, |
|
"eval_runtime": 45.3762, |
|
"eval_samples_per_second": 9.454, |
|
"eval_steps_per_second": 1.587, |
|
"step": 2840 |
|
}, |
|
{ |
|
"epoch": 9.53, |
|
"eval_accuracy": 0.9964978376800828, |
|
"eval_f1": 0.9593767390094602, |
|
"eval_loss": 0.015539586544036865, |
|
"eval_precision": 0.9625907314349526, |
|
"eval_recall": 0.9561841375485303, |
|
"eval_runtime": 45.6548, |
|
"eval_samples_per_second": 9.397, |
|
"eval_steps_per_second": 1.577, |
|
"step": 2850 |
|
}, |
|
{ |
|
"epoch": 9.57, |
|
"eval_accuracy": 0.9964978376800828, |
|
"eval_f1": 0.9605006954102921, |
|
"eval_loss": 0.016403868794441223, |
|
"eval_precision": 0.9634486607142857, |
|
"eval_recall": 0.9575707154742097, |
|
"eval_runtime": 45.6372, |
|
"eval_samples_per_second": 9.4, |
|
"eval_steps_per_second": 1.578, |
|
"step": 2860 |
|
}, |
|
{ |
|
"epoch": 9.6, |
|
"eval_accuracy": 0.9970947971664323, |
|
"eval_f1": 0.9791350006908941, |
|
"eval_loss": 0.015382306650280952, |
|
"eval_precision": 0.9757642522721014, |
|
"eval_recall": 0.9825291181364393, |
|
"eval_runtime": 45.4505, |
|
"eval_samples_per_second": 9.439, |
|
"eval_steps_per_second": 1.584, |
|
"step": 2870 |
|
}, |
|
{ |
|
"epoch": 9.63, |
|
"eval_accuracy": 0.9970947971664323, |
|
"eval_f1": 0.9781647318960752, |
|
"eval_loss": 0.015797466039657593, |
|
"eval_precision": 0.974931129476584, |
|
"eval_recall": 0.9814198557958957, |
|
"eval_runtime": 45.42, |
|
"eval_samples_per_second": 9.445, |
|
"eval_steps_per_second": 1.585, |
|
"step": 2880 |
|
}, |
|
{ |
|
"epoch": 9.67, |
|
"eval_accuracy": 0.9969223422037091, |
|
"eval_f1": 0.9791637919138954, |
|
"eval_loss": 0.01617647521197796, |
|
"eval_precision": 0.9744575666025818, |
|
"eval_recall": 0.9839156960621187, |
|
"eval_runtime": 45.4393, |
|
"eval_samples_per_second": 9.441, |
|
"eval_steps_per_second": 1.585, |
|
"step": 2890 |
|
}, |
|
{ |
|
"epoch": 9.7, |
|
"eval_accuracy": 0.9969223422037091, |
|
"eval_f1": 0.978629532607197, |
|
"eval_loss": 0.0164639949798584, |
|
"eval_precision": 0.9731285988483686, |
|
"eval_recall": 0.9841930116472546, |
|
"eval_runtime": 45.4559, |
|
"eval_samples_per_second": 9.438, |
|
"eval_steps_per_second": 1.584, |
|
"step": 2900 |
|
}, |
|
{ |
|
"epoch": 9.73, |
|
"eval_accuracy": 0.9969886710355257, |
|
"eval_f1": 0.9791810285399146, |
|
"eval_loss": 0.016681063920259476, |
|
"eval_precision": 0.9736769947902385, |
|
"eval_recall": 0.9847476428175264, |
|
"eval_runtime": 45.5001, |
|
"eval_samples_per_second": 9.429, |
|
"eval_steps_per_second": 1.582, |
|
"step": 2910 |
|
}, |
|
{ |
|
"epoch": 9.77, |
|
"eval_accuracy": 0.9969621395027991, |
|
"eval_f1": 0.9808090570205716, |
|
"eval_loss": 0.016886161640286446, |
|
"eval_precision": 0.9766290899092659, |
|
"eval_recall": 0.9850249584026622, |
|
"eval_runtime": 45.9762, |
|
"eval_samples_per_second": 9.331, |
|
"eval_steps_per_second": 1.566, |
|
"step": 2920 |
|
}, |
|
{ |
|
"epoch": 9.8, |
|
"eval_accuracy": 0.9969621395027991, |
|
"eval_f1": 0.9787351560342448, |
|
"eval_loss": 0.017214221879839897, |
|
"eval_precision": 0.9746974697469747, |
|
"eval_recall": 0.9828064337215752, |
|
"eval_runtime": 45.4576, |
|
"eval_samples_per_second": 9.437, |
|
"eval_steps_per_second": 1.584, |
|
"step": 2930 |
|
}, |
|
{ |
|
"epoch": 9.83, |
|
"eval_accuracy": 0.9971213286991589, |
|
"eval_f1": 0.9816069699903195, |
|
"eval_loss": 0.016497749835252762, |
|
"eval_precision": 0.9790344827586207, |
|
"eval_recall": 0.9841930116472546, |
|
"eval_runtime": 45.3849, |
|
"eval_samples_per_second": 9.452, |
|
"eval_steps_per_second": 1.586, |
|
"step": 2940 |
|
}, |
|
{ |
|
"epoch": 9.87, |
|
"eval_accuracy": 0.9971876575309756, |
|
"eval_f1": 0.9821650767316467, |
|
"eval_loss": 0.01616404764354229, |
|
"eval_precision": 0.9793217535153019, |
|
"eval_recall": 0.9850249584026622, |
|
"eval_runtime": 45.4779, |
|
"eval_samples_per_second": 9.433, |
|
"eval_steps_per_second": 1.583, |
|
"step": 2950 |
|
}, |
|
{ |
|
"epoch": 9.9, |
|
"eval_accuracy": 0.9970682656337057, |
|
"eval_f1": 0.9790829754813686, |
|
"eval_loss": 0.016479264944791794, |
|
"eval_precision": 0.9781345142540825, |
|
"eval_recall": 0.9800332778702163, |
|
"eval_runtime": 45.8218, |
|
"eval_samples_per_second": 9.362, |
|
"eval_steps_per_second": 1.571, |
|
"step": 2960 |
|
}, |
|
{ |
|
"epoch": 9.93, |
|
"eval_accuracy": 0.9970947971664323, |
|
"eval_f1": 0.980060924951537, |
|
"eval_loss": 0.016018539667129517, |
|
"eval_precision": 0.9787057522123894, |
|
"eval_recall": 0.9814198557958957, |
|
"eval_runtime": 45.4831, |
|
"eval_samples_per_second": 9.432, |
|
"eval_steps_per_second": 1.583, |
|
"step": 2970 |
|
}, |
|
{ |
|
"epoch": 9.97, |
|
"eval_accuracy": 0.9970284683346157, |
|
"eval_f1": 0.9785348289710566, |
|
"eval_loss": 0.016076229512691498, |
|
"eval_precision": 0.9773167358229599, |
|
"eval_recall": 0.9797559622850804, |
|
"eval_runtime": 45.4108, |
|
"eval_samples_per_second": 9.447, |
|
"eval_steps_per_second": 1.586, |
|
"step": 2980 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.9970019368018891, |
|
"eval_f1": 0.9797895902547065, |
|
"eval_loss": 0.01618347130715847, |
|
"eval_precision": 0.9781647318960752, |
|
"eval_recall": 0.9814198557958957, |
|
"eval_runtime": 45.4332, |
|
"eval_samples_per_second": 9.442, |
|
"eval_steps_per_second": 1.585, |
|
"step": 2990 |
|
}, |
|
{ |
|
"epoch": 10.03, |
|
"learning_rate": 7e-06, |
|
"loss": 0.0046, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 10.03, |
|
"eval_accuracy": 0.9970019368018891, |
|
"eval_f1": 0.9791234619106871, |
|
"eval_loss": 0.016251519322395325, |
|
"eval_precision": 0.9762889440308795, |
|
"eval_recall": 0.9819744869661675, |
|
"eval_runtime": 45.7254, |
|
"eval_samples_per_second": 9.382, |
|
"eval_steps_per_second": 1.575, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 10.07, |
|
"eval_accuracy": 0.997041734100979, |
|
"eval_f1": 0.9806576402321082, |
|
"eval_loss": 0.0159316323697567, |
|
"eval_precision": 0.977147577092511, |
|
"eval_recall": 0.9841930116472546, |
|
"eval_runtime": 45.9937, |
|
"eval_samples_per_second": 9.327, |
|
"eval_steps_per_second": 1.565, |
|
"step": 3010 |
|
}, |
|
{ |
|
"epoch": 10.1, |
|
"eval_accuracy": 0.9970549998673424, |
|
"eval_f1": 0.9798007747648035, |
|
"eval_loss": 0.015915466472506523, |
|
"eval_precision": 0.9776366648260629, |
|
"eval_recall": 0.9819744869661675, |
|
"eval_runtime": 45.3335, |
|
"eval_samples_per_second": 9.463, |
|
"eval_steps_per_second": 1.588, |
|
"step": 3020 |
|
}, |
|
{ |
|
"epoch": 10.13, |
|
"eval_accuracy": 0.9971478602318856, |
|
"eval_f1": 0.9813200498132004, |
|
"eval_loss": 0.015171729028224945, |
|
"eval_precision": 0.9792874896437448, |
|
"eval_recall": 0.9833610648918469, |
|
"eval_runtime": 45.3108, |
|
"eval_samples_per_second": 9.468, |
|
"eval_steps_per_second": 1.589, |
|
"step": 3030 |
|
}, |
|
{ |
|
"epoch": 10.17, |
|
"eval_accuracy": 0.9966570268764426, |
|
"eval_f1": 0.9667917187717104, |
|
"eval_loss": 0.015076521784067154, |
|
"eval_precision": 0.9688109161793372, |
|
"eval_recall": 0.9647809206877427, |
|
"eval_runtime": 45.3556, |
|
"eval_samples_per_second": 9.459, |
|
"eval_steps_per_second": 1.587, |
|
"step": 3040 |
|
}, |
|
{ |
|
"epoch": 10.2, |
|
"eval_accuracy": 0.9968427476055292, |
|
"eval_f1": 0.9746922970543493, |
|
"eval_loss": 0.014860566705465317, |
|
"eval_precision": 0.9721379310344828, |
|
"eval_recall": 0.9772601220188575, |
|
"eval_runtime": 45.4321, |
|
"eval_samples_per_second": 9.443, |
|
"eval_steps_per_second": 1.585, |
|
"step": 3050 |
|
}, |
|
{ |
|
"epoch": 10.23, |
|
"eval_accuracy": 0.9970682656337057, |
|
"eval_f1": 0.980110497237569, |
|
"eval_loss": 0.014547467231750488, |
|
"eval_precision": 0.9763346175013758, |
|
"eval_recall": 0.9839156960621187, |
|
"eval_runtime": 45.3097, |
|
"eval_samples_per_second": 9.468, |
|
"eval_steps_per_second": 1.589, |
|
"step": 3060 |
|
}, |
|
{ |
|
"epoch": 10.27, |
|
"eval_accuracy": 0.997041734100979, |
|
"eval_f1": 0.9792760431058304, |
|
"eval_loss": 0.014211696572601795, |
|
"eval_precision": 0.9757709251101322, |
|
"eval_recall": 0.9828064337215752, |
|
"eval_runtime": 45.7056, |
|
"eval_samples_per_second": 9.386, |
|
"eval_steps_per_second": 1.575, |
|
"step": 3070 |
|
}, |
|
{ |
|
"epoch": 10.3, |
|
"eval_accuracy": 0.9970284683346157, |
|
"eval_f1": 0.9788469514724182, |
|
"eval_loss": 0.01424412615597248, |
|
"eval_precision": 0.9760132340777502, |
|
"eval_recall": 0.9816971713810316, |
|
"eval_runtime": 45.6738, |
|
"eval_samples_per_second": 9.393, |
|
"eval_steps_per_second": 1.576, |
|
"step": 3080 |
|
}, |
|
{ |
|
"epoch": 10.33, |
|
"eval_accuracy": 0.9969356079700724, |
|
"eval_f1": 0.9745293466223699, |
|
"eval_loss": 0.014736946672201157, |
|
"eval_precision": 0.9729132117191819, |
|
"eval_recall": 0.9761508596783139, |
|
"eval_runtime": 45.4811, |
|
"eval_samples_per_second": 9.432, |
|
"eval_steps_per_second": 1.583, |
|
"step": 3090 |
|
}, |
|
{ |
|
"epoch": 10.37, |
|
"eval_accuracy": 0.9970682656337057, |
|
"eval_f1": 0.9801050013815971, |
|
"eval_loss": 0.014717744663357735, |
|
"eval_precision": 0.9765969162995595, |
|
"eval_recall": 0.9836383804769828, |
|
"eval_runtime": 45.415, |
|
"eval_samples_per_second": 9.446, |
|
"eval_steps_per_second": 1.585, |
|
"step": 3100 |
|
}, |
|
{ |
|
"epoch": 10.4, |
|
"eval_accuracy": 0.9971080629327956, |
|
"eval_f1": 0.9810642709053213, |
|
"eval_loss": 0.015054759569466114, |
|
"eval_precision": 0.9779553596031965, |
|
"eval_recall": 0.9841930116472546, |
|
"eval_runtime": 45.7255, |
|
"eval_samples_per_second": 9.382, |
|
"eval_steps_per_second": 1.575, |
|
"step": 3110 |
|
}, |
|
{ |
|
"epoch": 10.43, |
|
"eval_accuracy": 0.9971080629327956, |
|
"eval_f1": 0.9807931463313527, |
|
"eval_loss": 0.01575205847620964, |
|
"eval_precision": 0.9774166896171853, |
|
"eval_recall": 0.9841930116472546, |
|
"eval_runtime": 45.3913, |
|
"eval_samples_per_second": 9.451, |
|
"eval_steps_per_second": 1.586, |
|
"step": 3120 |
|
}, |
|
{ |
|
"epoch": 10.47, |
|
"eval_accuracy": 0.9968162160728026, |
|
"eval_f1": 0.97202216066482, |
|
"eval_loss": 0.015902305021882057, |
|
"eval_precision": 0.9709463198671832, |
|
"eval_recall": 0.9731003882418192, |
|
"eval_runtime": 45.3669, |
|
"eval_samples_per_second": 9.456, |
|
"eval_steps_per_second": 1.587, |
|
"step": 3130 |
|
}, |
|
{ |
|
"epoch": 10.5, |
|
"eval_accuracy": 0.9966835584091693, |
|
"eval_f1": 0.9686633388796451, |
|
"eval_loss": 0.016264360398054123, |
|
"eval_precision": 0.9686633388796451, |
|
"eval_recall": 0.9686633388796451, |
|
"eval_runtime": 45.3009, |
|
"eval_samples_per_second": 9.47, |
|
"eval_steps_per_second": 1.589, |
|
"step": 3140 |
|
}, |
|
{ |
|
"epoch": 10.54, |
|
"eval_accuracy": 0.9969621395027991, |
|
"eval_f1": 0.9782698961937716, |
|
"eval_loss": 0.015213034115731716, |
|
"eval_precision": 0.9765128488532744, |
|
"eval_recall": 0.9800332778702163, |
|
"eval_runtime": 45.7467, |
|
"eval_samples_per_second": 9.378, |
|
"eval_steps_per_second": 1.574, |
|
"step": 3150 |
|
}, |
|
{ |
|
"epoch": 10.57, |
|
"eval_accuracy": 0.9969886710355257, |
|
"eval_f1": 0.978693967902601, |
|
"eval_loss": 0.014814727008342743, |
|
"eval_precision": 0.9765323025952513, |
|
"eval_recall": 0.980865224625624, |
|
"eval_runtime": 45.3386, |
|
"eval_samples_per_second": 9.462, |
|
"eval_steps_per_second": 1.588, |
|
"step": 3160 |
|
}, |
|
{ |
|
"epoch": 10.6, |
|
"eval_accuracy": 0.9970549998673424, |
|
"eval_f1": 0.9793828697938286, |
|
"eval_loss": 0.015096531249582767, |
|
"eval_precision": 0.9773543220104943, |
|
"eval_recall": 0.9814198557958957, |
|
"eval_runtime": 45.6502, |
|
"eval_samples_per_second": 9.398, |
|
"eval_steps_per_second": 1.577, |
|
"step": 3170 |
|
}, |
|
{ |
|
"epoch": 10.64, |
|
"eval_accuracy": 0.997041734100979, |
|
"eval_f1": 0.9764998617638928, |
|
"eval_loss": 0.015553129836916924, |
|
"eval_precision": 0.9735391400220507, |
|
"eval_recall": 0.9794786466999446, |
|
"eval_runtime": 45.4708, |
|
"eval_samples_per_second": 9.435, |
|
"eval_steps_per_second": 1.583, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 10.67, |
|
"eval_accuracy": 0.9970152025682524, |
|
"eval_f1": 0.9774643992810729, |
|
"eval_loss": 0.0158841609954834, |
|
"eval_precision": 0.9746346843121036, |
|
"eval_recall": 0.9803105934553522, |
|
"eval_runtime": 45.4753, |
|
"eval_samples_per_second": 9.434, |
|
"eval_steps_per_second": 1.583, |
|
"step": 3190 |
|
}, |
|
{ |
|
"epoch": 10.7, |
|
"eval_accuracy": 0.9970682656337057, |
|
"eval_f1": 0.9800884955752212, |
|
"eval_loss": 0.016482515260577202, |
|
"eval_precision": 0.9773855488141202, |
|
"eval_recall": 0.9828064337215752, |
|
"eval_runtime": 45.5435, |
|
"eval_samples_per_second": 9.42, |
|
"eval_steps_per_second": 1.581, |
|
"step": 3200 |
|
}, |
|
{ |
|
"epoch": 10.74, |
|
"eval_accuracy": 0.9970815314000689, |
|
"eval_f1": 0.9795410561238596, |
|
"eval_loss": 0.016413580626249313, |
|
"eval_precision": 0.9765711135611908, |
|
"eval_recall": 0.9825291181364393, |
|
"eval_runtime": 45.616, |
|
"eval_samples_per_second": 9.405, |
|
"eval_steps_per_second": 1.578, |
|
"step": 3210 |
|
}, |
|
{ |
|
"epoch": 10.77, |
|
"eval_accuracy": 0.9969621395027991, |
|
"eval_f1": 0.9791176877333702, |
|
"eval_loss": 0.01622335985302925, |
|
"eval_precision": 0.976551724137931, |
|
"eval_recall": 0.9816971713810316, |
|
"eval_runtime": 45.7676, |
|
"eval_samples_per_second": 9.373, |
|
"eval_steps_per_second": 1.573, |
|
"step": 3220 |
|
}, |
|
{ |
|
"epoch": 10.8, |
|
"eval_accuracy": 0.9969621395027991, |
|
"eval_f1": 0.9803541781959049, |
|
"eval_loss": 0.015803754329681396, |
|
"eval_precision": 0.9781888459414688, |
|
"eval_recall": 0.9825291181364393, |
|
"eval_runtime": 45.7275, |
|
"eval_samples_per_second": 9.382, |
|
"eval_steps_per_second": 1.575, |
|
"step": 3230 |
|
}, |
|
{ |
|
"epoch": 10.84, |
|
"eval_accuracy": 0.9968958106709824, |
|
"eval_f1": 0.9793828697938286, |
|
"eval_loss": 0.015858009457588196, |
|
"eval_precision": 0.9773543220104943, |
|
"eval_recall": 0.9814198557958957, |
|
"eval_runtime": 45.806, |
|
"eval_samples_per_second": 9.366, |
|
"eval_steps_per_second": 1.572, |
|
"step": 3240 |
|
}, |
|
{ |
|
"epoch": 10.87, |
|
"eval_accuracy": 0.9966968241755326, |
|
"eval_f1": 0.9738263398421271, |
|
"eval_loss": 0.016643954440951347, |
|
"eval_precision": 0.9726141078838174, |
|
"eval_recall": 0.9750415973377704, |
|
"eval_runtime": 45.5359, |
|
"eval_samples_per_second": 9.421, |
|
"eval_steps_per_second": 1.581, |
|
"step": 3250 |
|
}, |
|
{ |
|
"epoch": 10.9, |
|
"eval_accuracy": 0.9969356079700724, |
|
"eval_f1": 0.977728593166413, |
|
"eval_loss": 0.016697365790605545, |
|
"eval_precision": 0.9754347226055755, |
|
"eval_recall": 0.9800332778702163, |
|
"eval_runtime": 45.7975, |
|
"eval_samples_per_second": 9.367, |
|
"eval_steps_per_second": 1.572, |
|
"step": 3260 |
|
}, |
|
{ |
|
"epoch": 10.94, |
|
"eval_accuracy": 0.9969223422037091, |
|
"eval_f1": 0.977297895902547, |
|
"eval_loss": 0.016878845170140266, |
|
"eval_precision": 0.9756771697070205, |
|
"eval_recall": 0.9789240155296728, |
|
"eval_runtime": 45.4916, |
|
"eval_samples_per_second": 9.43, |
|
"eval_steps_per_second": 1.583, |
|
"step": 3270 |
|
}, |
|
{ |
|
"epoch": 10.97, |
|
"eval_accuracy": 0.9969223422037091, |
|
"eval_f1": 0.9780052566053397, |
|
"eval_loss": 0.016803227365016937, |
|
"eval_precision": 0.9757107369583218, |
|
"eval_recall": 0.9803105934553522, |
|
"eval_runtime": 45.574, |
|
"eval_samples_per_second": 9.413, |
|
"eval_steps_per_second": 1.58, |
|
"step": 3280 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_accuracy": 0.9969754052691624, |
|
"eval_f1": 0.9811790755604761, |
|
"eval_loss": 0.016553932800889015, |
|
"eval_precision": 0.9792817679558011, |
|
"eval_recall": 0.983083749306711, |
|
"eval_runtime": 45.6533, |
|
"eval_samples_per_second": 9.397, |
|
"eval_steps_per_second": 1.577, |
|
"step": 3290 |
|
}, |
|
{ |
|
"epoch": 11.04, |
|
"eval_accuracy": 0.9971080629327956, |
|
"eval_f1": 0.9845132743362832, |
|
"eval_loss": 0.015565542504191399, |
|
"eval_precision": 0.9817981246552675, |
|
"eval_recall": 0.9872434830837493, |
|
"eval_runtime": 45.6303, |
|
"eval_samples_per_second": 9.402, |
|
"eval_steps_per_second": 1.578, |
|
"step": 3300 |
|
}, |
|
{ |
|
"epoch": 11.07, |
|
"eval_accuracy": 0.9971345944655223, |
|
"eval_f1": 0.9846579129232895, |
|
"eval_loss": 0.014836783520877361, |
|
"eval_precision": 0.981537613667677, |
|
"eval_recall": 0.9877981142540211, |
|
"eval_runtime": 45.5788, |
|
"eval_samples_per_second": 9.412, |
|
"eval_steps_per_second": 1.58, |
|
"step": 3310 |
|
}, |
|
{ |
|
"epoch": 11.1, |
|
"eval_accuracy": 0.9970549998673424, |
|
"eval_f1": 0.9835521769177609, |
|
"eval_loss": 0.015223776921629906, |
|
"eval_precision": 0.9804353816478368, |
|
"eval_recall": 0.9866888519134775, |
|
"eval_runtime": 45.8006, |
|
"eval_samples_per_second": 9.367, |
|
"eval_steps_per_second": 1.572, |
|
"step": 3320 |
|
}, |
|
{ |
|
"epoch": 11.14, |
|
"eval_accuracy": 0.9969754052691624, |
|
"eval_f1": 0.9827133176600746, |
|
"eval_loss": 0.015493294224143028, |
|
"eval_precision": 0.9801379310344828, |
|
"eval_recall": 0.9853022739877981, |
|
"eval_runtime": 46.0713, |
|
"eval_samples_per_second": 9.312, |
|
"eval_steps_per_second": 1.563, |
|
"step": 3330 |
|
}, |
|
{ |
|
"epoch": 11.17, |
|
"eval_accuracy": 0.9970019368018891, |
|
"eval_f1": 0.9827180976081846, |
|
"eval_loss": 0.014980579726397991, |
|
"eval_precision": 0.9798731734215606, |
|
"eval_recall": 0.985579589572934, |
|
"eval_runtime": 45.5835, |
|
"eval_samples_per_second": 9.411, |
|
"eval_steps_per_second": 1.58, |
|
"step": 3340 |
|
}, |
|
{ |
|
"epoch": 11.2, |
|
"eval_accuracy": 0.9970682656337057, |
|
"eval_f1": 0.9840918522617236, |
|
"eval_loss": 0.014826910570263863, |
|
"eval_precision": 0.9817830527187413, |
|
"eval_recall": 0.9864115363283417, |
|
"eval_runtime": 45.5689, |
|
"eval_samples_per_second": 9.414, |
|
"eval_steps_per_second": 1.58, |
|
"step": 3350 |
|
}, |
|
{ |
|
"epoch": 11.24, |
|
"eval_accuracy": 0.9970682656337057, |
|
"eval_f1": 0.983402489626556, |
|
"eval_loss": 0.015205192379653454, |
|
"eval_precision": 0.9809602649006622, |
|
"eval_recall": 0.9858569051580699, |
|
"eval_runtime": 45.5733, |
|
"eval_samples_per_second": 9.413, |
|
"eval_steps_per_second": 1.58, |
|
"step": 3360 |
|
}, |
|
{ |
|
"epoch": 11.27, |
|
"eval_accuracy": 0.9970815314000689, |
|
"eval_f1": 0.9835430784123911, |
|
"eval_loss": 0.015277662314474583, |
|
"eval_precision": 0.9809655172413793, |
|
"eval_recall": 0.9861342207432058, |
|
"eval_runtime": 45.8383, |
|
"eval_samples_per_second": 9.359, |
|
"eval_steps_per_second": 1.571, |
|
"step": 3370 |
|
}, |
|
{ |
|
"epoch": 11.3, |
|
"eval_accuracy": 0.9969090764373458, |
|
"eval_f1": 0.9803921568627452, |
|
"eval_loss": 0.015845883637666702, |
|
"eval_precision": 0.9763476347634763, |
|
"eval_recall": 0.9844703272323905, |
|
"eval_runtime": 45.6768, |
|
"eval_samples_per_second": 9.392, |
|
"eval_steps_per_second": 1.576, |
|
"step": 3380 |
|
}, |
|
{ |
|
"epoch": 11.34, |
|
"eval_accuracy": 0.9968958106709824, |
|
"eval_f1": 0.9808037563872393, |
|
"eval_loss": 0.016353582963347435, |
|
"eval_precision": 0.9768913342503439, |
|
"eval_recall": 0.9847476428175264, |
|
"eval_runtime": 45.6996, |
|
"eval_samples_per_second": 9.387, |
|
"eval_steps_per_second": 1.576, |
|
"step": 3390 |
|
}, |
|
{ |
|
"epoch": 11.37, |
|
"eval_accuracy": 0.9966835584091693, |
|
"eval_f1": 0.9728832318760378, |
|
"eval_loss": 0.01731358841061592, |
|
"eval_precision": 0.9707344008834898, |
|
"eval_recall": 0.9750415973377704, |
|
"eval_runtime": 45.9308, |
|
"eval_samples_per_second": 9.34, |
|
"eval_steps_per_second": 1.568, |
|
"step": 3400 |
|
}, |
|
{ |
|
"epoch": 11.4, |
|
"eval_accuracy": 0.9969090764373458, |
|
"eval_f1": 0.9787116394802323, |
|
"eval_loss": 0.015837378799915314, |
|
"eval_precision": 0.9757442116868799, |
|
"eval_recall": 0.9816971713810316, |
|
"eval_runtime": 45.8585, |
|
"eval_samples_per_second": 9.355, |
|
"eval_steps_per_second": 1.57, |
|
"step": 3410 |
|
}, |
|
{ |
|
"epoch": 11.44, |
|
"eval_accuracy": 0.9968029503064392, |
|
"eval_f1": 0.9741534208707672, |
|
"eval_loss": 0.0164649561047554, |
|
"eval_precision": 0.9710664094791954, |
|
"eval_recall": 0.9772601220188575, |
|
"eval_runtime": 45.5679, |
|
"eval_samples_per_second": 9.415, |
|
"eval_steps_per_second": 1.58, |
|
"step": 3420 |
|
}, |
|
{ |
|
"epoch": 11.47, |
|
"eval_accuracy": 0.9964182430819029, |
|
"eval_f1": 0.9646373595895161, |
|
"eval_loss": 0.017043212428689003, |
|
"eval_precision": 0.9647711511789182, |
|
"eval_recall": 0.9645036051026068, |
|
"eval_runtime": 45.6723, |
|
"eval_samples_per_second": 9.393, |
|
"eval_steps_per_second": 1.576, |
|
"step": 3430 |
|
}, |
|
{ |
|
"epoch": 11.51, |
|
"eval_accuracy": 0.9964182430819029, |
|
"eval_f1": 0.9653643668606262, |
|
"eval_loss": 0.017299339175224304, |
|
"eval_precision": 0.964562569213732, |
|
"eval_recall": 0.9661674986134221, |
|
"eval_runtime": 46.0069, |
|
"eval_samples_per_second": 9.325, |
|
"eval_steps_per_second": 1.565, |
|
"step": 3440 |
|
}, |
|
{ |
|
"epoch": 11.54, |
|
"eval_accuracy": 0.9964713061473561, |
|
"eval_f1": 0.968054211035818, |
|
"eval_loss": 0.01724633388221264, |
|
"eval_precision": 0.9655172413793104, |
|
"eval_recall": 0.9706045479755963, |
|
"eval_runtime": 45.6115, |
|
"eval_samples_per_second": 9.406, |
|
"eval_steps_per_second": 1.579, |
|
"step": 3450 |
|
}, |
|
{ |
|
"epoch": 11.57, |
|
"eval_accuracy": 0.9964845719137194, |
|
"eval_f1": 0.9670724958494743, |
|
"eval_loss": 0.017298314720392227, |
|
"eval_precision": 0.9649364991717283, |
|
"eval_recall": 0.9692179700499168, |
|
"eval_runtime": 45.5306, |
|
"eval_samples_per_second": 9.422, |
|
"eval_steps_per_second": 1.581, |
|
"step": 3460 |
|
}, |
|
{ |
|
"epoch": 11.61, |
|
"eval_accuracy": 0.9967366214746226, |
|
"eval_f1": 0.9718875502008032, |
|
"eval_loss": 0.015642836689949036, |
|
"eval_precision": 0.9706777316735823, |
|
"eval_recall": 0.9731003882418192, |
|
"eval_runtime": 46.9214, |
|
"eval_samples_per_second": 9.143, |
|
"eval_steps_per_second": 1.534, |
|
"step": 3470 |
|
}, |
|
{ |
|
"epoch": 11.64, |
|
"eval_accuracy": 0.9969356079700724, |
|
"eval_f1": 0.9768986028496335, |
|
"eval_loss": 0.015028764493763447, |
|
"eval_precision": 0.9746066795473365, |
|
"eval_recall": 0.9792013311148087, |
|
"eval_runtime": 45.682, |
|
"eval_samples_per_second": 9.391, |
|
"eval_steps_per_second": 1.576, |
|
"step": 3480 |
|
}, |
|
{ |
|
"epoch": 11.67, |
|
"eval_accuracy": 0.9969621395027991, |
|
"eval_f1": 0.9775747508305648, |
|
"eval_loss": 0.015305536799132824, |
|
"eval_precision": 0.9759535655058044, |
|
"eval_recall": 0.9792013311148087, |
|
"eval_runtime": 45.8278, |
|
"eval_samples_per_second": 9.361, |
|
"eval_steps_per_second": 1.571, |
|
"step": 3490 |
|
}, |
|
{ |
|
"epoch": 11.71, |
|
"learning_rate": 6.5000000000000004e-06, |
|
"loss": 0.0042, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 11.71, |
|
"eval_accuracy": 0.9969754052691624, |
|
"eval_f1": 0.9772853185595569, |
|
"eval_loss": 0.015260215848684311, |
|
"eval_precision": 0.9762036524626453, |
|
"eval_recall": 0.978369384359401, |
|
"eval_runtime": 45.5813, |
|
"eval_samples_per_second": 9.412, |
|
"eval_steps_per_second": 1.58, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 11.74, |
|
"eval_accuracy": 0.9971213286991589, |
|
"eval_f1": 0.9785407725321887, |
|
"eval_loss": 0.015263444744050503, |
|
"eval_precision": 0.9770528061929776, |
|
"eval_recall": 0.9800332778702163, |
|
"eval_runtime": 46.1625, |
|
"eval_samples_per_second": 9.293, |
|
"eval_steps_per_second": 1.56, |
|
"step": 3510 |
|
}, |
|
{ |
|
"epoch": 11.77, |
|
"eval_accuracy": 0.9970947971664323, |
|
"eval_f1": 0.9793771626297577, |
|
"eval_loss": 0.01575734093785286, |
|
"eval_precision": 0.9776181265542968, |
|
"eval_recall": 0.9811425402107599, |
|
"eval_runtime": 45.6916, |
|
"eval_samples_per_second": 9.389, |
|
"eval_steps_per_second": 1.576, |
|
"step": 3520 |
|
}, |
|
{ |
|
"epoch": 11.81, |
|
"eval_accuracy": 0.9970682656337057, |
|
"eval_f1": 0.9803541781959049, |
|
"eval_loss": 0.016223162412643433, |
|
"eval_precision": 0.9781888459414688, |
|
"eval_recall": 0.9825291181364393, |
|
"eval_runtime": 45.6681, |
|
"eval_samples_per_second": 9.394, |
|
"eval_steps_per_second": 1.577, |
|
"step": 3530 |
|
}, |
|
{ |
|
"epoch": 11.84, |
|
"eval_accuracy": 0.9970152025682524, |
|
"eval_f1": 0.9794056668970283, |
|
"eval_loss": 0.016862712800502777, |
|
"eval_precision": 0.9763020115734362, |
|
"eval_recall": 0.9825291181364393, |
|
"eval_runtime": 45.8595, |
|
"eval_samples_per_second": 9.355, |
|
"eval_steps_per_second": 1.57, |
|
"step": 3540 |
|
}, |
|
{ |
|
"epoch": 11.87, |
|
"eval_accuracy": 0.9969754052691624, |
|
"eval_f1": 0.9781526548672567, |
|
"eval_loss": 0.016722770407795906, |
|
"eval_precision": 0.9754550468836183, |
|
"eval_recall": 0.980865224625624, |
|
"eval_runtime": 45.6514, |
|
"eval_samples_per_second": 9.397, |
|
"eval_steps_per_second": 1.577, |
|
"step": 3550 |
|
}, |
|
{ |
|
"epoch": 11.91, |
|
"eval_accuracy": 0.997041734100979, |
|
"eval_f1": 0.9792473713337022, |
|
"eval_loss": 0.01629817485809326, |
|
"eval_precision": 0.9770844837106571, |
|
"eval_recall": 0.9814198557958957, |
|
"eval_runtime": 45.6901, |
|
"eval_samples_per_second": 9.389, |
|
"eval_steps_per_second": 1.576, |
|
"step": 3560 |
|
}, |
|
{ |
|
"epoch": 11.94, |
|
"eval_accuracy": 0.9970152025682524, |
|
"eval_f1": 0.9795240730492528, |
|
"eval_loss": 0.01616574078798294, |
|
"eval_precision": 0.97736057426836, |
|
"eval_recall": 0.9816971713810316, |
|
"eval_runtime": 46.0985, |
|
"eval_samples_per_second": 9.306, |
|
"eval_steps_per_second": 1.562, |
|
"step": 3570 |
|
}, |
|
{ |
|
"epoch": 11.97, |
|
"eval_accuracy": 0.9969488737364357, |
|
"eval_f1": 0.9778761061946902, |
|
"eval_loss": 0.01619311049580574, |
|
"eval_precision": 0.9751792608935466, |
|
"eval_recall": 0.9805879090404881, |
|
"eval_runtime": 45.9524, |
|
"eval_samples_per_second": 9.336, |
|
"eval_steps_per_second": 1.567, |
|
"step": 3580 |
|
}, |
|
{ |
|
"epoch": 12.01, |
|
"eval_accuracy": 0.9969886710355257, |
|
"eval_f1": 0.9785822854774078, |
|
"eval_loss": 0.01636885292828083, |
|
"eval_precision": 0.97521343982374, |
|
"eval_recall": 0.9819744869661675, |
|
"eval_runtime": 45.6302, |
|
"eval_samples_per_second": 9.402, |
|
"eval_steps_per_second": 1.578, |
|
"step": 3590 |
|
}, |
|
{ |
|
"epoch": 12.04, |
|
"eval_accuracy": 0.9969886710355257, |
|
"eval_f1": 0.9784470848300635, |
|
"eval_loss": 0.01634366624057293, |
|
"eval_precision": 0.9749449339207048, |
|
"eval_recall": 0.9819744869661675, |
|
"eval_runtime": 45.6457, |
|
"eval_samples_per_second": 9.398, |
|
"eval_steps_per_second": 1.577, |
|
"step": 3600 |
|
}, |
|
{ |
|
"epoch": 12.07, |
|
"eval_accuracy": 0.9969621395027991, |
|
"eval_f1": 0.9776119402985075, |
|
"eval_loss": 0.016408545896410942, |
|
"eval_precision": 0.9743801652892562, |
|
"eval_recall": 0.980865224625624, |
|
"eval_runtime": 46.0467, |
|
"eval_samples_per_second": 9.317, |
|
"eval_steps_per_second": 1.564, |
|
"step": 3610 |
|
}, |
|
{ |
|
"epoch": 12.11, |
|
"eval_accuracy": 0.9971345944655223, |
|
"eval_f1": 0.9778822228366049, |
|
"eval_loss": 0.01554455328732729, |
|
"eval_precision": 0.9749173098125689, |
|
"eval_recall": 0.980865224625624, |
|
"eval_runtime": 45.8672, |
|
"eval_samples_per_second": 9.353, |
|
"eval_steps_per_second": 1.57, |
|
"step": 3620 |
|
}, |
|
{ |
|
"epoch": 12.14, |
|
"eval_accuracy": 0.9971743917646122, |
|
"eval_f1": 0.9781284606866002, |
|
"eval_loss": 0.015367398969829082, |
|
"eval_precision": 0.9765063571033721, |
|
"eval_recall": 0.9797559622850804, |
|
"eval_runtime": 45.8306, |
|
"eval_samples_per_second": 9.361, |
|
"eval_steps_per_second": 1.571, |
|
"step": 3630 |
|
}, |
|
{ |
|
"epoch": 12.17, |
|
"eval_accuracy": 0.9970815314000689, |
|
"eval_f1": 0.9784172661870504, |
|
"eval_loss": 0.016077237203717232, |
|
"eval_precision": 0.9762562120375483, |
|
"eval_recall": 0.9805879090404881, |
|
"eval_runtime": 45.7148, |
|
"eval_samples_per_second": 9.384, |
|
"eval_steps_per_second": 1.575, |
|
"step": 3640 |
|
}, |
|
{ |
|
"epoch": 12.21, |
|
"eval_accuracy": 0.9968825449046191, |
|
"eval_f1": 0.9757986447241046, |
|
"eval_loss": 0.016824740916490555, |
|
"eval_precision": 0.9732413793103448, |
|
"eval_recall": 0.978369384359401, |
|
"eval_runtime": 46.1214, |
|
"eval_samples_per_second": 9.302, |
|
"eval_steps_per_second": 1.561, |
|
"step": 3650 |
|
}, |
|
{ |
|
"epoch": 12.24, |
|
"eval_accuracy": 0.9969223422037091, |
|
"eval_f1": 0.978146611341632, |
|
"eval_loss": 0.016822459176182747, |
|
"eval_precision": 0.9757174392935982, |
|
"eval_recall": 0.9805879090404881, |
|
"eval_runtime": 45.7927, |
|
"eval_samples_per_second": 9.368, |
|
"eval_steps_per_second": 1.572, |
|
"step": 3660 |
|
}, |
|
{ |
|
"epoch": 12.27, |
|
"eval_accuracy": 0.9968825449046191, |
|
"eval_f1": 0.9792588495575221, |
|
"eval_loss": 0.01815040595829487, |
|
"eval_precision": 0.9765581908439052, |
|
"eval_recall": 0.9819744869661675, |
|
"eval_runtime": 45.8912, |
|
"eval_samples_per_second": 9.348, |
|
"eval_steps_per_second": 1.569, |
|
"step": 3670 |
|
}, |
|
{ |
|
"epoch": 12.31, |
|
"eval_accuracy": 0.9967764187737126, |
|
"eval_f1": 0.9788586430841509, |
|
"eval_loss": 0.01881832629442215, |
|
"eval_precision": 0.9754888460479206, |
|
"eval_recall": 0.9822518025513034, |
|
"eval_runtime": 46.0893, |
|
"eval_samples_per_second": 9.308, |
|
"eval_steps_per_second": 1.562, |
|
"step": 3680 |
|
}, |
|
{ |
|
"epoch": 12.34, |
|
"eval_accuracy": 0.9968294818391659, |
|
"eval_f1": 0.976892209768922, |
|
"eval_loss": 0.017492154613137245, |
|
"eval_precision": 0.9748688207677437, |
|
"eval_recall": 0.9789240155296728, |
|
"eval_runtime": 45.8024, |
|
"eval_samples_per_second": 9.366, |
|
"eval_steps_per_second": 1.572, |
|
"step": 3690 |
|
}, |
|
{ |
|
"epoch": 12.37, |
|
"eval_accuracy": 0.9966172295773527, |
|
"eval_f1": 0.9710806697108068, |
|
"eval_loss": 0.018154501914978027, |
|
"eval_precision": 0.9690693178679922, |
|
"eval_recall": 0.9731003882418192, |
|
"eval_runtime": 46.0834, |
|
"eval_samples_per_second": 9.309, |
|
"eval_steps_per_second": 1.562, |
|
"step": 3700 |
|
}, |
|
{ |
|
"epoch": 12.41, |
|
"eval_accuracy": 0.9962457881191796, |
|
"eval_f1": 0.9614745011086475, |
|
"eval_loss": 0.01924285851418972, |
|
"eval_precision": 0.9609418282548476, |
|
"eval_recall": 0.9620077648363838, |
|
"eval_runtime": 45.696, |
|
"eval_samples_per_second": 9.388, |
|
"eval_steps_per_second": 1.576, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 12.44, |
|
"eval_accuracy": 0.9964580403809928, |
|
"eval_f1": 0.9651259341267644, |
|
"eval_loss": 0.017841314896941185, |
|
"eval_precision": 0.9632596685082873, |
|
"eval_recall": 0.9669994453688298, |
|
"eval_runtime": 45.9939, |
|
"eval_samples_per_second": 9.327, |
|
"eval_steps_per_second": 1.565, |
|
"step": 3720 |
|
}, |
|
{ |
|
"epoch": 12.47, |
|
"eval_accuracy": 0.9966304953437161, |
|
"eval_f1": 0.970962389380531, |
|
"eval_loss": 0.016754455864429474, |
|
"eval_precision": 0.968284611141754, |
|
"eval_recall": 0.973655019412091, |
|
"eval_runtime": 45.8171, |
|
"eval_samples_per_second": 9.363, |
|
"eval_steps_per_second": 1.571, |
|
"step": 3730 |
|
}, |
|
{ |
|
"epoch": 12.51, |
|
"eval_accuracy": 0.9968294818391659, |
|
"eval_f1": 0.9774269491760144, |
|
"eval_loss": 0.015923812985420227, |
|
"eval_precision": 0.9762102351313969, |
|
"eval_recall": 0.9786466999445369, |
|
"eval_runtime": 45.7801, |
|
"eval_samples_per_second": 9.371, |
|
"eval_steps_per_second": 1.573, |
|
"step": 3740 |
|
}, |
|
{ |
|
"epoch": 12.54, |
|
"eval_accuracy": 0.9968825449046191, |
|
"eval_f1": 0.9772916089725838, |
|
"eval_loss": 0.015936698764562607, |
|
"eval_precision": 0.9759402654867256, |
|
"eval_recall": 0.9786466999445369, |
|
"eval_runtime": 45.9975, |
|
"eval_samples_per_second": 9.327, |
|
"eval_steps_per_second": 1.565, |
|
"step": 3750 |
|
}, |
|
{ |
|
"epoch": 12.58, |
|
"eval_accuracy": 0.9968029503064392, |
|
"eval_f1": 0.9736623232603271, |
|
"eval_loss": 0.016157541424036026, |
|
"eval_precision": 0.9733924611973392, |
|
"eval_recall": 0.9739323349972269, |
|
"eval_runtime": 45.7117, |
|
"eval_samples_per_second": 9.385, |
|
"eval_steps_per_second": 1.575, |
|
"step": 3760 |
|
}, |
|
{ |
|
"epoch": 12.61, |
|
"eval_accuracy": 0.9967366214746226, |
|
"eval_f1": 0.9694117647058823, |
|
"eval_loss": 0.01580197736620903, |
|
"eval_precision": 0.9676706272450953, |
|
"eval_recall": 0.971159179145868, |
|
"eval_runtime": 45.5828, |
|
"eval_samples_per_second": 9.411, |
|
"eval_steps_per_second": 1.58, |
|
"step": 3770 |
|
}, |
|
{ |
|
"epoch": 12.64, |
|
"eval_accuracy": 0.9969090764373458, |
|
"eval_f1": 0.971460238293156, |
|
"eval_loss": 0.015100532211363316, |
|
"eval_precision": 0.9706533776301218, |
|
"eval_recall": 0.9722684414864116, |
|
"eval_runtime": 45.7142, |
|
"eval_samples_per_second": 9.384, |
|
"eval_steps_per_second": 1.575, |
|
"step": 3780 |
|
}, |
|
{ |
|
"epoch": 12.68, |
|
"eval_accuracy": 0.9969488737364357, |
|
"eval_f1": 0.9725609756097561, |
|
"eval_loss": 0.015240387991070747, |
|
"eval_precision": 0.97202216066482, |
|
"eval_recall": 0.9731003882418192, |
|
"eval_runtime": 46.103, |
|
"eval_samples_per_second": 9.305, |
|
"eval_steps_per_second": 1.562, |
|
"step": 3790 |
|
}, |
|
{ |
|
"epoch": 12.71, |
|
"eval_accuracy": 0.9970284683346157, |
|
"eval_f1": 0.9779991697799916, |
|
"eval_loss": 0.015490233898162842, |
|
"eval_precision": 0.975973487986744, |
|
"eval_recall": 0.9800332778702163, |
|
"eval_runtime": 45.7054, |
|
"eval_samples_per_second": 9.386, |
|
"eval_steps_per_second": 1.575, |
|
"step": 3800 |
|
}, |
|
{ |
|
"epoch": 12.74, |
|
"eval_accuracy": 0.9971213286991589, |
|
"eval_f1": 0.980060924951537, |
|
"eval_loss": 0.014931376092135906, |
|
"eval_precision": 0.9787057522123894, |
|
"eval_recall": 0.9814198557958957, |
|
"eval_runtime": 45.8361, |
|
"eval_samples_per_second": 9.359, |
|
"eval_steps_per_second": 1.571, |
|
"step": 3810 |
|
}, |
|
{ |
|
"epoch": 12.78, |
|
"eval_accuracy": 0.9970947971664323, |
|
"eval_f1": 0.9769764216366158, |
|
"eval_loss": 0.013774119317531586, |
|
"eval_precision": 0.9772475027746947, |
|
"eval_recall": 0.9767054908485857, |
|
"eval_runtime": 46.4293, |
|
"eval_samples_per_second": 9.24, |
|
"eval_steps_per_second": 1.551, |
|
"step": 3820 |
|
}, |
|
{ |
|
"epoch": 12.81, |
|
"eval_accuracy": 0.9971611259982489, |
|
"eval_f1": 0.9775436650956474, |
|
"eval_loss": 0.01355548482388258, |
|
"eval_precision": 0.9772727272727273, |
|
"eval_recall": 0.9778147531891292, |
|
"eval_runtime": 45.7415, |
|
"eval_samples_per_second": 9.379, |
|
"eval_steps_per_second": 1.574, |
|
"step": 3830 |
|
}, |
|
{ |
|
"epoch": 12.84, |
|
"eval_accuracy": 0.9973335809609721, |
|
"eval_f1": 0.9824124082537044, |
|
"eval_loss": 0.013703616335988045, |
|
"eval_precision": 0.9811894882434301, |
|
"eval_recall": 0.9836383804769828, |
|
"eval_runtime": 45.73, |
|
"eval_samples_per_second": 9.381, |
|
"eval_steps_per_second": 1.574, |
|
"step": 3840 |
|
}, |
|
{ |
|
"epoch": 12.88, |
|
"eval_accuracy": 0.9973601124936987, |
|
"eval_f1": 0.9812102790826194, |
|
"eval_loss": 0.014531377702951431, |
|
"eval_precision": 0.9776982378854625, |
|
"eval_recall": 0.9847476428175264, |
|
"eval_runtime": 45.7852, |
|
"eval_samples_per_second": 9.37, |
|
"eval_steps_per_second": 1.573, |
|
"step": 3850 |
|
}, |
|
{ |
|
"epoch": 12.91, |
|
"eval_accuracy": 0.9968427476055292, |
|
"eval_f1": 0.977526540741762, |
|
"eval_loss": 0.016427284106612206, |
|
"eval_precision": 0.9720318069646284, |
|
"eval_recall": 0.983083749306711, |
|
"eval_runtime": 45.8438, |
|
"eval_samples_per_second": 9.358, |
|
"eval_steps_per_second": 1.571, |
|
"step": 3860 |
|
}, |
|
{ |
|
"epoch": 12.94, |
|
"eval_accuracy": 0.9960202700910031, |
|
"eval_f1": 0.9653931339977851, |
|
"eval_loss": 0.021676059812307358, |
|
"eval_precision": 0.9637921503593145, |
|
"eval_recall": 0.9669994453688298, |
|
"eval_runtime": 45.7888, |
|
"eval_samples_per_second": 9.369, |
|
"eval_steps_per_second": 1.572, |
|
"step": 3870 |
|
}, |
|
{ |
|
"epoch": 12.98, |
|
"eval_accuracy": 0.9967498872409859, |
|
"eval_f1": 0.9777900400055181, |
|
"eval_loss": 0.018003830686211586, |
|
"eval_precision": 0.9728245951139171, |
|
"eval_recall": 0.9828064337215752, |
|
"eval_runtime": 45.7325, |
|
"eval_samples_per_second": 9.381, |
|
"eval_steps_per_second": 1.574, |
|
"step": 3880 |
|
}, |
|
{ |
|
"epoch": 13.01, |
|
"eval_accuracy": 0.9968692791382558, |
|
"eval_f1": 0.977667493796526, |
|
"eval_loss": 0.01754719577729702, |
|
"eval_precision": 0.9720394736842105, |
|
"eval_recall": 0.9833610648918469, |
|
"eval_runtime": 46.1857, |
|
"eval_samples_per_second": 9.289, |
|
"eval_steps_per_second": 1.559, |
|
"step": 3890 |
|
}, |
|
{ |
|
"epoch": 13.04, |
|
"eval_accuracy": 0.9967631530073492, |
|
"eval_f1": 0.9739274382673472, |
|
"eval_loss": 0.01792616955935955, |
|
"eval_precision": 0.96898160856437, |
|
"eval_recall": 0.9789240155296728, |
|
"eval_runtime": 45.7326, |
|
"eval_samples_per_second": 9.381, |
|
"eval_steps_per_second": 1.574, |
|
"step": 3900 |
|
}, |
|
{ |
|
"epoch": 13.08, |
|
"eval_accuracy": 0.9967631530073492, |
|
"eval_f1": 0.9729431253451133, |
|
"eval_loss": 0.017918290570378304, |
|
"eval_precision": 0.9686641011544805, |
|
"eval_recall": 0.9772601220188575, |
|
"eval_runtime": 46.0978, |
|
"eval_samples_per_second": 9.306, |
|
"eval_steps_per_second": 1.562, |
|
"step": 3910 |
|
}, |
|
{ |
|
"epoch": 13.11, |
|
"eval_accuracy": 0.9968692791382558, |
|
"eval_f1": 0.9765323025952513, |
|
"eval_loss": 0.017354754731059074, |
|
"eval_precision": 0.9722374931280924, |
|
"eval_recall": 0.980865224625624, |
|
"eval_runtime": 46.21, |
|
"eval_samples_per_second": 9.284, |
|
"eval_steps_per_second": 1.558, |
|
"step": 3920 |
|
}, |
|
{ |
|
"epoch": 13.14, |
|
"eval_accuracy": 0.9969356079700724, |
|
"eval_f1": 0.9775017253278124, |
|
"eval_loss": 0.015932898968458176, |
|
"eval_precision": 0.9730695245946689, |
|
"eval_recall": 0.9819744869661675, |
|
"eval_runtime": 45.7375, |
|
"eval_samples_per_second": 9.38, |
|
"eval_steps_per_second": 1.574, |
|
"step": 3930 |
|
}, |
|
{ |
|
"epoch": 13.18, |
|
"eval_accuracy": 0.9969090764373458, |
|
"eval_f1": 0.9779005524861878, |
|
"eval_loss": 0.015960365533828735, |
|
"eval_precision": 0.9741331865712713, |
|
"eval_recall": 0.9816971713810316, |
|
"eval_runtime": 45.8882, |
|
"eval_samples_per_second": 9.349, |
|
"eval_steps_per_second": 1.569, |
|
"step": 3940 |
|
}, |
|
{ |
|
"epoch": 13.21, |
|
"eval_accuracy": 0.9967498872409859, |
|
"eval_f1": 0.9737569060773481, |
|
"eval_loss": 0.017051612958312035, |
|
"eval_precision": 0.9700055035773253, |
|
"eval_recall": 0.9775374376039934, |
|
"eval_runtime": 45.8012, |
|
"eval_samples_per_second": 9.367, |
|
"eval_steps_per_second": 1.572, |
|
"step": 3950 |
|
}, |
|
{ |
|
"epoch": 13.24, |
|
"eval_accuracy": 0.9966702926428059, |
|
"eval_f1": 0.9723527785457561, |
|
"eval_loss": 0.01766437292098999, |
|
"eval_precision": 0.9694046306504961, |
|
"eval_recall": 0.9753189129229063, |
|
"eval_runtime": 45.8759, |
|
"eval_samples_per_second": 9.351, |
|
"eval_steps_per_second": 1.569, |
|
"step": 3960 |
|
}, |
|
{ |
|
"epoch": 13.28, |
|
"eval_accuracy": 0.9966570268764426, |
|
"eval_f1": 0.9727411097274111, |
|
"eval_loss": 0.01822058856487274, |
|
"eval_precision": 0.9707263186964927, |
|
"eval_recall": 0.9747642817526345, |
|
"eval_runtime": 45.8529, |
|
"eval_samples_per_second": 9.356, |
|
"eval_steps_per_second": 1.57, |
|
"step": 3970 |
|
}, |
|
{ |
|
"epoch": 13.31, |
|
"eval_accuracy": 0.9966304953437161, |
|
"eval_f1": 0.9724872113922302, |
|
"eval_loss": 0.01849460043013096, |
|
"eval_precision": 0.9696719051557762, |
|
"eval_recall": 0.9753189129229063, |
|
"eval_runtime": 45.7611, |
|
"eval_samples_per_second": 9.375, |
|
"eval_steps_per_second": 1.573, |
|
"step": 3980 |
|
}, |
|
{ |
|
"epoch": 13.34, |
|
"eval_accuracy": 0.9968427476055292, |
|
"eval_f1": 0.9780417069465543, |
|
"eval_loss": 0.017539281398057938, |
|
"eval_precision": 0.9741403026134801, |
|
"eval_recall": 0.9819744869661675, |
|
"eval_runtime": 46.0339, |
|
"eval_samples_per_second": 9.319, |
|
"eval_steps_per_second": 1.564, |
|
"step": 3990 |
|
}, |
|
{ |
|
"epoch": 13.38, |
|
"learning_rate": 6e-06, |
|
"loss": 0.0037, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 13.38, |
|
"eval_accuracy": 0.9968958106709824, |
|
"eval_f1": 0.9792874896437448, |
|
"eval_loss": 0.017371075227856636, |
|
"eval_precision": 0.9752475247524752, |
|
"eval_recall": 0.9833610648918469, |
|
"eval_runtime": 45.7746, |
|
"eval_samples_per_second": 9.372, |
|
"eval_steps_per_second": 1.573, |
|
"step": 4000 |
|
} |
|
], |
|
"max_steps": 10000, |
|
"num_train_epochs": 34, |
|
"total_flos": 6370581676032000.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|