|
{ |
|
"best_metric": 0.8450403429578367, |
|
"best_model_checkpoint": "result/my-unsup-simcse-bert-base-uncased/SupCon-48-0.01-2e-7-0.07-0.00", |
|
"epoch": 1.0, |
|
"global_step": 15626, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.01, |
|
"eval_avg_sts": 0.6273981488926212, |
|
"eval_sickr_spearman": 0.6211010277251597, |
|
"eval_stsb_spearman": 0.6336952700600829, |
|
"step": 125 |
|
}, |
|
{ |
|
"epoch": 0.02, |
|
"eval_avg_sts": 0.6557459351486706, |
|
"eval_sickr_spearman": 0.6424095455671641, |
|
"eval_stsb_spearman": 0.6690823247301771, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 0.02, |
|
"eval_avg_sts": 0.709441256238345, |
|
"eval_sickr_spearman": 0.6938704999278709, |
|
"eval_stsb_spearman": 0.7250120125488192, |
|
"step": 375 |
|
}, |
|
{ |
|
"epoch": 0.03, |
|
"learning_rate": 2.9040061436068092e-05, |
|
"loss": 0.0093, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.03, |
|
"eval_avg_sts": 0.745161269369824, |
|
"eval_sickr_spearman": 0.7196067168248462, |
|
"eval_stsb_spearman": 0.7707158219148017, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.04, |
|
"eval_avg_sts": 0.7476897637271698, |
|
"eval_sickr_spearman": 0.7177654445512162, |
|
"eval_stsb_spearman": 0.7776140829031234, |
|
"step": 625 |
|
}, |
|
{ |
|
"epoch": 0.05, |
|
"eval_avg_sts": 0.7524926746389684, |
|
"eval_sickr_spearman": 0.7211576410902829, |
|
"eval_stsb_spearman": 0.7838277081876538, |
|
"step": 750 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"eval_avg_sts": 0.7584753747432835, |
|
"eval_sickr_spearman": 0.7179680397370821, |
|
"eval_stsb_spearman": 0.7989827097494849, |
|
"step": 875 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"learning_rate": 2.8080122872136184e-05, |
|
"loss": 0.0003, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"eval_avg_sts": 0.7586746687828863, |
|
"eval_sickr_spearman": 0.718746960109104, |
|
"eval_stsb_spearman": 0.7986023774566684, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.07, |
|
"eval_avg_sts": 0.7574999857715704, |
|
"eval_sickr_spearman": 0.7175820618059254, |
|
"eval_stsb_spearman": 0.7974179097372154, |
|
"step": 1125 |
|
}, |
|
{ |
|
"epoch": 0.08, |
|
"eval_avg_sts": 0.7696978971940565, |
|
"eval_sickr_spearman": 0.7239500252345904, |
|
"eval_stsb_spearman": 0.8154457691535225, |
|
"step": 1250 |
|
}, |
|
{ |
|
"epoch": 0.09, |
|
"eval_avg_sts": 0.7711009245923006, |
|
"eval_sickr_spearman": 0.7253843780168369, |
|
"eval_stsb_spearman": 0.8168174711677644, |
|
"step": 1375 |
|
}, |
|
{ |
|
"epoch": 0.1, |
|
"learning_rate": 2.7120184308204276e-05, |
|
"loss": 0.0001, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 0.1, |
|
"eval_avg_sts": 0.7722992846813606, |
|
"eval_sickr_spearman": 0.7252976338476396, |
|
"eval_stsb_spearman": 0.8193009355150815, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 0.1, |
|
"eval_avg_sts": 0.773722019273226, |
|
"eval_sickr_spearman": 0.7276583624833227, |
|
"eval_stsb_spearman": 0.8197856760631294, |
|
"step": 1625 |
|
}, |
|
{ |
|
"epoch": 0.11, |
|
"eval_avg_sts": 0.7734992972011999, |
|
"eval_sickr_spearman": 0.7251570468137302, |
|
"eval_stsb_spearman": 0.8218415475886697, |
|
"step": 1750 |
|
}, |
|
{ |
|
"epoch": 0.12, |
|
"eval_avg_sts": 0.772300977896672, |
|
"eval_sickr_spearman": 0.7260308286110924, |
|
"eval_stsb_spearman": 0.8185711271822516, |
|
"step": 1875 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"learning_rate": 2.6160245744272367e-05, |
|
"loss": 0.0001, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"eval_avg_sts": 0.7741215013840628, |
|
"eval_sickr_spearman": 0.7290128395438775, |
|
"eval_stsb_spearman": 0.8192301632242479, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 0.14, |
|
"eval_avg_sts": 0.7845043729289752, |
|
"eval_sickr_spearman": 0.7357584234920489, |
|
"eval_stsb_spearman": 0.8332503223659016, |
|
"step": 2125 |
|
}, |
|
{ |
|
"epoch": 0.14, |
|
"eval_avg_sts": 0.7824068340883688, |
|
"eval_sickr_spearman": 0.7413625963456452, |
|
"eval_stsb_spearman": 0.8234510718310922, |
|
"step": 2250 |
|
}, |
|
{ |
|
"epoch": 0.15, |
|
"eval_avg_sts": 0.7801565471575205, |
|
"eval_sickr_spearman": 0.7272591759992707, |
|
"eval_stsb_spearman": 0.8330539183157702, |
|
"step": 2375 |
|
}, |
|
{ |
|
"epoch": 0.16, |
|
"learning_rate": 2.5200307180340456e-05, |
|
"loss": 0.0001, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 0.16, |
|
"eval_avg_sts": 0.7817040476834756, |
|
"eval_sickr_spearman": 0.7317218416960886, |
|
"eval_stsb_spearman": 0.8316862536708627, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 0.17, |
|
"eval_avg_sts": 0.7834051453081208, |
|
"eval_sickr_spearman": 0.7332758879831186, |
|
"eval_stsb_spearman": 0.8335344026331228, |
|
"step": 2625 |
|
}, |
|
{ |
|
"epoch": 0.18, |
|
"eval_avg_sts": 0.7846122957465609, |
|
"eval_sickr_spearman": 0.737042534988997, |
|
"eval_stsb_spearman": 0.8321820565041248, |
|
"step": 2750 |
|
}, |
|
{ |
|
"epoch": 0.18, |
|
"eval_avg_sts": 0.7930382359535035, |
|
"eval_sickr_spearman": 0.7410361289491703, |
|
"eval_stsb_spearman": 0.8450403429578367, |
|
"step": 2875 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"learning_rate": 2.424036861640855e-05, |
|
"loss": 0.0001, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"eval_avg_sts": 0.784546743206133, |
|
"eval_sickr_spearman": 0.7335979365182612, |
|
"eval_stsb_spearman": 0.8354955498940048, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"eval_avg_sts": 0.7879357699638411, |
|
"eval_sickr_spearman": 0.7380969137277664, |
|
"eval_stsb_spearman": 0.8377746261999157, |
|
"step": 3125 |
|
}, |
|
{ |
|
"epoch": 0.21, |
|
"eval_avg_sts": 0.7885921401422298, |
|
"eval_sickr_spearman": 0.7360949774198258, |
|
"eval_stsb_spearman": 0.8410893028646337, |
|
"step": 3250 |
|
}, |
|
{ |
|
"epoch": 0.22, |
|
"eval_avg_sts": 0.7886813707449458, |
|
"eval_sickr_spearman": 0.7360677437853104, |
|
"eval_stsb_spearman": 0.8412949977045814, |
|
"step": 3375 |
|
}, |
|
{ |
|
"epoch": 0.22, |
|
"learning_rate": 2.3280430052476642e-05, |
|
"loss": 0.0002, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 0.22, |
|
"eval_avg_sts": 0.7885894531415549, |
|
"eval_sickr_spearman": 0.7365915229464931, |
|
"eval_stsb_spearman": 0.8405873833366166, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 0.23, |
|
"eval_avg_sts": 0.7907895913811233, |
|
"eval_sickr_spearman": 0.7414235958444714, |
|
"eval_stsb_spearman": 0.8401555869177751, |
|
"step": 3625 |
|
}, |
|
{ |
|
"epoch": 0.24, |
|
"eval_avg_sts": 0.7899099014596336, |
|
"eval_sickr_spearman": 0.7422593370094946, |
|
"eval_stsb_spearman": 0.8375604659097725, |
|
"step": 3750 |
|
}, |
|
{ |
|
"epoch": 0.25, |
|
"eval_avg_sts": 0.781954087673714, |
|
"eval_sickr_spearman": 0.7436439776017526, |
|
"eval_stsb_spearman": 0.8202641977456754, |
|
"step": 3875 |
|
}, |
|
{ |
|
"epoch": 0.26, |
|
"learning_rate": 2.2320491488544734e-05, |
|
"loss": 0.0001, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 0.26, |
|
"eval_avg_sts": 0.7846807378527296, |
|
"eval_sickr_spearman": 0.743132158184828, |
|
"eval_stsb_spearman": 0.8262293175206311, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 0.26, |
|
"eval_avg_sts": 0.7825345568897543, |
|
"eval_sickr_spearman": 0.7449149766080079, |
|
"eval_stsb_spearman": 0.8201541371715007, |
|
"step": 4125 |
|
}, |
|
{ |
|
"epoch": 0.27, |
|
"eval_avg_sts": 0.7860788226540287, |
|
"eval_sickr_spearman": 0.7454807349518474, |
|
"eval_stsb_spearman": 0.8266769103562102, |
|
"step": 4250 |
|
}, |
|
{ |
|
"epoch": 0.28, |
|
"eval_avg_sts": 0.7867018278295852, |
|
"eval_sickr_spearman": 0.7445308238587058, |
|
"eval_stsb_spearman": 0.8288728318004647, |
|
"step": 4375 |
|
}, |
|
{ |
|
"epoch": 0.29, |
|
"learning_rate": 2.1360552924612826e-05, |
|
"loss": 0.0001, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 0.29, |
|
"eval_avg_sts": 0.776783766738095, |
|
"eval_sickr_spearman": 0.7318758294072991, |
|
"eval_stsb_spearman": 0.8216917040688909, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"eval_avg_sts": 0.7675528732476737, |
|
"eval_sickr_spearman": 0.7320309698649442, |
|
"eval_stsb_spearman": 0.8030747766304034, |
|
"step": 4625 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"eval_avg_sts": 0.7715011023405255, |
|
"eval_sickr_spearman": 0.7350243641687703, |
|
"eval_stsb_spearman": 0.8079778405122807, |
|
"step": 4750 |
|
}, |
|
{ |
|
"epoch": 0.31, |
|
"eval_avg_sts": 0.7687077375569937, |
|
"eval_sickr_spearman": 0.7408402100864042, |
|
"eval_stsb_spearman": 0.7965752650275834, |
|
"step": 4875 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"learning_rate": 2.0400614360680917e-05, |
|
"loss": 0.0001, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"eval_avg_sts": 0.7738965818092367, |
|
"eval_sickr_spearman": 0.7445124279468551, |
|
"eval_stsb_spearman": 0.8032807356716183, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 0.33, |
|
"eval_avg_sts": 0.7793196132942312, |
|
"eval_sickr_spearman": 0.7457236762629214, |
|
"eval_stsb_spearman": 0.812915550325541, |
|
"step": 5125 |
|
}, |
|
{ |
|
"epoch": 0.34, |
|
"eval_avg_sts": 0.7836274650846277, |
|
"eval_sickr_spearman": 0.7464208957313971, |
|
"eval_stsb_spearman": 0.8208340344378582, |
|
"step": 5250 |
|
}, |
|
{ |
|
"epoch": 0.34, |
|
"eval_avg_sts": 0.7826458926642379, |
|
"eval_sickr_spearman": 0.7464102328268778, |
|
"eval_stsb_spearman": 0.818881552501598, |
|
"step": 5375 |
|
}, |
|
{ |
|
"epoch": 0.35, |
|
"learning_rate": 1.944067579674901e-05, |
|
"loss": 0.0001, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 0.35, |
|
"eval_avg_sts": 0.7837446296343489, |
|
"eval_sickr_spearman": 0.7486399806489393, |
|
"eval_stsb_spearman": 0.8188492786197583, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 0.36, |
|
"eval_avg_sts": 0.7830869728965355, |
|
"eval_sickr_spearman": 0.7479103882180944, |
|
"eval_stsb_spearman": 0.8182635575749767, |
|
"step": 5625 |
|
}, |
|
{ |
|
"epoch": 0.37, |
|
"eval_avg_sts": 0.783785645301962, |
|
"eval_sickr_spearman": 0.7470566353900319, |
|
"eval_stsb_spearman": 0.8205146552138923, |
|
"step": 5750 |
|
}, |
|
{ |
|
"epoch": 0.38, |
|
"eval_avg_sts": 0.7841049239457296, |
|
"eval_sickr_spearman": 0.7275643656178084, |
|
"eval_stsb_spearman": 0.8406454822736508, |
|
"step": 5875 |
|
}, |
|
{ |
|
"epoch": 0.38, |
|
"learning_rate": 1.84807372328171e-05, |
|
"loss": 0.0001, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 0.38, |
|
"eval_avg_sts": 0.7827015978431489, |
|
"eval_sickr_spearman": 0.7361094828124602, |
|
"eval_stsb_spearman": 0.8292937128738374, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"eval_avg_sts": 0.7835582939326338, |
|
"eval_sickr_spearman": 0.7403639336845438, |
|
"eval_stsb_spearman": 0.8267526541807237, |
|
"step": 6125 |
|
}, |
|
{ |
|
"epoch": 0.4, |
|
"eval_avg_sts": 0.7833004559230021, |
|
"eval_sickr_spearman": 0.7409274345666157, |
|
"eval_stsb_spearman": 0.8256734772793887, |
|
"step": 6250 |
|
}, |
|
{ |
|
"epoch": 0.41, |
|
"eval_avg_sts": 0.783274693136238, |
|
"eval_sickr_spearman": 0.7396373672130896, |
|
"eval_stsb_spearman": 0.8269120190593864, |
|
"step": 6375 |
|
}, |
|
{ |
|
"epoch": 0.42, |
|
"learning_rate": 1.7520798668885192e-05, |
|
"loss": 0.0, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 0.42, |
|
"eval_avg_sts": 0.7844400031801044, |
|
"eval_sickr_spearman": 0.7315539729965624, |
|
"eval_stsb_spearman": 0.8373260333636465, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 0.42, |
|
"eval_avg_sts": 0.7830541155839421, |
|
"eval_sickr_spearman": 0.7372136217723195, |
|
"eval_stsb_spearman": 0.8288946093955648, |
|
"step": 6625 |
|
}, |
|
{ |
|
"epoch": 0.43, |
|
"eval_avg_sts": 0.7788362702655598, |
|
"eval_sickr_spearman": 0.7408482312803444, |
|
"eval_stsb_spearman": 0.8168243092507751, |
|
"step": 6750 |
|
}, |
|
{ |
|
"epoch": 0.44, |
|
"eval_avg_sts": 0.7825535757514819, |
|
"eval_sickr_spearman": 0.7452765067085325, |
|
"eval_stsb_spearman": 0.8198306447944311, |
|
"step": 6875 |
|
}, |
|
{ |
|
"epoch": 0.45, |
|
"learning_rate": 1.6560860104953284e-05, |
|
"loss": 0.0002, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 0.45, |
|
"eval_avg_sts": 0.7831901309892826, |
|
"eval_sickr_spearman": 0.7458346761383449, |
|
"eval_stsb_spearman": 0.8205455858402203, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 0.46, |
|
"eval_avg_sts": 0.7829404428906377, |
|
"eval_sickr_spearman": 0.7454985064593795, |
|
"eval_stsb_spearman": 0.8203823793218957, |
|
"step": 7125 |
|
}, |
|
{ |
|
"epoch": 0.46, |
|
"eval_avg_sts": 0.7827889218134074, |
|
"eval_sickr_spearman": 0.7466705133655709, |
|
"eval_stsb_spearman": 0.8189073302612438, |
|
"step": 7250 |
|
}, |
|
{ |
|
"epoch": 0.47, |
|
"eval_avg_sts": 0.7388870312908111, |
|
"eval_sickr_spearman": 0.7199674303966463, |
|
"eval_stsb_spearman": 0.7578066321849759, |
|
"step": 7375 |
|
}, |
|
{ |
|
"epoch": 0.48, |
|
"learning_rate": 1.5600921541021372e-05, |
|
"loss": 0.0001, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 0.48, |
|
"eval_avg_sts": 0.7359950441852947, |
|
"eval_sickr_spearman": 0.7141863589964538, |
|
"eval_stsb_spearman": 0.7578037293741355, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 0.49, |
|
"eval_avg_sts": 0.7514533824270638, |
|
"eval_sickr_spearman": 0.7285877642961502, |
|
"eval_stsb_spearman": 0.7743190005579774, |
|
"step": 7625 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"eval_avg_sts": 0.7601125755242234, |
|
"eval_sickr_spearman": 0.7424667353055044, |
|
"eval_stsb_spearman": 0.7777584157429424, |
|
"step": 7750 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"eval_avg_sts": 0.7621753865509604, |
|
"eval_sickr_spearman": 0.7417763842845344, |
|
"eval_stsb_spearman": 0.7825743888173865, |
|
"step": 7875 |
|
}, |
|
{ |
|
"epoch": 0.51, |
|
"learning_rate": 1.4640982977089467e-05, |
|
"loss": 0.0001, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 0.51, |
|
"eval_avg_sts": 0.765106348392491, |
|
"eval_sickr_spearman": 0.743488885175209, |
|
"eval_stsb_spearman": 0.7867238116097731, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 0.52, |
|
"eval_avg_sts": 0.7718140060309099, |
|
"eval_sickr_spearman": 0.7408926538151189, |
|
"eval_stsb_spearman": 0.8027353582467008, |
|
"step": 8125 |
|
}, |
|
{ |
|
"epoch": 0.53, |
|
"eval_avg_sts": 0.7689694127054261, |
|
"eval_sickr_spearman": 0.7398511536455906, |
|
"eval_stsb_spearman": 0.7980876717652616, |
|
"step": 8250 |
|
}, |
|
{ |
|
"epoch": 0.54, |
|
"eval_avg_sts": 0.7658098489708387, |
|
"eval_sickr_spearman": 0.7388756900064839, |
|
"eval_stsb_spearman": 0.7927440079351934, |
|
"step": 8375 |
|
}, |
|
{ |
|
"epoch": 0.54, |
|
"learning_rate": 1.368104441315756e-05, |
|
"loss": 0.0001, |
|
"step": 8500 |
|
}, |
|
{ |
|
"epoch": 0.54, |
|
"eval_avg_sts": 0.7748332537811696, |
|
"eval_sickr_spearman": 0.7417694197748259, |
|
"eval_stsb_spearman": 0.8078970877875133, |
|
"step": 8500 |
|
}, |
|
{ |
|
"epoch": 0.55, |
|
"eval_avg_sts": 0.7748339728955141, |
|
"eval_sickr_spearman": 0.7419876730997608, |
|
"eval_stsb_spearman": 0.8076802726912675, |
|
"step": 8625 |
|
}, |
|
{ |
|
"epoch": 0.56, |
|
"eval_avg_sts": 0.7709733616182656, |
|
"eval_sickr_spearman": 0.7395425057877492, |
|
"eval_stsb_spearman": 0.802404217448782, |
|
"step": 8750 |
|
}, |
|
{ |
|
"epoch": 0.57, |
|
"eval_avg_sts": 0.7564357671357971, |
|
"eval_sickr_spearman": 0.7294577516364988, |
|
"eval_stsb_spearman": 0.7834137826350953, |
|
"step": 8875 |
|
}, |
|
{ |
|
"epoch": 0.58, |
|
"learning_rate": 1.2721105849225649e-05, |
|
"loss": 0.0001, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 0.58, |
|
"eval_avg_sts": 0.7576635056813905, |
|
"eval_sickr_spearman": 0.7307409985736208, |
|
"eval_stsb_spearman": 0.7845860127891603, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 0.58, |
|
"eval_avg_sts": 0.7317573459891697, |
|
"eval_sickr_spearman": 0.6975396437978298, |
|
"eval_stsb_spearman": 0.7659750481805098, |
|
"step": 9125 |
|
}, |
|
{ |
|
"epoch": 0.59, |
|
"eval_avg_sts": 0.7296831294381873, |
|
"eval_sickr_spearman": 0.6969872861312915, |
|
"eval_stsb_spearman": 0.762378972745083, |
|
"step": 9250 |
|
}, |
|
{ |
|
"epoch": 0.6, |
|
"eval_avg_sts": 0.7711811922498575, |
|
"eval_sickr_spearman": 0.7350368042240428, |
|
"eval_stsb_spearman": 0.8073255802756722, |
|
"step": 9375 |
|
}, |
|
{ |
|
"epoch": 0.61, |
|
"learning_rate": 1.176116728529374e-05, |
|
"loss": 0.0002, |
|
"step": 9500 |
|
}, |
|
{ |
|
"epoch": 0.61, |
|
"eval_avg_sts": 0.7655418136173882, |
|
"eval_sickr_spearman": 0.7299852291924921, |
|
"eval_stsb_spearman": 0.8010983980422841, |
|
"step": 9500 |
|
}, |
|
{ |
|
"epoch": 0.62, |
|
"eval_avg_sts": 0.7550596227536142, |
|
"eval_sickr_spearman": 0.7207706545059959, |
|
"eval_stsb_spearman": 0.7893485910012326, |
|
"step": 9625 |
|
}, |
|
{ |
|
"epoch": 0.62, |
|
"eval_avg_sts": 0.7634673032356596, |
|
"eval_sickr_spearman": 0.7285461213312034, |
|
"eval_stsb_spearman": 0.7983884851401158, |
|
"step": 9750 |
|
}, |
|
{ |
|
"epoch": 0.63, |
|
"eval_avg_sts": 0.7638598931096033, |
|
"eval_sickr_spearman": 0.7283572630403488, |
|
"eval_stsb_spearman": 0.7993625231788579, |
|
"step": 9875 |
|
}, |
|
{ |
|
"epoch": 0.64, |
|
"learning_rate": 1.0801228721361832e-05, |
|
"loss": 0.0001, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 0.64, |
|
"eval_avg_sts": 0.7667803597063858, |
|
"eval_sickr_spearman": 0.7305812951613392, |
|
"eval_stsb_spearman": 0.8029794242514324, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 0.65, |
|
"eval_avg_sts": 0.7671530524779411, |
|
"eval_sickr_spearman": 0.7299761993454218, |
|
"eval_stsb_spearman": 0.8043299056104602, |
|
"step": 10125 |
|
}, |
|
{ |
|
"epoch": 0.66, |
|
"eval_avg_sts": 0.7744197669930808, |
|
"eval_sickr_spearman": 0.7359438715747014, |
|
"eval_stsb_spearman": 0.8128956624114603, |
|
"step": 10250 |
|
}, |
|
{ |
|
"epoch": 0.66, |
|
"eval_avg_sts": 0.7734565612749292, |
|
"eval_sickr_spearman": 0.7352129342730163, |
|
"eval_stsb_spearman": 0.8117001882768422, |
|
"step": 10375 |
|
}, |
|
{ |
|
"epoch": 0.67, |
|
"learning_rate": 9.841290157429926e-06, |
|
"loss": 0.0001, |
|
"step": 10500 |
|
}, |
|
{ |
|
"epoch": 0.67, |
|
"eval_avg_sts": 0.7702705095845273, |
|
"eval_sickr_spearman": 0.7336898680464138, |
|
"eval_stsb_spearman": 0.8068511511226406, |
|
"step": 10500 |
|
}, |
|
{ |
|
"epoch": 0.68, |
|
"eval_avg_sts": 0.7638028086321877, |
|
"eval_sickr_spearman": 0.7270147871880277, |
|
"eval_stsb_spearman": 0.8005908300763477, |
|
"step": 10625 |
|
}, |
|
{ |
|
"epoch": 0.69, |
|
"eval_avg_sts": 0.7647879756637017, |
|
"eval_sickr_spearman": 0.7278573073054794, |
|
"eval_stsb_spearman": 0.8017186440219239, |
|
"step": 10750 |
|
}, |
|
{ |
|
"epoch": 0.7, |
|
"eval_avg_sts": 0.7646746212752267, |
|
"eval_sickr_spearman": 0.7282990493454058, |
|
"eval_stsb_spearman": 0.8010501932050476, |
|
"step": 10875 |
|
}, |
|
{ |
|
"epoch": 0.7, |
|
"learning_rate": 8.881351593498018e-06, |
|
"loss": 0.0001, |
|
"step": 11000 |
|
}, |
|
{ |
|
"epoch": 0.7, |
|
"eval_avg_sts": 0.7595715432510943, |
|
"eval_sickr_spearman": 0.7220255630932696, |
|
"eval_stsb_spearman": 0.797117523408919, |
|
"step": 11000 |
|
}, |
|
{ |
|
"epoch": 0.71, |
|
"eval_avg_sts": 0.7637796865890665, |
|
"eval_sickr_spearman": 0.725214251855543, |
|
"eval_stsb_spearman": 0.80234512132259, |
|
"step": 11125 |
|
}, |
|
{ |
|
"epoch": 0.72, |
|
"eval_avg_sts": 0.7642527416188507, |
|
"eval_sickr_spearman": 0.7212445773838859, |
|
"eval_stsb_spearman": 0.8072609058538154, |
|
"step": 11250 |
|
}, |
|
{ |
|
"epoch": 0.73, |
|
"eval_avg_sts": 0.7625844941093753, |
|
"eval_sickr_spearman": 0.7204506713082153, |
|
"eval_stsb_spearman": 0.8047183169105355, |
|
"step": 11375 |
|
}, |
|
{ |
|
"epoch": 0.74, |
|
"learning_rate": 7.921413029566108e-06, |
|
"loss": 0.0001, |
|
"step": 11500 |
|
}, |
|
{ |
|
"epoch": 0.74, |
|
"eval_avg_sts": 0.7631529336672214, |
|
"eval_sickr_spearman": 0.7210336728174711, |
|
"eval_stsb_spearman": 0.8052721945169715, |
|
"step": 11500 |
|
}, |
|
{ |
|
"epoch": 0.74, |
|
"eval_avg_sts": 0.7627819801067925, |
|
"eval_sickr_spearman": 0.7209199351692657, |
|
"eval_stsb_spearman": 0.8046440250443194, |
|
"step": 11625 |
|
}, |
|
{ |
|
"epoch": 0.75, |
|
"eval_avg_sts": 0.7612502434175876, |
|
"eval_sickr_spearman": 0.7199052781513854, |
|
"eval_stsb_spearman": 0.80259520868379, |
|
"step": 11750 |
|
}, |
|
{ |
|
"epoch": 0.76, |
|
"eval_avg_sts": 0.7549680843862416, |
|
"eval_sickr_spearman": 0.7153213339234363, |
|
"eval_stsb_spearman": 0.7946148348490468, |
|
"step": 11875 |
|
}, |
|
{ |
|
"epoch": 0.77, |
|
"learning_rate": 6.961474465634199e-06, |
|
"loss": 0.0001, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 0.77, |
|
"eval_avg_sts": 0.7566929851670519, |
|
"eval_sickr_spearman": 0.7169140932782255, |
|
"eval_stsb_spearman": 0.7964718770558783, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 0.78, |
|
"eval_avg_sts": 0.7582762962904481, |
|
"eval_sickr_spearman": 0.7181445060037657, |
|
"eval_stsb_spearman": 0.7984080865771305, |
|
"step": 12125 |
|
}, |
|
{ |
|
"epoch": 0.78, |
|
"eval_avg_sts": 0.7575591207437209, |
|
"eval_sickr_spearman": 0.7175433967692678, |
|
"eval_stsb_spearman": 0.7975748447181741, |
|
"step": 12250 |
|
}, |
|
{ |
|
"epoch": 0.79, |
|
"eval_avg_sts": 0.7574126393782543, |
|
"eval_sickr_spearman": 0.7182304336442386, |
|
"eval_stsb_spearman": 0.7965948451122701, |
|
"step": 12375 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"learning_rate": 6.001535901702292e-06, |
|
"loss": 0.0001, |
|
"step": 12500 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"eval_avg_sts": 0.7552374803740505, |
|
"eval_sickr_spearman": 0.7164459341325082, |
|
"eval_stsb_spearman": 0.7940290266155928, |
|
"step": 12500 |
|
}, |
|
{ |
|
"epoch": 0.81, |
|
"eval_avg_sts": 0.7551510628378968, |
|
"eval_sickr_spearman": 0.7162126951039248, |
|
"eval_stsb_spearman": 0.7940894305718689, |
|
"step": 12625 |
|
}, |
|
{ |
|
"epoch": 0.82, |
|
"eval_avg_sts": 0.7563770556022249, |
|
"eval_sickr_spearman": 0.7171387347396517, |
|
"eval_stsb_spearman": 0.7956153764647981, |
|
"step": 12750 |
|
}, |
|
{ |
|
"epoch": 0.82, |
|
"eval_avg_sts": 0.7568538616101905, |
|
"eval_sickr_spearman": 0.7173768249094804, |
|
"eval_stsb_spearman": 0.7963308983109005, |
|
"step": 12875 |
|
}, |
|
{ |
|
"epoch": 0.83, |
|
"learning_rate": 5.0415973377703825e-06, |
|
"loss": 0.0001, |
|
"step": 13000 |
|
}, |
|
{ |
|
"epoch": 0.83, |
|
"eval_avg_sts": 0.7559100330626112, |
|
"eval_sickr_spearman": 0.7166905085010312, |
|
"eval_stsb_spearman": 0.7951295576241912, |
|
"step": 13000 |
|
}, |
|
{ |
|
"epoch": 0.84, |
|
"eval_avg_sts": 0.7564848751035596, |
|
"eval_sickr_spearman": 0.7171825391041632, |
|
"eval_stsb_spearman": 0.795787211102956, |
|
"step": 13125 |
|
}, |
|
{ |
|
"epoch": 0.85, |
|
"eval_avg_sts": 0.7488530315390816, |
|
"eval_sickr_spearman": 0.7127996050357326, |
|
"eval_stsb_spearman": 0.7849064580424306, |
|
"step": 13250 |
|
}, |
|
{ |
|
"epoch": 0.86, |
|
"eval_avg_sts": 0.7484617861410546, |
|
"eval_sickr_spearman": 0.7117017581501617, |
|
"eval_stsb_spearman": 0.7852218141319476, |
|
"step": 13375 |
|
}, |
|
{ |
|
"epoch": 0.86, |
|
"learning_rate": 4.081658773838474e-06, |
|
"loss": 0.0001, |
|
"step": 13500 |
|
}, |
|
{ |
|
"epoch": 0.86, |
|
"eval_avg_sts": 0.7469284581969524, |
|
"eval_sickr_spearman": 0.7094133163221428, |
|
"eval_stsb_spearman": 0.784443600071762, |
|
"step": 13500 |
|
}, |
|
{ |
|
"epoch": 0.87, |
|
"eval_avg_sts": 0.7479276349305448, |
|
"eval_sickr_spearman": 0.7103837366955984, |
|
"eval_stsb_spearman": 0.7854715331654911, |
|
"step": 13625 |
|
}, |
|
{ |
|
"epoch": 0.88, |
|
"eval_avg_sts": 0.7420231480320236, |
|
"eval_sickr_spearman": 0.7062097379184235, |
|
"eval_stsb_spearman": 0.7778365581456238, |
|
"step": 13750 |
|
}, |
|
{ |
|
"epoch": 0.89, |
|
"eval_avg_sts": 0.7411633122563288, |
|
"eval_sickr_spearman": 0.7050106895021224, |
|
"eval_stsb_spearman": 0.7773159350105353, |
|
"step": 13875 |
|
}, |
|
{ |
|
"epoch": 0.9, |
|
"learning_rate": 3.121720209906566e-06, |
|
"loss": 0.0001, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 0.9, |
|
"eval_avg_sts": 0.7412314874976924, |
|
"eval_sickr_spearman": 0.7050875872955249, |
|
"eval_stsb_spearman": 0.7773753876998599, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 0.9, |
|
"eval_avg_sts": 0.732587447078523, |
|
"eval_sickr_spearman": 0.6977087132748919, |
|
"eval_stsb_spearman": 0.767466180882154, |
|
"step": 14125 |
|
}, |
|
{ |
|
"epoch": 0.91, |
|
"eval_avg_sts": 0.7298853871265888, |
|
"eval_sickr_spearman": 0.6949198834320908, |
|
"eval_stsb_spearman": 0.7648508908210868, |
|
"step": 14250 |
|
}, |
|
{ |
|
"epoch": 0.92, |
|
"eval_avg_sts": 0.7308218986367342, |
|
"eval_sickr_spearman": 0.6958364129097329, |
|
"eval_stsb_spearman": 0.7658073843637355, |
|
"step": 14375 |
|
}, |
|
{ |
|
"epoch": 0.93, |
|
"learning_rate": 2.1617816459746575e-06, |
|
"loss": 0.0, |
|
"step": 14500 |
|
}, |
|
{ |
|
"epoch": 0.93, |
|
"eval_avg_sts": 0.7317585701181548, |
|
"eval_sickr_spearman": 0.6965340166270201, |
|
"eval_stsb_spearman": 0.7669831236092894, |
|
"step": 14500 |
|
}, |
|
{ |
|
"epoch": 0.94, |
|
"eval_avg_sts": 0.732111710583657, |
|
"eval_sickr_spearman": 0.696954673013415, |
|
"eval_stsb_spearman": 0.7672687481538989, |
|
"step": 14625 |
|
}, |
|
{ |
|
"epoch": 0.94, |
|
"eval_avg_sts": 0.7375915728397734, |
|
"eval_sickr_spearman": 0.7017668130042967, |
|
"eval_stsb_spearman": 0.7734163326752501, |
|
"step": 14750 |
|
}, |
|
{ |
|
"epoch": 0.95, |
|
"eval_avg_sts": 0.737608211926382, |
|
"eval_sickr_spearman": 0.7017644594803262, |
|
"eval_stsb_spearman": 0.7734519643724378, |
|
"step": 14875 |
|
}, |
|
{ |
|
"epoch": 0.96, |
|
"learning_rate": 1.2018430820427492e-06, |
|
"loss": 0.0001, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 0.96, |
|
"eval_avg_sts": 0.7377728901345266, |
|
"eval_sickr_spearman": 0.7023058180246352, |
|
"eval_stsb_spearman": 0.7732399622444179, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 0.97, |
|
"eval_avg_sts": 0.7394088348935646, |
|
"eval_sickr_spearman": 0.7037121206436416, |
|
"eval_stsb_spearman": 0.7751055491434876, |
|
"step": 15125 |
|
}, |
|
{ |
|
"epoch": 0.98, |
|
"eval_avg_sts": 0.7393669904391786, |
|
"eval_sickr_spearman": 0.7033311859781359, |
|
"eval_stsb_spearman": 0.7754027949002213, |
|
"step": 15250 |
|
}, |
|
{ |
|
"epoch": 0.98, |
|
"eval_avg_sts": 0.7399944883836842, |
|
"eval_sickr_spearman": 0.7034986223977493, |
|
"eval_stsb_spearman": 0.776490354369619, |
|
"step": 15375 |
|
}, |
|
{ |
|
"epoch": 0.99, |
|
"learning_rate": 2.4190451811084087e-07, |
|
"loss": 0.0001, |
|
"step": 15500 |
|
}, |
|
{ |
|
"epoch": 0.99, |
|
"eval_avg_sts": 0.7400416501229861, |
|
"eval_sickr_spearman": 0.7035811878611213, |
|
"eval_stsb_spearman": 0.7765021123848508, |
|
"step": 15500 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_avg_sts": 0.7400548448254956, |
|
"eval_sickr_spearman": 0.7035970861556974, |
|
"eval_stsb_spearman": 0.7765126034952938, |
|
"step": 15625 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"step": 15626, |
|
"total_flos": 42723641240930304, |
|
"train_runtime": 11103.0207, |
|
"train_samples_per_second": 1.407 |
|
} |
|
], |
|
"max_steps": 15626, |
|
"num_train_epochs": 1, |
|
"total_flos": 42723641240930304, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|