{ "best_metric": 0.8450403429578367, "best_model_checkpoint": "result/my-unsup-simcse-bert-base-uncased/SupCon-48-0.01-2e-7-0.07-0.00", "epoch": 1.0, "global_step": 15626, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.01, "eval_avg_sts": 0.6273981488926212, "eval_sickr_spearman": 0.6211010277251597, "eval_stsb_spearman": 0.6336952700600829, "step": 125 }, { "epoch": 0.02, "eval_avg_sts": 0.6557459351486706, "eval_sickr_spearman": 0.6424095455671641, "eval_stsb_spearman": 0.6690823247301771, "step": 250 }, { "epoch": 0.02, "eval_avg_sts": 0.709441256238345, "eval_sickr_spearman": 0.6938704999278709, "eval_stsb_spearman": 0.7250120125488192, "step": 375 }, { "epoch": 0.03, "learning_rate": 2.9040061436068092e-05, "loss": 0.0093, "step": 500 }, { "epoch": 0.03, "eval_avg_sts": 0.745161269369824, "eval_sickr_spearman": 0.7196067168248462, "eval_stsb_spearman": 0.7707158219148017, "step": 500 }, { "epoch": 0.04, "eval_avg_sts": 0.7476897637271698, "eval_sickr_spearman": 0.7177654445512162, "eval_stsb_spearman": 0.7776140829031234, "step": 625 }, { "epoch": 0.05, "eval_avg_sts": 0.7524926746389684, "eval_sickr_spearman": 0.7211576410902829, "eval_stsb_spearman": 0.7838277081876538, "step": 750 }, { "epoch": 0.06, "eval_avg_sts": 0.7584753747432835, "eval_sickr_spearman": 0.7179680397370821, "eval_stsb_spearman": 0.7989827097494849, "step": 875 }, { "epoch": 0.06, "learning_rate": 2.8080122872136184e-05, "loss": 0.0003, "step": 1000 }, { "epoch": 0.06, "eval_avg_sts": 0.7586746687828863, "eval_sickr_spearman": 0.718746960109104, "eval_stsb_spearman": 0.7986023774566684, "step": 1000 }, { "epoch": 0.07, "eval_avg_sts": 0.7574999857715704, "eval_sickr_spearman": 0.7175820618059254, "eval_stsb_spearman": 0.7974179097372154, "step": 1125 }, { "epoch": 0.08, "eval_avg_sts": 0.7696978971940565, "eval_sickr_spearman": 0.7239500252345904, "eval_stsb_spearman": 0.8154457691535225, "step": 1250 }, { "epoch": 0.09, "eval_avg_sts": 0.7711009245923006, "eval_sickr_spearman": 0.7253843780168369, "eval_stsb_spearman": 0.8168174711677644, "step": 1375 }, { "epoch": 0.1, "learning_rate": 2.7120184308204276e-05, "loss": 0.0001, "step": 1500 }, { "epoch": 0.1, "eval_avg_sts": 0.7722992846813606, "eval_sickr_spearman": 0.7252976338476396, "eval_stsb_spearman": 0.8193009355150815, "step": 1500 }, { "epoch": 0.1, "eval_avg_sts": 0.773722019273226, "eval_sickr_spearman": 0.7276583624833227, "eval_stsb_spearman": 0.8197856760631294, "step": 1625 }, { "epoch": 0.11, "eval_avg_sts": 0.7734992972011999, "eval_sickr_spearman": 0.7251570468137302, "eval_stsb_spearman": 0.8218415475886697, "step": 1750 }, { "epoch": 0.12, "eval_avg_sts": 0.772300977896672, "eval_sickr_spearman": 0.7260308286110924, "eval_stsb_spearman": 0.8185711271822516, "step": 1875 }, { "epoch": 0.13, "learning_rate": 2.6160245744272367e-05, "loss": 0.0001, "step": 2000 }, { "epoch": 0.13, "eval_avg_sts": 0.7741215013840628, "eval_sickr_spearman": 0.7290128395438775, "eval_stsb_spearman": 0.8192301632242479, "step": 2000 }, { "epoch": 0.14, "eval_avg_sts": 0.7845043729289752, "eval_sickr_spearman": 0.7357584234920489, "eval_stsb_spearman": 0.8332503223659016, "step": 2125 }, { "epoch": 0.14, "eval_avg_sts": 0.7824068340883688, "eval_sickr_spearman": 0.7413625963456452, "eval_stsb_spearman": 0.8234510718310922, "step": 2250 }, { "epoch": 0.15, "eval_avg_sts": 0.7801565471575205, "eval_sickr_spearman": 0.7272591759992707, "eval_stsb_spearman": 0.8330539183157702, "step": 2375 }, { "epoch": 0.16, "learning_rate": 2.5200307180340456e-05, "loss": 0.0001, "step": 2500 }, { "epoch": 0.16, "eval_avg_sts": 0.7817040476834756, "eval_sickr_spearman": 0.7317218416960886, "eval_stsb_spearman": 0.8316862536708627, "step": 2500 }, { "epoch": 0.17, "eval_avg_sts": 0.7834051453081208, "eval_sickr_spearman": 0.7332758879831186, "eval_stsb_spearman": 0.8335344026331228, "step": 2625 }, { "epoch": 0.18, "eval_avg_sts": 0.7846122957465609, "eval_sickr_spearman": 0.737042534988997, "eval_stsb_spearman": 0.8321820565041248, "step": 2750 }, { "epoch": 0.18, "eval_avg_sts": 0.7930382359535035, "eval_sickr_spearman": 0.7410361289491703, "eval_stsb_spearman": 0.8450403429578367, "step": 2875 }, { "epoch": 0.19, "learning_rate": 2.424036861640855e-05, "loss": 0.0001, "step": 3000 }, { "epoch": 0.19, "eval_avg_sts": 0.784546743206133, "eval_sickr_spearman": 0.7335979365182612, "eval_stsb_spearman": 0.8354955498940048, "step": 3000 }, { "epoch": 0.2, "eval_avg_sts": 0.7879357699638411, "eval_sickr_spearman": 0.7380969137277664, "eval_stsb_spearman": 0.8377746261999157, "step": 3125 }, { "epoch": 0.21, "eval_avg_sts": 0.7885921401422298, "eval_sickr_spearman": 0.7360949774198258, "eval_stsb_spearman": 0.8410893028646337, "step": 3250 }, { "epoch": 0.22, "eval_avg_sts": 0.7886813707449458, "eval_sickr_spearman": 0.7360677437853104, "eval_stsb_spearman": 0.8412949977045814, "step": 3375 }, { "epoch": 0.22, "learning_rate": 2.3280430052476642e-05, "loss": 0.0002, "step": 3500 }, { "epoch": 0.22, "eval_avg_sts": 0.7885894531415549, "eval_sickr_spearman": 0.7365915229464931, "eval_stsb_spearman": 0.8405873833366166, "step": 3500 }, { "epoch": 0.23, "eval_avg_sts": 0.7907895913811233, "eval_sickr_spearman": 0.7414235958444714, "eval_stsb_spearman": 0.8401555869177751, "step": 3625 }, { "epoch": 0.24, "eval_avg_sts": 0.7899099014596336, "eval_sickr_spearman": 0.7422593370094946, "eval_stsb_spearman": 0.8375604659097725, "step": 3750 }, { "epoch": 0.25, "eval_avg_sts": 0.781954087673714, "eval_sickr_spearman": 0.7436439776017526, "eval_stsb_spearman": 0.8202641977456754, "step": 3875 }, { "epoch": 0.26, "learning_rate": 2.2320491488544734e-05, "loss": 0.0001, "step": 4000 }, { "epoch": 0.26, "eval_avg_sts": 0.7846807378527296, "eval_sickr_spearman": 0.743132158184828, "eval_stsb_spearman": 0.8262293175206311, "step": 4000 }, { "epoch": 0.26, "eval_avg_sts": 0.7825345568897543, "eval_sickr_spearman": 0.7449149766080079, "eval_stsb_spearman": 0.8201541371715007, "step": 4125 }, { "epoch": 0.27, "eval_avg_sts": 0.7860788226540287, "eval_sickr_spearman": 0.7454807349518474, "eval_stsb_spearman": 0.8266769103562102, "step": 4250 }, { "epoch": 0.28, "eval_avg_sts": 0.7867018278295852, "eval_sickr_spearman": 0.7445308238587058, "eval_stsb_spearman": 0.8288728318004647, "step": 4375 }, { "epoch": 0.29, "learning_rate": 2.1360552924612826e-05, "loss": 0.0001, "step": 4500 }, { "epoch": 0.29, "eval_avg_sts": 0.776783766738095, "eval_sickr_spearman": 0.7318758294072991, "eval_stsb_spearman": 0.8216917040688909, "step": 4500 }, { "epoch": 0.3, "eval_avg_sts": 0.7675528732476737, "eval_sickr_spearman": 0.7320309698649442, "eval_stsb_spearman": 0.8030747766304034, "step": 4625 }, { "epoch": 0.3, "eval_avg_sts": 0.7715011023405255, "eval_sickr_spearman": 0.7350243641687703, "eval_stsb_spearman": 0.8079778405122807, "step": 4750 }, { "epoch": 0.31, "eval_avg_sts": 0.7687077375569937, "eval_sickr_spearman": 0.7408402100864042, "eval_stsb_spearman": 0.7965752650275834, "step": 4875 }, { "epoch": 0.32, "learning_rate": 2.0400614360680917e-05, "loss": 0.0001, "step": 5000 }, { "epoch": 0.32, "eval_avg_sts": 0.7738965818092367, "eval_sickr_spearman": 0.7445124279468551, "eval_stsb_spearman": 0.8032807356716183, "step": 5000 }, { "epoch": 0.33, "eval_avg_sts": 0.7793196132942312, "eval_sickr_spearman": 0.7457236762629214, "eval_stsb_spearman": 0.812915550325541, "step": 5125 }, { "epoch": 0.34, "eval_avg_sts": 0.7836274650846277, "eval_sickr_spearman": 0.7464208957313971, "eval_stsb_spearman": 0.8208340344378582, "step": 5250 }, { "epoch": 0.34, "eval_avg_sts": 0.7826458926642379, "eval_sickr_spearman": 0.7464102328268778, "eval_stsb_spearman": 0.818881552501598, "step": 5375 }, { "epoch": 0.35, "learning_rate": 1.944067579674901e-05, "loss": 0.0001, "step": 5500 }, { "epoch": 0.35, "eval_avg_sts": 0.7837446296343489, "eval_sickr_spearman": 0.7486399806489393, "eval_stsb_spearman": 0.8188492786197583, "step": 5500 }, { "epoch": 0.36, "eval_avg_sts": 0.7830869728965355, "eval_sickr_spearman": 0.7479103882180944, "eval_stsb_spearman": 0.8182635575749767, "step": 5625 }, { "epoch": 0.37, "eval_avg_sts": 0.783785645301962, "eval_sickr_spearman": 0.7470566353900319, "eval_stsb_spearman": 0.8205146552138923, "step": 5750 }, { "epoch": 0.38, "eval_avg_sts": 0.7841049239457296, "eval_sickr_spearman": 0.7275643656178084, "eval_stsb_spearman": 0.8406454822736508, "step": 5875 }, { "epoch": 0.38, "learning_rate": 1.84807372328171e-05, "loss": 0.0001, "step": 6000 }, { "epoch": 0.38, "eval_avg_sts": 0.7827015978431489, "eval_sickr_spearman": 0.7361094828124602, "eval_stsb_spearman": 0.8292937128738374, "step": 6000 }, { "epoch": 0.39, "eval_avg_sts": 0.7835582939326338, "eval_sickr_spearman": 0.7403639336845438, "eval_stsb_spearman": 0.8267526541807237, "step": 6125 }, { "epoch": 0.4, "eval_avg_sts": 0.7833004559230021, "eval_sickr_spearman": 0.7409274345666157, "eval_stsb_spearman": 0.8256734772793887, "step": 6250 }, { "epoch": 0.41, "eval_avg_sts": 0.783274693136238, "eval_sickr_spearman": 0.7396373672130896, "eval_stsb_spearman": 0.8269120190593864, "step": 6375 }, { "epoch": 0.42, "learning_rate": 1.7520798668885192e-05, "loss": 0.0, "step": 6500 }, { "epoch": 0.42, "eval_avg_sts": 0.7844400031801044, "eval_sickr_spearman": 0.7315539729965624, "eval_stsb_spearman": 0.8373260333636465, "step": 6500 }, { "epoch": 0.42, "eval_avg_sts": 0.7830541155839421, "eval_sickr_spearman": 0.7372136217723195, "eval_stsb_spearman": 0.8288946093955648, "step": 6625 }, { "epoch": 0.43, "eval_avg_sts": 0.7788362702655598, "eval_sickr_spearman": 0.7408482312803444, "eval_stsb_spearman": 0.8168243092507751, "step": 6750 }, { "epoch": 0.44, "eval_avg_sts": 0.7825535757514819, "eval_sickr_spearman": 0.7452765067085325, "eval_stsb_spearman": 0.8198306447944311, "step": 6875 }, { "epoch": 0.45, "learning_rate": 1.6560860104953284e-05, "loss": 0.0002, "step": 7000 }, { "epoch": 0.45, "eval_avg_sts": 0.7831901309892826, "eval_sickr_spearman": 0.7458346761383449, "eval_stsb_spearman": 0.8205455858402203, "step": 7000 }, { "epoch": 0.46, "eval_avg_sts": 0.7829404428906377, "eval_sickr_spearman": 0.7454985064593795, "eval_stsb_spearman": 0.8203823793218957, "step": 7125 }, { "epoch": 0.46, "eval_avg_sts": 0.7827889218134074, "eval_sickr_spearman": 0.7466705133655709, "eval_stsb_spearman": 0.8189073302612438, "step": 7250 }, { "epoch": 0.47, "eval_avg_sts": 0.7388870312908111, "eval_sickr_spearman": 0.7199674303966463, "eval_stsb_spearman": 0.7578066321849759, "step": 7375 }, { "epoch": 0.48, "learning_rate": 1.5600921541021372e-05, "loss": 0.0001, "step": 7500 }, { "epoch": 0.48, "eval_avg_sts": 0.7359950441852947, "eval_sickr_spearman": 0.7141863589964538, "eval_stsb_spearman": 0.7578037293741355, "step": 7500 }, { "epoch": 0.49, "eval_avg_sts": 0.7514533824270638, "eval_sickr_spearman": 0.7285877642961502, "eval_stsb_spearman": 0.7743190005579774, "step": 7625 }, { "epoch": 0.5, "eval_avg_sts": 0.7601125755242234, "eval_sickr_spearman": 0.7424667353055044, "eval_stsb_spearman": 0.7777584157429424, "step": 7750 }, { "epoch": 0.5, "eval_avg_sts": 0.7621753865509604, "eval_sickr_spearman": 0.7417763842845344, "eval_stsb_spearman": 0.7825743888173865, "step": 7875 }, { "epoch": 0.51, "learning_rate": 1.4640982977089467e-05, "loss": 0.0001, "step": 8000 }, { "epoch": 0.51, "eval_avg_sts": 0.765106348392491, "eval_sickr_spearman": 0.743488885175209, "eval_stsb_spearman": 0.7867238116097731, "step": 8000 }, { "epoch": 0.52, "eval_avg_sts": 0.7718140060309099, "eval_sickr_spearman": 0.7408926538151189, "eval_stsb_spearman": 0.8027353582467008, "step": 8125 }, { "epoch": 0.53, "eval_avg_sts": 0.7689694127054261, "eval_sickr_spearman": 0.7398511536455906, "eval_stsb_spearman": 0.7980876717652616, "step": 8250 }, { "epoch": 0.54, "eval_avg_sts": 0.7658098489708387, "eval_sickr_spearman": 0.7388756900064839, "eval_stsb_spearman": 0.7927440079351934, "step": 8375 }, { "epoch": 0.54, "learning_rate": 1.368104441315756e-05, "loss": 0.0001, "step": 8500 }, { "epoch": 0.54, "eval_avg_sts": 0.7748332537811696, "eval_sickr_spearman": 0.7417694197748259, "eval_stsb_spearman": 0.8078970877875133, "step": 8500 }, { "epoch": 0.55, "eval_avg_sts": 0.7748339728955141, "eval_sickr_spearman": 0.7419876730997608, "eval_stsb_spearman": 0.8076802726912675, "step": 8625 }, { "epoch": 0.56, "eval_avg_sts": 0.7709733616182656, "eval_sickr_spearman": 0.7395425057877492, "eval_stsb_spearman": 0.802404217448782, "step": 8750 }, { "epoch": 0.57, "eval_avg_sts": 0.7564357671357971, "eval_sickr_spearman": 0.7294577516364988, "eval_stsb_spearman": 0.7834137826350953, "step": 8875 }, { "epoch": 0.58, "learning_rate": 1.2721105849225649e-05, "loss": 0.0001, "step": 9000 }, { "epoch": 0.58, "eval_avg_sts": 0.7576635056813905, "eval_sickr_spearman": 0.7307409985736208, "eval_stsb_spearman": 0.7845860127891603, "step": 9000 }, { "epoch": 0.58, "eval_avg_sts": 0.7317573459891697, "eval_sickr_spearman": 0.6975396437978298, "eval_stsb_spearman": 0.7659750481805098, "step": 9125 }, { "epoch": 0.59, "eval_avg_sts": 0.7296831294381873, "eval_sickr_spearman": 0.6969872861312915, "eval_stsb_spearman": 0.762378972745083, "step": 9250 }, { "epoch": 0.6, "eval_avg_sts": 0.7711811922498575, "eval_sickr_spearman": 0.7350368042240428, "eval_stsb_spearman": 0.8073255802756722, "step": 9375 }, { "epoch": 0.61, "learning_rate": 1.176116728529374e-05, "loss": 0.0002, "step": 9500 }, { "epoch": 0.61, "eval_avg_sts": 0.7655418136173882, "eval_sickr_spearman": 0.7299852291924921, "eval_stsb_spearman": 0.8010983980422841, "step": 9500 }, { "epoch": 0.62, "eval_avg_sts": 0.7550596227536142, "eval_sickr_spearman": 0.7207706545059959, "eval_stsb_spearman": 0.7893485910012326, "step": 9625 }, { "epoch": 0.62, "eval_avg_sts": 0.7634673032356596, "eval_sickr_spearman": 0.7285461213312034, "eval_stsb_spearman": 0.7983884851401158, "step": 9750 }, { "epoch": 0.63, "eval_avg_sts": 0.7638598931096033, "eval_sickr_spearman": 0.7283572630403488, "eval_stsb_spearman": 0.7993625231788579, "step": 9875 }, { "epoch": 0.64, "learning_rate": 1.0801228721361832e-05, "loss": 0.0001, "step": 10000 }, { "epoch": 0.64, "eval_avg_sts": 0.7667803597063858, "eval_sickr_spearman": 0.7305812951613392, "eval_stsb_spearman": 0.8029794242514324, "step": 10000 }, { "epoch": 0.65, "eval_avg_sts": 0.7671530524779411, "eval_sickr_spearman": 0.7299761993454218, "eval_stsb_spearman": 0.8043299056104602, "step": 10125 }, { "epoch": 0.66, "eval_avg_sts": 0.7744197669930808, "eval_sickr_spearman": 0.7359438715747014, "eval_stsb_spearman": 0.8128956624114603, "step": 10250 }, { "epoch": 0.66, "eval_avg_sts": 0.7734565612749292, "eval_sickr_spearman": 0.7352129342730163, "eval_stsb_spearman": 0.8117001882768422, "step": 10375 }, { "epoch": 0.67, "learning_rate": 9.841290157429926e-06, "loss": 0.0001, "step": 10500 }, { "epoch": 0.67, "eval_avg_sts": 0.7702705095845273, "eval_sickr_spearman": 0.7336898680464138, "eval_stsb_spearman": 0.8068511511226406, "step": 10500 }, { "epoch": 0.68, "eval_avg_sts": 0.7638028086321877, "eval_sickr_spearman": 0.7270147871880277, "eval_stsb_spearman": 0.8005908300763477, "step": 10625 }, { "epoch": 0.69, "eval_avg_sts": 0.7647879756637017, "eval_sickr_spearman": 0.7278573073054794, "eval_stsb_spearman": 0.8017186440219239, "step": 10750 }, { "epoch": 0.7, "eval_avg_sts": 0.7646746212752267, "eval_sickr_spearman": 0.7282990493454058, "eval_stsb_spearman": 0.8010501932050476, "step": 10875 }, { "epoch": 0.7, "learning_rate": 8.881351593498018e-06, "loss": 0.0001, "step": 11000 }, { "epoch": 0.7, "eval_avg_sts": 0.7595715432510943, "eval_sickr_spearman": 0.7220255630932696, "eval_stsb_spearman": 0.797117523408919, "step": 11000 }, { "epoch": 0.71, "eval_avg_sts": 0.7637796865890665, "eval_sickr_spearman": 0.725214251855543, "eval_stsb_spearman": 0.80234512132259, "step": 11125 }, { "epoch": 0.72, "eval_avg_sts": 0.7642527416188507, "eval_sickr_spearman": 0.7212445773838859, "eval_stsb_spearman": 0.8072609058538154, "step": 11250 }, { "epoch": 0.73, "eval_avg_sts": 0.7625844941093753, "eval_sickr_spearman": 0.7204506713082153, "eval_stsb_spearman": 0.8047183169105355, "step": 11375 }, { "epoch": 0.74, "learning_rate": 7.921413029566108e-06, "loss": 0.0001, "step": 11500 }, { "epoch": 0.74, "eval_avg_sts": 0.7631529336672214, "eval_sickr_spearman": 0.7210336728174711, "eval_stsb_spearman": 0.8052721945169715, "step": 11500 }, { "epoch": 0.74, "eval_avg_sts": 0.7627819801067925, "eval_sickr_spearman": 0.7209199351692657, "eval_stsb_spearman": 0.8046440250443194, "step": 11625 }, { "epoch": 0.75, "eval_avg_sts": 0.7612502434175876, "eval_sickr_spearman": 0.7199052781513854, "eval_stsb_spearman": 0.80259520868379, "step": 11750 }, { "epoch": 0.76, "eval_avg_sts": 0.7549680843862416, "eval_sickr_spearman": 0.7153213339234363, "eval_stsb_spearman": 0.7946148348490468, "step": 11875 }, { "epoch": 0.77, "learning_rate": 6.961474465634199e-06, "loss": 0.0001, "step": 12000 }, { "epoch": 0.77, "eval_avg_sts": 0.7566929851670519, "eval_sickr_spearman": 0.7169140932782255, "eval_stsb_spearman": 0.7964718770558783, "step": 12000 }, { "epoch": 0.78, "eval_avg_sts": 0.7582762962904481, "eval_sickr_spearman": 0.7181445060037657, "eval_stsb_spearman": 0.7984080865771305, "step": 12125 }, { "epoch": 0.78, "eval_avg_sts": 0.7575591207437209, "eval_sickr_spearman": 0.7175433967692678, "eval_stsb_spearman": 0.7975748447181741, "step": 12250 }, { "epoch": 0.79, "eval_avg_sts": 0.7574126393782543, "eval_sickr_spearman": 0.7182304336442386, "eval_stsb_spearman": 0.7965948451122701, "step": 12375 }, { "epoch": 0.8, "learning_rate": 6.001535901702292e-06, "loss": 0.0001, "step": 12500 }, { "epoch": 0.8, "eval_avg_sts": 0.7552374803740505, "eval_sickr_spearman": 0.7164459341325082, "eval_stsb_spearman": 0.7940290266155928, "step": 12500 }, { "epoch": 0.81, "eval_avg_sts": 0.7551510628378968, "eval_sickr_spearman": 0.7162126951039248, "eval_stsb_spearman": 0.7940894305718689, "step": 12625 }, { "epoch": 0.82, "eval_avg_sts": 0.7563770556022249, "eval_sickr_spearman": 0.7171387347396517, "eval_stsb_spearman": 0.7956153764647981, "step": 12750 }, { "epoch": 0.82, "eval_avg_sts": 0.7568538616101905, "eval_sickr_spearman": 0.7173768249094804, "eval_stsb_spearman": 0.7963308983109005, "step": 12875 }, { "epoch": 0.83, "learning_rate": 5.0415973377703825e-06, "loss": 0.0001, "step": 13000 }, { "epoch": 0.83, "eval_avg_sts": 0.7559100330626112, "eval_sickr_spearman": 0.7166905085010312, "eval_stsb_spearman": 0.7951295576241912, "step": 13000 }, { "epoch": 0.84, "eval_avg_sts": 0.7564848751035596, "eval_sickr_spearman": 0.7171825391041632, "eval_stsb_spearman": 0.795787211102956, "step": 13125 }, { "epoch": 0.85, "eval_avg_sts": 0.7488530315390816, "eval_sickr_spearman": 0.7127996050357326, "eval_stsb_spearman": 0.7849064580424306, "step": 13250 }, { "epoch": 0.86, "eval_avg_sts": 0.7484617861410546, "eval_sickr_spearman": 0.7117017581501617, "eval_stsb_spearman": 0.7852218141319476, "step": 13375 }, { "epoch": 0.86, "learning_rate": 4.081658773838474e-06, "loss": 0.0001, "step": 13500 }, { "epoch": 0.86, "eval_avg_sts": 0.7469284581969524, "eval_sickr_spearman": 0.7094133163221428, "eval_stsb_spearman": 0.784443600071762, "step": 13500 }, { "epoch": 0.87, "eval_avg_sts": 0.7479276349305448, "eval_sickr_spearman": 0.7103837366955984, "eval_stsb_spearman": 0.7854715331654911, "step": 13625 }, { "epoch": 0.88, "eval_avg_sts": 0.7420231480320236, "eval_sickr_spearman": 0.7062097379184235, "eval_stsb_spearman": 0.7778365581456238, "step": 13750 }, { "epoch": 0.89, "eval_avg_sts": 0.7411633122563288, "eval_sickr_spearman": 0.7050106895021224, "eval_stsb_spearman": 0.7773159350105353, "step": 13875 }, { "epoch": 0.9, "learning_rate": 3.121720209906566e-06, "loss": 0.0001, "step": 14000 }, { "epoch": 0.9, "eval_avg_sts": 0.7412314874976924, "eval_sickr_spearman": 0.7050875872955249, "eval_stsb_spearman": 0.7773753876998599, "step": 14000 }, { "epoch": 0.9, "eval_avg_sts": 0.732587447078523, "eval_sickr_spearman": 0.6977087132748919, "eval_stsb_spearman": 0.767466180882154, "step": 14125 }, { "epoch": 0.91, "eval_avg_sts": 0.7298853871265888, "eval_sickr_spearman": 0.6949198834320908, "eval_stsb_spearman": 0.7648508908210868, "step": 14250 }, { "epoch": 0.92, "eval_avg_sts": 0.7308218986367342, "eval_sickr_spearman": 0.6958364129097329, "eval_stsb_spearman": 0.7658073843637355, "step": 14375 }, { "epoch": 0.93, "learning_rate": 2.1617816459746575e-06, "loss": 0.0, "step": 14500 }, { "epoch": 0.93, "eval_avg_sts": 0.7317585701181548, "eval_sickr_spearman": 0.6965340166270201, "eval_stsb_spearman": 0.7669831236092894, "step": 14500 }, { "epoch": 0.94, "eval_avg_sts": 0.732111710583657, "eval_sickr_spearman": 0.696954673013415, "eval_stsb_spearman": 0.7672687481538989, "step": 14625 }, { "epoch": 0.94, "eval_avg_sts": 0.7375915728397734, "eval_sickr_spearman": 0.7017668130042967, "eval_stsb_spearman": 0.7734163326752501, "step": 14750 }, { "epoch": 0.95, "eval_avg_sts": 0.737608211926382, "eval_sickr_spearman": 0.7017644594803262, "eval_stsb_spearman": 0.7734519643724378, "step": 14875 }, { "epoch": 0.96, "learning_rate": 1.2018430820427492e-06, "loss": 0.0001, "step": 15000 }, { "epoch": 0.96, "eval_avg_sts": 0.7377728901345266, "eval_sickr_spearman": 0.7023058180246352, "eval_stsb_spearman": 0.7732399622444179, "step": 15000 }, { "epoch": 0.97, "eval_avg_sts": 0.7394088348935646, "eval_sickr_spearman": 0.7037121206436416, "eval_stsb_spearman": 0.7751055491434876, "step": 15125 }, { "epoch": 0.98, "eval_avg_sts": 0.7393669904391786, "eval_sickr_spearman": 0.7033311859781359, "eval_stsb_spearman": 0.7754027949002213, "step": 15250 }, { "epoch": 0.98, "eval_avg_sts": 0.7399944883836842, "eval_sickr_spearman": 0.7034986223977493, "eval_stsb_spearman": 0.776490354369619, "step": 15375 }, { "epoch": 0.99, "learning_rate": 2.4190451811084087e-07, "loss": 0.0001, "step": 15500 }, { "epoch": 0.99, "eval_avg_sts": 0.7400416501229861, "eval_sickr_spearman": 0.7035811878611213, "eval_stsb_spearman": 0.7765021123848508, "step": 15500 }, { "epoch": 1.0, "eval_avg_sts": 0.7400548448254956, "eval_sickr_spearman": 0.7035970861556974, "eval_stsb_spearman": 0.7765126034952938, "step": 15625 }, { "epoch": 1.0, "step": 15626, "total_flos": 42723641240930304, "train_runtime": 11103.0207, "train_samples_per_second": 1.407 } ], "max_steps": 15626, "num_train_epochs": 1, "total_flos": 42723641240930304, "trial_name": null, "trial_params": null }