unsup-AudioCSE-bert-base-uncased / trainer_state.json
gcyzsl's picture
Upload trainer_state.json with huggingface_hub
9e73009
raw
history blame
28.4 kB
{
"best_metric": 0.8450403429578367,
"best_model_checkpoint": "result/my-unsup-simcse-bert-base-uncased/SupCon-48-0.01-2e-7-0.07-0.00",
"epoch": 1.0,
"global_step": 15626,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.01,
"eval_avg_sts": 0.6273981488926212,
"eval_sickr_spearman": 0.6211010277251597,
"eval_stsb_spearman": 0.6336952700600829,
"step": 125
},
{
"epoch": 0.02,
"eval_avg_sts": 0.6557459351486706,
"eval_sickr_spearman": 0.6424095455671641,
"eval_stsb_spearman": 0.6690823247301771,
"step": 250
},
{
"epoch": 0.02,
"eval_avg_sts": 0.709441256238345,
"eval_sickr_spearman": 0.6938704999278709,
"eval_stsb_spearman": 0.7250120125488192,
"step": 375
},
{
"epoch": 0.03,
"learning_rate": 2.9040061436068092e-05,
"loss": 0.0093,
"step": 500
},
{
"epoch": 0.03,
"eval_avg_sts": 0.745161269369824,
"eval_sickr_spearman": 0.7196067168248462,
"eval_stsb_spearman": 0.7707158219148017,
"step": 500
},
{
"epoch": 0.04,
"eval_avg_sts": 0.7476897637271698,
"eval_sickr_spearman": 0.7177654445512162,
"eval_stsb_spearman": 0.7776140829031234,
"step": 625
},
{
"epoch": 0.05,
"eval_avg_sts": 0.7524926746389684,
"eval_sickr_spearman": 0.7211576410902829,
"eval_stsb_spearman": 0.7838277081876538,
"step": 750
},
{
"epoch": 0.06,
"eval_avg_sts": 0.7584753747432835,
"eval_sickr_spearman": 0.7179680397370821,
"eval_stsb_spearman": 0.7989827097494849,
"step": 875
},
{
"epoch": 0.06,
"learning_rate": 2.8080122872136184e-05,
"loss": 0.0003,
"step": 1000
},
{
"epoch": 0.06,
"eval_avg_sts": 0.7586746687828863,
"eval_sickr_spearman": 0.718746960109104,
"eval_stsb_spearman": 0.7986023774566684,
"step": 1000
},
{
"epoch": 0.07,
"eval_avg_sts": 0.7574999857715704,
"eval_sickr_spearman": 0.7175820618059254,
"eval_stsb_spearman": 0.7974179097372154,
"step": 1125
},
{
"epoch": 0.08,
"eval_avg_sts": 0.7696978971940565,
"eval_sickr_spearman": 0.7239500252345904,
"eval_stsb_spearman": 0.8154457691535225,
"step": 1250
},
{
"epoch": 0.09,
"eval_avg_sts": 0.7711009245923006,
"eval_sickr_spearman": 0.7253843780168369,
"eval_stsb_spearman": 0.8168174711677644,
"step": 1375
},
{
"epoch": 0.1,
"learning_rate": 2.7120184308204276e-05,
"loss": 0.0001,
"step": 1500
},
{
"epoch": 0.1,
"eval_avg_sts": 0.7722992846813606,
"eval_sickr_spearman": 0.7252976338476396,
"eval_stsb_spearman": 0.8193009355150815,
"step": 1500
},
{
"epoch": 0.1,
"eval_avg_sts": 0.773722019273226,
"eval_sickr_spearman": 0.7276583624833227,
"eval_stsb_spearman": 0.8197856760631294,
"step": 1625
},
{
"epoch": 0.11,
"eval_avg_sts": 0.7734992972011999,
"eval_sickr_spearman": 0.7251570468137302,
"eval_stsb_spearman": 0.8218415475886697,
"step": 1750
},
{
"epoch": 0.12,
"eval_avg_sts": 0.772300977896672,
"eval_sickr_spearman": 0.7260308286110924,
"eval_stsb_spearman": 0.8185711271822516,
"step": 1875
},
{
"epoch": 0.13,
"learning_rate": 2.6160245744272367e-05,
"loss": 0.0001,
"step": 2000
},
{
"epoch": 0.13,
"eval_avg_sts": 0.7741215013840628,
"eval_sickr_spearman": 0.7290128395438775,
"eval_stsb_spearman": 0.8192301632242479,
"step": 2000
},
{
"epoch": 0.14,
"eval_avg_sts": 0.7845043729289752,
"eval_sickr_spearman": 0.7357584234920489,
"eval_stsb_spearman": 0.8332503223659016,
"step": 2125
},
{
"epoch": 0.14,
"eval_avg_sts": 0.7824068340883688,
"eval_sickr_spearman": 0.7413625963456452,
"eval_stsb_spearman": 0.8234510718310922,
"step": 2250
},
{
"epoch": 0.15,
"eval_avg_sts": 0.7801565471575205,
"eval_sickr_spearman": 0.7272591759992707,
"eval_stsb_spearman": 0.8330539183157702,
"step": 2375
},
{
"epoch": 0.16,
"learning_rate": 2.5200307180340456e-05,
"loss": 0.0001,
"step": 2500
},
{
"epoch": 0.16,
"eval_avg_sts": 0.7817040476834756,
"eval_sickr_spearman": 0.7317218416960886,
"eval_stsb_spearman": 0.8316862536708627,
"step": 2500
},
{
"epoch": 0.17,
"eval_avg_sts": 0.7834051453081208,
"eval_sickr_spearman": 0.7332758879831186,
"eval_stsb_spearman": 0.8335344026331228,
"step": 2625
},
{
"epoch": 0.18,
"eval_avg_sts": 0.7846122957465609,
"eval_sickr_spearman": 0.737042534988997,
"eval_stsb_spearman": 0.8321820565041248,
"step": 2750
},
{
"epoch": 0.18,
"eval_avg_sts": 0.7930382359535035,
"eval_sickr_spearman": 0.7410361289491703,
"eval_stsb_spearman": 0.8450403429578367,
"step": 2875
},
{
"epoch": 0.19,
"learning_rate": 2.424036861640855e-05,
"loss": 0.0001,
"step": 3000
},
{
"epoch": 0.19,
"eval_avg_sts": 0.784546743206133,
"eval_sickr_spearman": 0.7335979365182612,
"eval_stsb_spearman": 0.8354955498940048,
"step": 3000
},
{
"epoch": 0.2,
"eval_avg_sts": 0.7879357699638411,
"eval_sickr_spearman": 0.7380969137277664,
"eval_stsb_spearman": 0.8377746261999157,
"step": 3125
},
{
"epoch": 0.21,
"eval_avg_sts": 0.7885921401422298,
"eval_sickr_spearman": 0.7360949774198258,
"eval_stsb_spearman": 0.8410893028646337,
"step": 3250
},
{
"epoch": 0.22,
"eval_avg_sts": 0.7886813707449458,
"eval_sickr_spearman": 0.7360677437853104,
"eval_stsb_spearman": 0.8412949977045814,
"step": 3375
},
{
"epoch": 0.22,
"learning_rate": 2.3280430052476642e-05,
"loss": 0.0002,
"step": 3500
},
{
"epoch": 0.22,
"eval_avg_sts": 0.7885894531415549,
"eval_sickr_spearman": 0.7365915229464931,
"eval_stsb_spearman": 0.8405873833366166,
"step": 3500
},
{
"epoch": 0.23,
"eval_avg_sts": 0.7907895913811233,
"eval_sickr_spearman": 0.7414235958444714,
"eval_stsb_spearman": 0.8401555869177751,
"step": 3625
},
{
"epoch": 0.24,
"eval_avg_sts": 0.7899099014596336,
"eval_sickr_spearman": 0.7422593370094946,
"eval_stsb_spearman": 0.8375604659097725,
"step": 3750
},
{
"epoch": 0.25,
"eval_avg_sts": 0.781954087673714,
"eval_sickr_spearman": 0.7436439776017526,
"eval_stsb_spearman": 0.8202641977456754,
"step": 3875
},
{
"epoch": 0.26,
"learning_rate": 2.2320491488544734e-05,
"loss": 0.0001,
"step": 4000
},
{
"epoch": 0.26,
"eval_avg_sts": 0.7846807378527296,
"eval_sickr_spearman": 0.743132158184828,
"eval_stsb_spearman": 0.8262293175206311,
"step": 4000
},
{
"epoch": 0.26,
"eval_avg_sts": 0.7825345568897543,
"eval_sickr_spearman": 0.7449149766080079,
"eval_stsb_spearman": 0.8201541371715007,
"step": 4125
},
{
"epoch": 0.27,
"eval_avg_sts": 0.7860788226540287,
"eval_sickr_spearman": 0.7454807349518474,
"eval_stsb_spearman": 0.8266769103562102,
"step": 4250
},
{
"epoch": 0.28,
"eval_avg_sts": 0.7867018278295852,
"eval_sickr_spearman": 0.7445308238587058,
"eval_stsb_spearman": 0.8288728318004647,
"step": 4375
},
{
"epoch": 0.29,
"learning_rate": 2.1360552924612826e-05,
"loss": 0.0001,
"step": 4500
},
{
"epoch": 0.29,
"eval_avg_sts": 0.776783766738095,
"eval_sickr_spearman": 0.7318758294072991,
"eval_stsb_spearman": 0.8216917040688909,
"step": 4500
},
{
"epoch": 0.3,
"eval_avg_sts": 0.7675528732476737,
"eval_sickr_spearman": 0.7320309698649442,
"eval_stsb_spearman": 0.8030747766304034,
"step": 4625
},
{
"epoch": 0.3,
"eval_avg_sts": 0.7715011023405255,
"eval_sickr_spearman": 0.7350243641687703,
"eval_stsb_spearman": 0.8079778405122807,
"step": 4750
},
{
"epoch": 0.31,
"eval_avg_sts": 0.7687077375569937,
"eval_sickr_spearman": 0.7408402100864042,
"eval_stsb_spearman": 0.7965752650275834,
"step": 4875
},
{
"epoch": 0.32,
"learning_rate": 2.0400614360680917e-05,
"loss": 0.0001,
"step": 5000
},
{
"epoch": 0.32,
"eval_avg_sts": 0.7738965818092367,
"eval_sickr_spearman": 0.7445124279468551,
"eval_stsb_spearman": 0.8032807356716183,
"step": 5000
},
{
"epoch": 0.33,
"eval_avg_sts": 0.7793196132942312,
"eval_sickr_spearman": 0.7457236762629214,
"eval_stsb_spearman": 0.812915550325541,
"step": 5125
},
{
"epoch": 0.34,
"eval_avg_sts": 0.7836274650846277,
"eval_sickr_spearman": 0.7464208957313971,
"eval_stsb_spearman": 0.8208340344378582,
"step": 5250
},
{
"epoch": 0.34,
"eval_avg_sts": 0.7826458926642379,
"eval_sickr_spearman": 0.7464102328268778,
"eval_stsb_spearman": 0.818881552501598,
"step": 5375
},
{
"epoch": 0.35,
"learning_rate": 1.944067579674901e-05,
"loss": 0.0001,
"step": 5500
},
{
"epoch": 0.35,
"eval_avg_sts": 0.7837446296343489,
"eval_sickr_spearman": 0.7486399806489393,
"eval_stsb_spearman": 0.8188492786197583,
"step": 5500
},
{
"epoch": 0.36,
"eval_avg_sts": 0.7830869728965355,
"eval_sickr_spearman": 0.7479103882180944,
"eval_stsb_spearman": 0.8182635575749767,
"step": 5625
},
{
"epoch": 0.37,
"eval_avg_sts": 0.783785645301962,
"eval_sickr_spearman": 0.7470566353900319,
"eval_stsb_spearman": 0.8205146552138923,
"step": 5750
},
{
"epoch": 0.38,
"eval_avg_sts": 0.7841049239457296,
"eval_sickr_spearman": 0.7275643656178084,
"eval_stsb_spearman": 0.8406454822736508,
"step": 5875
},
{
"epoch": 0.38,
"learning_rate": 1.84807372328171e-05,
"loss": 0.0001,
"step": 6000
},
{
"epoch": 0.38,
"eval_avg_sts": 0.7827015978431489,
"eval_sickr_spearman": 0.7361094828124602,
"eval_stsb_spearman": 0.8292937128738374,
"step": 6000
},
{
"epoch": 0.39,
"eval_avg_sts": 0.7835582939326338,
"eval_sickr_spearman": 0.7403639336845438,
"eval_stsb_spearman": 0.8267526541807237,
"step": 6125
},
{
"epoch": 0.4,
"eval_avg_sts": 0.7833004559230021,
"eval_sickr_spearman": 0.7409274345666157,
"eval_stsb_spearman": 0.8256734772793887,
"step": 6250
},
{
"epoch": 0.41,
"eval_avg_sts": 0.783274693136238,
"eval_sickr_spearman": 0.7396373672130896,
"eval_stsb_spearman": 0.8269120190593864,
"step": 6375
},
{
"epoch": 0.42,
"learning_rate": 1.7520798668885192e-05,
"loss": 0.0,
"step": 6500
},
{
"epoch": 0.42,
"eval_avg_sts": 0.7844400031801044,
"eval_sickr_spearman": 0.7315539729965624,
"eval_stsb_spearman": 0.8373260333636465,
"step": 6500
},
{
"epoch": 0.42,
"eval_avg_sts": 0.7830541155839421,
"eval_sickr_spearman": 0.7372136217723195,
"eval_stsb_spearman": 0.8288946093955648,
"step": 6625
},
{
"epoch": 0.43,
"eval_avg_sts": 0.7788362702655598,
"eval_sickr_spearman": 0.7408482312803444,
"eval_stsb_spearman": 0.8168243092507751,
"step": 6750
},
{
"epoch": 0.44,
"eval_avg_sts": 0.7825535757514819,
"eval_sickr_spearman": 0.7452765067085325,
"eval_stsb_spearman": 0.8198306447944311,
"step": 6875
},
{
"epoch": 0.45,
"learning_rate": 1.6560860104953284e-05,
"loss": 0.0002,
"step": 7000
},
{
"epoch": 0.45,
"eval_avg_sts": 0.7831901309892826,
"eval_sickr_spearman": 0.7458346761383449,
"eval_stsb_spearman": 0.8205455858402203,
"step": 7000
},
{
"epoch": 0.46,
"eval_avg_sts": 0.7829404428906377,
"eval_sickr_spearman": 0.7454985064593795,
"eval_stsb_spearman": 0.8203823793218957,
"step": 7125
},
{
"epoch": 0.46,
"eval_avg_sts": 0.7827889218134074,
"eval_sickr_spearman": 0.7466705133655709,
"eval_stsb_spearman": 0.8189073302612438,
"step": 7250
},
{
"epoch": 0.47,
"eval_avg_sts": 0.7388870312908111,
"eval_sickr_spearman": 0.7199674303966463,
"eval_stsb_spearman": 0.7578066321849759,
"step": 7375
},
{
"epoch": 0.48,
"learning_rate": 1.5600921541021372e-05,
"loss": 0.0001,
"step": 7500
},
{
"epoch": 0.48,
"eval_avg_sts": 0.7359950441852947,
"eval_sickr_spearman": 0.7141863589964538,
"eval_stsb_spearman": 0.7578037293741355,
"step": 7500
},
{
"epoch": 0.49,
"eval_avg_sts": 0.7514533824270638,
"eval_sickr_spearman": 0.7285877642961502,
"eval_stsb_spearman": 0.7743190005579774,
"step": 7625
},
{
"epoch": 0.5,
"eval_avg_sts": 0.7601125755242234,
"eval_sickr_spearman": 0.7424667353055044,
"eval_stsb_spearman": 0.7777584157429424,
"step": 7750
},
{
"epoch": 0.5,
"eval_avg_sts": 0.7621753865509604,
"eval_sickr_spearman": 0.7417763842845344,
"eval_stsb_spearman": 0.7825743888173865,
"step": 7875
},
{
"epoch": 0.51,
"learning_rate": 1.4640982977089467e-05,
"loss": 0.0001,
"step": 8000
},
{
"epoch": 0.51,
"eval_avg_sts": 0.765106348392491,
"eval_sickr_spearman": 0.743488885175209,
"eval_stsb_spearman": 0.7867238116097731,
"step": 8000
},
{
"epoch": 0.52,
"eval_avg_sts": 0.7718140060309099,
"eval_sickr_spearman": 0.7408926538151189,
"eval_stsb_spearman": 0.8027353582467008,
"step": 8125
},
{
"epoch": 0.53,
"eval_avg_sts": 0.7689694127054261,
"eval_sickr_spearman": 0.7398511536455906,
"eval_stsb_spearman": 0.7980876717652616,
"step": 8250
},
{
"epoch": 0.54,
"eval_avg_sts": 0.7658098489708387,
"eval_sickr_spearman": 0.7388756900064839,
"eval_stsb_spearman": 0.7927440079351934,
"step": 8375
},
{
"epoch": 0.54,
"learning_rate": 1.368104441315756e-05,
"loss": 0.0001,
"step": 8500
},
{
"epoch": 0.54,
"eval_avg_sts": 0.7748332537811696,
"eval_sickr_spearman": 0.7417694197748259,
"eval_stsb_spearman": 0.8078970877875133,
"step": 8500
},
{
"epoch": 0.55,
"eval_avg_sts": 0.7748339728955141,
"eval_sickr_spearman": 0.7419876730997608,
"eval_stsb_spearman": 0.8076802726912675,
"step": 8625
},
{
"epoch": 0.56,
"eval_avg_sts": 0.7709733616182656,
"eval_sickr_spearman": 0.7395425057877492,
"eval_stsb_spearman": 0.802404217448782,
"step": 8750
},
{
"epoch": 0.57,
"eval_avg_sts": 0.7564357671357971,
"eval_sickr_spearman": 0.7294577516364988,
"eval_stsb_spearman": 0.7834137826350953,
"step": 8875
},
{
"epoch": 0.58,
"learning_rate": 1.2721105849225649e-05,
"loss": 0.0001,
"step": 9000
},
{
"epoch": 0.58,
"eval_avg_sts": 0.7576635056813905,
"eval_sickr_spearman": 0.7307409985736208,
"eval_stsb_spearman": 0.7845860127891603,
"step": 9000
},
{
"epoch": 0.58,
"eval_avg_sts": 0.7317573459891697,
"eval_sickr_spearman": 0.6975396437978298,
"eval_stsb_spearman": 0.7659750481805098,
"step": 9125
},
{
"epoch": 0.59,
"eval_avg_sts": 0.7296831294381873,
"eval_sickr_spearman": 0.6969872861312915,
"eval_stsb_spearman": 0.762378972745083,
"step": 9250
},
{
"epoch": 0.6,
"eval_avg_sts": 0.7711811922498575,
"eval_sickr_spearman": 0.7350368042240428,
"eval_stsb_spearman": 0.8073255802756722,
"step": 9375
},
{
"epoch": 0.61,
"learning_rate": 1.176116728529374e-05,
"loss": 0.0002,
"step": 9500
},
{
"epoch": 0.61,
"eval_avg_sts": 0.7655418136173882,
"eval_sickr_spearman": 0.7299852291924921,
"eval_stsb_spearman": 0.8010983980422841,
"step": 9500
},
{
"epoch": 0.62,
"eval_avg_sts": 0.7550596227536142,
"eval_sickr_spearman": 0.7207706545059959,
"eval_stsb_spearman": 0.7893485910012326,
"step": 9625
},
{
"epoch": 0.62,
"eval_avg_sts": 0.7634673032356596,
"eval_sickr_spearman": 0.7285461213312034,
"eval_stsb_spearman": 0.7983884851401158,
"step": 9750
},
{
"epoch": 0.63,
"eval_avg_sts": 0.7638598931096033,
"eval_sickr_spearman": 0.7283572630403488,
"eval_stsb_spearman": 0.7993625231788579,
"step": 9875
},
{
"epoch": 0.64,
"learning_rate": 1.0801228721361832e-05,
"loss": 0.0001,
"step": 10000
},
{
"epoch": 0.64,
"eval_avg_sts": 0.7667803597063858,
"eval_sickr_spearman": 0.7305812951613392,
"eval_stsb_spearman": 0.8029794242514324,
"step": 10000
},
{
"epoch": 0.65,
"eval_avg_sts": 0.7671530524779411,
"eval_sickr_spearman": 0.7299761993454218,
"eval_stsb_spearman": 0.8043299056104602,
"step": 10125
},
{
"epoch": 0.66,
"eval_avg_sts": 0.7744197669930808,
"eval_sickr_spearman": 0.7359438715747014,
"eval_stsb_spearman": 0.8128956624114603,
"step": 10250
},
{
"epoch": 0.66,
"eval_avg_sts": 0.7734565612749292,
"eval_sickr_spearman": 0.7352129342730163,
"eval_stsb_spearman": 0.8117001882768422,
"step": 10375
},
{
"epoch": 0.67,
"learning_rate": 9.841290157429926e-06,
"loss": 0.0001,
"step": 10500
},
{
"epoch": 0.67,
"eval_avg_sts": 0.7702705095845273,
"eval_sickr_spearman": 0.7336898680464138,
"eval_stsb_spearman": 0.8068511511226406,
"step": 10500
},
{
"epoch": 0.68,
"eval_avg_sts": 0.7638028086321877,
"eval_sickr_spearman": 0.7270147871880277,
"eval_stsb_spearman": 0.8005908300763477,
"step": 10625
},
{
"epoch": 0.69,
"eval_avg_sts": 0.7647879756637017,
"eval_sickr_spearman": 0.7278573073054794,
"eval_stsb_spearman": 0.8017186440219239,
"step": 10750
},
{
"epoch": 0.7,
"eval_avg_sts": 0.7646746212752267,
"eval_sickr_spearman": 0.7282990493454058,
"eval_stsb_spearman": 0.8010501932050476,
"step": 10875
},
{
"epoch": 0.7,
"learning_rate": 8.881351593498018e-06,
"loss": 0.0001,
"step": 11000
},
{
"epoch": 0.7,
"eval_avg_sts": 0.7595715432510943,
"eval_sickr_spearman": 0.7220255630932696,
"eval_stsb_spearman": 0.797117523408919,
"step": 11000
},
{
"epoch": 0.71,
"eval_avg_sts": 0.7637796865890665,
"eval_sickr_spearman": 0.725214251855543,
"eval_stsb_spearman": 0.80234512132259,
"step": 11125
},
{
"epoch": 0.72,
"eval_avg_sts": 0.7642527416188507,
"eval_sickr_spearman": 0.7212445773838859,
"eval_stsb_spearman": 0.8072609058538154,
"step": 11250
},
{
"epoch": 0.73,
"eval_avg_sts": 0.7625844941093753,
"eval_sickr_spearman": 0.7204506713082153,
"eval_stsb_spearman": 0.8047183169105355,
"step": 11375
},
{
"epoch": 0.74,
"learning_rate": 7.921413029566108e-06,
"loss": 0.0001,
"step": 11500
},
{
"epoch": 0.74,
"eval_avg_sts": 0.7631529336672214,
"eval_sickr_spearman": 0.7210336728174711,
"eval_stsb_spearman": 0.8052721945169715,
"step": 11500
},
{
"epoch": 0.74,
"eval_avg_sts": 0.7627819801067925,
"eval_sickr_spearman": 0.7209199351692657,
"eval_stsb_spearman": 0.8046440250443194,
"step": 11625
},
{
"epoch": 0.75,
"eval_avg_sts": 0.7612502434175876,
"eval_sickr_spearman": 0.7199052781513854,
"eval_stsb_spearman": 0.80259520868379,
"step": 11750
},
{
"epoch": 0.76,
"eval_avg_sts": 0.7549680843862416,
"eval_sickr_spearman": 0.7153213339234363,
"eval_stsb_spearman": 0.7946148348490468,
"step": 11875
},
{
"epoch": 0.77,
"learning_rate": 6.961474465634199e-06,
"loss": 0.0001,
"step": 12000
},
{
"epoch": 0.77,
"eval_avg_sts": 0.7566929851670519,
"eval_sickr_spearman": 0.7169140932782255,
"eval_stsb_spearman": 0.7964718770558783,
"step": 12000
},
{
"epoch": 0.78,
"eval_avg_sts": 0.7582762962904481,
"eval_sickr_spearman": 0.7181445060037657,
"eval_stsb_spearman": 0.7984080865771305,
"step": 12125
},
{
"epoch": 0.78,
"eval_avg_sts": 0.7575591207437209,
"eval_sickr_spearman": 0.7175433967692678,
"eval_stsb_spearman": 0.7975748447181741,
"step": 12250
},
{
"epoch": 0.79,
"eval_avg_sts": 0.7574126393782543,
"eval_sickr_spearman": 0.7182304336442386,
"eval_stsb_spearman": 0.7965948451122701,
"step": 12375
},
{
"epoch": 0.8,
"learning_rate": 6.001535901702292e-06,
"loss": 0.0001,
"step": 12500
},
{
"epoch": 0.8,
"eval_avg_sts": 0.7552374803740505,
"eval_sickr_spearman": 0.7164459341325082,
"eval_stsb_spearman": 0.7940290266155928,
"step": 12500
},
{
"epoch": 0.81,
"eval_avg_sts": 0.7551510628378968,
"eval_sickr_spearman": 0.7162126951039248,
"eval_stsb_spearman": 0.7940894305718689,
"step": 12625
},
{
"epoch": 0.82,
"eval_avg_sts": 0.7563770556022249,
"eval_sickr_spearman": 0.7171387347396517,
"eval_stsb_spearman": 0.7956153764647981,
"step": 12750
},
{
"epoch": 0.82,
"eval_avg_sts": 0.7568538616101905,
"eval_sickr_spearman": 0.7173768249094804,
"eval_stsb_spearman": 0.7963308983109005,
"step": 12875
},
{
"epoch": 0.83,
"learning_rate": 5.0415973377703825e-06,
"loss": 0.0001,
"step": 13000
},
{
"epoch": 0.83,
"eval_avg_sts": 0.7559100330626112,
"eval_sickr_spearman": 0.7166905085010312,
"eval_stsb_spearman": 0.7951295576241912,
"step": 13000
},
{
"epoch": 0.84,
"eval_avg_sts": 0.7564848751035596,
"eval_sickr_spearman": 0.7171825391041632,
"eval_stsb_spearman": 0.795787211102956,
"step": 13125
},
{
"epoch": 0.85,
"eval_avg_sts": 0.7488530315390816,
"eval_sickr_spearman": 0.7127996050357326,
"eval_stsb_spearman": 0.7849064580424306,
"step": 13250
},
{
"epoch": 0.86,
"eval_avg_sts": 0.7484617861410546,
"eval_sickr_spearman": 0.7117017581501617,
"eval_stsb_spearman": 0.7852218141319476,
"step": 13375
},
{
"epoch": 0.86,
"learning_rate": 4.081658773838474e-06,
"loss": 0.0001,
"step": 13500
},
{
"epoch": 0.86,
"eval_avg_sts": 0.7469284581969524,
"eval_sickr_spearman": 0.7094133163221428,
"eval_stsb_spearman": 0.784443600071762,
"step": 13500
},
{
"epoch": 0.87,
"eval_avg_sts": 0.7479276349305448,
"eval_sickr_spearman": 0.7103837366955984,
"eval_stsb_spearman": 0.7854715331654911,
"step": 13625
},
{
"epoch": 0.88,
"eval_avg_sts": 0.7420231480320236,
"eval_sickr_spearman": 0.7062097379184235,
"eval_stsb_spearman": 0.7778365581456238,
"step": 13750
},
{
"epoch": 0.89,
"eval_avg_sts": 0.7411633122563288,
"eval_sickr_spearman": 0.7050106895021224,
"eval_stsb_spearman": 0.7773159350105353,
"step": 13875
},
{
"epoch": 0.9,
"learning_rate": 3.121720209906566e-06,
"loss": 0.0001,
"step": 14000
},
{
"epoch": 0.9,
"eval_avg_sts": 0.7412314874976924,
"eval_sickr_spearman": 0.7050875872955249,
"eval_stsb_spearman": 0.7773753876998599,
"step": 14000
},
{
"epoch": 0.9,
"eval_avg_sts": 0.732587447078523,
"eval_sickr_spearman": 0.6977087132748919,
"eval_stsb_spearman": 0.767466180882154,
"step": 14125
},
{
"epoch": 0.91,
"eval_avg_sts": 0.7298853871265888,
"eval_sickr_spearman": 0.6949198834320908,
"eval_stsb_spearman": 0.7648508908210868,
"step": 14250
},
{
"epoch": 0.92,
"eval_avg_sts": 0.7308218986367342,
"eval_sickr_spearman": 0.6958364129097329,
"eval_stsb_spearman": 0.7658073843637355,
"step": 14375
},
{
"epoch": 0.93,
"learning_rate": 2.1617816459746575e-06,
"loss": 0.0,
"step": 14500
},
{
"epoch": 0.93,
"eval_avg_sts": 0.7317585701181548,
"eval_sickr_spearman": 0.6965340166270201,
"eval_stsb_spearman": 0.7669831236092894,
"step": 14500
},
{
"epoch": 0.94,
"eval_avg_sts": 0.732111710583657,
"eval_sickr_spearman": 0.696954673013415,
"eval_stsb_spearman": 0.7672687481538989,
"step": 14625
},
{
"epoch": 0.94,
"eval_avg_sts": 0.7375915728397734,
"eval_sickr_spearman": 0.7017668130042967,
"eval_stsb_spearman": 0.7734163326752501,
"step": 14750
},
{
"epoch": 0.95,
"eval_avg_sts": 0.737608211926382,
"eval_sickr_spearman": 0.7017644594803262,
"eval_stsb_spearman": 0.7734519643724378,
"step": 14875
},
{
"epoch": 0.96,
"learning_rate": 1.2018430820427492e-06,
"loss": 0.0001,
"step": 15000
},
{
"epoch": 0.96,
"eval_avg_sts": 0.7377728901345266,
"eval_sickr_spearman": 0.7023058180246352,
"eval_stsb_spearman": 0.7732399622444179,
"step": 15000
},
{
"epoch": 0.97,
"eval_avg_sts": 0.7394088348935646,
"eval_sickr_spearman": 0.7037121206436416,
"eval_stsb_spearman": 0.7751055491434876,
"step": 15125
},
{
"epoch": 0.98,
"eval_avg_sts": 0.7393669904391786,
"eval_sickr_spearman": 0.7033311859781359,
"eval_stsb_spearman": 0.7754027949002213,
"step": 15250
},
{
"epoch": 0.98,
"eval_avg_sts": 0.7399944883836842,
"eval_sickr_spearman": 0.7034986223977493,
"eval_stsb_spearman": 0.776490354369619,
"step": 15375
},
{
"epoch": 0.99,
"learning_rate": 2.4190451811084087e-07,
"loss": 0.0001,
"step": 15500
},
{
"epoch": 0.99,
"eval_avg_sts": 0.7400416501229861,
"eval_sickr_spearman": 0.7035811878611213,
"eval_stsb_spearman": 0.7765021123848508,
"step": 15500
},
{
"epoch": 1.0,
"eval_avg_sts": 0.7400548448254956,
"eval_sickr_spearman": 0.7035970861556974,
"eval_stsb_spearman": 0.7765126034952938,
"step": 15625
},
{
"epoch": 1.0,
"step": 15626,
"total_flos": 42723641240930304,
"train_runtime": 11103.0207,
"train_samples_per_second": 1.407
}
],
"max_steps": 15626,
"num_train_epochs": 1,
"total_flos": 42723641240930304,
"trial_name": null,
"trial_params": null
}