InfoCSE-bert-large / trainer_state.json
root
init
88ed5da
{
"best_metric": 0.8631831216150027,
"best_model_checkpoint": "result/InfoCSE-bert-large",
"epoch": 2.0,
"global_step": 31252,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.01,
"eval_avg_sts": 0.6667446229182062,
"eval_sickr_spearman": 0.6627723790529534,
"eval_stsb_spearman": 0.6707168667834591,
"step": 125
},
{
"epoch": 0.02,
"eval_avg_sts": 0.7051305088963267,
"eval_sickr_spearman": 0.6969365172570714,
"eval_stsb_spearman": 0.713324500535582,
"step": 250
},
{
"epoch": 0.02,
"eval_avg_sts": 0.725875395370044,
"eval_sickr_spearman": 0.716654533206054,
"eval_stsb_spearman": 0.735096257534034,
"step": 375
},
{
"epoch": 0.03,
"learning_rate": 6.888007167541277e-06,
"loss": 0.001,
"step": 500
},
{
"epoch": 0.03,
"eval_avg_sts": 0.7357340574594278,
"eval_sickr_spearman": 0.7235103965631273,
"eval_stsb_spearman": 0.7479577183557282,
"step": 500
},
{
"epoch": 0.04,
"eval_avg_sts": 0.7464037729944727,
"eval_sickr_spearman": 0.7301059313504061,
"eval_stsb_spearman": 0.7627016146385392,
"step": 625
},
{
"epoch": 0.05,
"eval_avg_sts": 0.7591284137806686,
"eval_sickr_spearman": 0.7344878567657066,
"eval_stsb_spearman": 0.7837689707956308,
"step": 750
},
{
"epoch": 0.06,
"eval_avg_sts": 0.7608889169495914,
"eval_sickr_spearman": 0.7373875423906269,
"eval_stsb_spearman": 0.7843902915085559,
"step": 875
},
{
"epoch": 0.06,
"learning_rate": 6.776014335082554e-06,
"loss": 0.0002,
"step": 1000
},
{
"epoch": 0.06,
"eval_avg_sts": 0.7633437897321462,
"eval_sickr_spearman": 0.7394359247736582,
"eval_stsb_spearman": 0.7872516546906342,
"step": 1000
},
{
"epoch": 0.07,
"eval_avg_sts": 0.7689886003242912,
"eval_sickr_spearman": 0.7459672900094155,
"eval_stsb_spearman": 0.7920099106391669,
"step": 1125
},
{
"epoch": 0.08,
"eval_avg_sts": 0.7695141299706598,
"eval_sickr_spearman": 0.749662274611948,
"eval_stsb_spearman": 0.7893659853293715,
"step": 1250
},
{
"epoch": 0.09,
"eval_avg_sts": 0.771575990947651,
"eval_sickr_spearman": 0.7507335602984238,
"eval_stsb_spearman": 0.7924184215968783,
"step": 1375
},
{
"epoch": 0.1,
"learning_rate": 6.6640215026238325e-06,
"loss": 0.0003,
"step": 1500
},
{
"epoch": 0.1,
"eval_avg_sts": 0.7721249223821594,
"eval_sickr_spearman": 0.7508546947362507,
"eval_stsb_spearman": 0.7933951500280679,
"step": 1500
},
{
"epoch": 0.1,
"eval_avg_sts": 0.7736414601237904,
"eval_sickr_spearman": 0.7518223773369244,
"eval_stsb_spearman": 0.7954605429106565,
"step": 1625
},
{
"epoch": 0.11,
"eval_avg_sts": 0.7750895970401648,
"eval_sickr_spearman": 0.7527568224154028,
"eval_stsb_spearman": 0.7974223716649267,
"step": 1750
},
{
"epoch": 0.12,
"eval_avg_sts": 0.7776564224610277,
"eval_sickr_spearman": 0.7542352378193863,
"eval_stsb_spearman": 0.8010776071026692,
"step": 1875
},
{
"epoch": 0.13,
"learning_rate": 6.55202867016511e-06,
"loss": 0.0001,
"step": 2000
},
{
"epoch": 0.13,
"eval_avg_sts": 0.7785919822208553,
"eval_sickr_spearman": 0.7546353668237488,
"eval_stsb_spearman": 0.802548597617962,
"step": 2000
},
{
"epoch": 0.14,
"eval_avg_sts": 0.7804785012417673,
"eval_sickr_spearman": 0.7560601133857076,
"eval_stsb_spearman": 0.8048968890978271,
"step": 2125
},
{
"epoch": 0.14,
"eval_avg_sts": 0.7791958793390172,
"eval_sickr_spearman": 0.7571627153503209,
"eval_stsb_spearman": 0.8012290433277136,
"step": 2250
},
{
"epoch": 0.15,
"eval_avg_sts": 0.7808643358009081,
"eval_sickr_spearman": 0.757428807652288,
"eval_stsb_spearman": 0.8042998639495281,
"step": 2375
},
{
"epoch": 0.16,
"learning_rate": 6.440035837706387e-06,
"loss": 0.0005,
"step": 2500
},
{
"epoch": 0.16,
"eval_avg_sts": 0.7997499220712412,
"eval_sickr_spearman": 0.7682156324132593,
"eval_stsb_spearman": 0.8312842117292232,
"step": 2500
},
{
"epoch": 0.17,
"eval_avg_sts": 0.8000945443564438,
"eval_sickr_spearman": 0.769006603032424,
"eval_stsb_spearman": 0.8311824856804637,
"step": 2625
},
{
"epoch": 0.18,
"eval_avg_sts": 0.8015655863550484,
"eval_sickr_spearman": 0.7697635307193054,
"eval_stsb_spearman": 0.8333676419907914,
"step": 2750
},
{
"epoch": 0.18,
"eval_avg_sts": 0.8020135971999303,
"eval_sickr_spearman": 0.7738109675441908,
"eval_stsb_spearman": 0.8302162268556699,
"step": 2875
},
{
"epoch": 0.19,
"learning_rate": 6.328043005247664e-06,
"loss": 0.0001,
"step": 3000
},
{
"epoch": 0.19,
"eval_avg_sts": 0.8021055052889553,
"eval_sickr_spearman": 0.7723527913356312,
"eval_stsb_spearman": 0.8318582192422794,
"step": 3000
},
{
"epoch": 0.2,
"eval_avg_sts": 0.8034828561746414,
"eval_sickr_spearman": 0.7730187425570707,
"eval_stsb_spearman": 0.8339469697922121,
"step": 3125
},
{
"epoch": 0.21,
"eval_avg_sts": 0.809294388946485,
"eval_sickr_spearman": 0.7739637544778655,
"eval_stsb_spearman": 0.8446250234151045,
"step": 3250
},
{
"epoch": 0.22,
"eval_avg_sts": 0.8095468267478854,
"eval_sickr_spearman": 0.7742509804644655,
"eval_stsb_spearman": 0.8448426730313053,
"step": 3375
},
{
"epoch": 0.22,
"learning_rate": 6.2160501727889415e-06,
"loss": 0.0001,
"step": 3500
},
{
"epoch": 0.22,
"eval_avg_sts": 0.8075109934505635,
"eval_sickr_spearman": 0.7709388998025974,
"eval_stsb_spearman": 0.8440830870985296,
"step": 3500
},
{
"epoch": 0.23,
"eval_avg_sts": 0.8072613664062491,
"eval_sickr_spearman": 0.7727868483993274,
"eval_stsb_spearman": 0.8417358844131708,
"step": 3625
},
{
"epoch": 0.24,
"eval_avg_sts": 0.8035650181540979,
"eval_sickr_spearman": 0.7687000741023642,
"eval_stsb_spearman": 0.8384299622058315,
"step": 3750
},
{
"epoch": 0.25,
"eval_avg_sts": 0.8060855472554131,
"eval_sickr_spearman": 0.7709744428176617,
"eval_stsb_spearman": 0.8411966516931645,
"step": 3875
},
{
"epoch": 0.26,
"learning_rate": 6.104057340330219e-06,
"loss": 0.0004,
"step": 4000
},
{
"epoch": 0.26,
"eval_avg_sts": 0.803351813599069,
"eval_sickr_spearman": 0.7677387500328843,
"eval_stsb_spearman": 0.8389648771652538,
"step": 4000
},
{
"epoch": 0.26,
"eval_avg_sts": 0.802660483963512,
"eval_sickr_spearman": 0.7673760487601211,
"eval_stsb_spearman": 0.8379449191669028,
"step": 4125
},
{
"epoch": 0.27,
"eval_avg_sts": 0.8047314511229144,
"eval_sickr_spearman": 0.7691939779184522,
"eval_stsb_spearman": 0.8402689243273768,
"step": 4250
},
{
"epoch": 0.28,
"eval_avg_sts": 0.8040567267552472,
"eval_sickr_spearman": 0.7695367278583146,
"eval_stsb_spearman": 0.8385767256521798,
"step": 4375
},
{
"epoch": 0.29,
"learning_rate": 5.992064507871497e-06,
"loss": 0.0003,
"step": 4500
},
{
"epoch": 0.29,
"eval_avg_sts": 0.8031439674900422,
"eval_sickr_spearman": 0.7708419250087939,
"eval_stsb_spearman": 0.8354460099712906,
"step": 4500
},
{
"epoch": 0.3,
"eval_avg_sts": 0.8016452961027151,
"eval_sickr_spearman": 0.76836294380137,
"eval_stsb_spearman": 0.8349276484040601,
"step": 4625
},
{
"epoch": 0.3,
"eval_avg_sts": 0.8036856358976682,
"eval_sickr_spearman": 0.7702216513648221,
"eval_stsb_spearman": 0.8371496204305142,
"step": 4750
},
{
"epoch": 0.31,
"eval_avg_sts": 0.8061976413597232,
"eval_sickr_spearman": 0.7719798778640656,
"eval_stsb_spearman": 0.8404154048553806,
"step": 4875
},
{
"epoch": 0.32,
"learning_rate": 5.880071675412773e-06,
"loss": 0.0001,
"step": 5000
},
{
"epoch": 0.32,
"eval_avg_sts": 0.8067273899585344,
"eval_sickr_spearman": 0.7723029350523384,
"eval_stsb_spearman": 0.8411518448647305,
"step": 5000
},
{
"epoch": 0.33,
"eval_avg_sts": 0.8078358230567408,
"eval_sickr_spearman": 0.7726999601368258,
"eval_stsb_spearman": 0.8429716859766557,
"step": 5125
},
{
"epoch": 0.34,
"eval_avg_sts": 0.802548441043093,
"eval_sickr_spearman": 0.7676195664444124,
"eval_stsb_spearman": 0.8374773156417734,
"step": 5250
},
{
"epoch": 0.34,
"eval_avg_sts": 0.800628830120568,
"eval_sickr_spearman": 0.7634932625509655,
"eval_stsb_spearman": 0.8377643976901704,
"step": 5375
},
{
"epoch": 0.35,
"learning_rate": 5.7680788429540505e-06,
"loss": 0.0002,
"step": 5500
},
{
"epoch": 0.35,
"eval_avg_sts": 0.8020238168463023,
"eval_sickr_spearman": 0.7652266089396642,
"eval_stsb_spearman": 0.8388210247529404,
"step": 5500
},
{
"epoch": 0.36,
"eval_avg_sts": 0.8040364434874829,
"eval_sickr_spearman": 0.7675117846527851,
"eval_stsb_spearman": 0.8405611023221807,
"step": 5625
},
{
"epoch": 0.37,
"eval_avg_sts": 0.8016723711497669,
"eval_sickr_spearman": 0.7650260310600586,
"eval_stsb_spearman": 0.8383187112394752,
"step": 5750
},
{
"epoch": 0.38,
"eval_avg_sts": 0.8020864629480828,
"eval_sickr_spearman": 0.7653134972021658,
"eval_stsb_spearman": 0.8388594286939999,
"step": 5875
},
{
"epoch": 0.38,
"learning_rate": 5.656086010495328e-06,
"loss": 0.0001,
"step": 6000
},
{
"epoch": 0.38,
"eval_avg_sts": 0.8028151558848002,
"eval_sickr_spearman": 0.7671768637824573,
"eval_stsb_spearman": 0.838453447987143,
"step": 6000
},
{
"epoch": 0.39,
"eval_avg_sts": 0.8049514040827435,
"eval_sickr_spearman": 0.7685626571211498,
"eval_stsb_spearman": 0.8413401510443372,
"step": 6125
},
{
"epoch": 0.4,
"eval_avg_sts": 0.8059812583547672,
"eval_sickr_spearman": 0.7690958503782142,
"eval_stsb_spearman": 0.8428666663313202,
"step": 6250
},
{
"epoch": 0.41,
"eval_avg_sts": 0.8063265220940947,
"eval_sickr_spearman": 0.7693663135104123,
"eval_stsb_spearman": 0.8432867306777773,
"step": 6375
},
{
"epoch": 0.42,
"learning_rate": 5.544093178036605e-06,
"loss": 0.0001,
"step": 6500
},
{
"epoch": 0.42,
"eval_avg_sts": 0.8061105071256144,
"eval_sickr_spearman": 0.769672271626573,
"eval_stsb_spearman": 0.8425487426246557,
"step": 6500
},
{
"epoch": 0.42,
"eval_avg_sts": 0.8069978292318387,
"eval_sickr_spearman": 0.770697879735581,
"eval_stsb_spearman": 0.8432977787280964,
"step": 6625
},
{
"epoch": 0.43,
"eval_avg_sts": 0.8080712074218199,
"eval_sickr_spearman": 0.7709677664945618,
"eval_stsb_spearman": 0.8451746483490781,
"step": 6750
},
{
"epoch": 0.44,
"eval_avg_sts": 0.808918715708319,
"eval_sickr_spearman": 0.7720352577240238,
"eval_stsb_spearman": 0.8458021736926141,
"step": 6875
},
{
"epoch": 0.45,
"learning_rate": 5.432100345577883e-06,
"loss": 0.0001,
"step": 7000
},
{
"epoch": 0.45,
"eval_avg_sts": 0.8006026057334057,
"eval_sickr_spearman": 0.7608432425913206,
"eval_stsb_spearman": 0.8403619688754909,
"step": 7000
},
{
"epoch": 0.46,
"eval_avg_sts": 0.8020612965823335,
"eval_sickr_spearman": 0.7626692409746934,
"eval_stsb_spearman": 0.8414533521899736,
"step": 7125
},
{
"epoch": 0.46,
"eval_avg_sts": 0.810499992265102,
"eval_sickr_spearman": 0.7673374317545649,
"eval_stsb_spearman": 0.8536625527756392,
"step": 7250
},
{
"epoch": 0.47,
"eval_avg_sts": 0.8112538171528675,
"eval_sickr_spearman": 0.7687574232374812,
"eval_stsb_spearman": 0.8537502110682538,
"step": 7375
},
{
"epoch": 0.48,
"learning_rate": 5.32010751311916e-06,
"loss": 0.0002,
"step": 7500
},
{
"epoch": 0.48,
"eval_avg_sts": 0.8149817134253148,
"eval_sickr_spearman": 0.7774900538521474,
"eval_stsb_spearman": 0.852473372998482,
"step": 7500
},
{
"epoch": 0.49,
"eval_avg_sts": 0.8174625453813287,
"eval_sickr_spearman": 0.7815984901758593,
"eval_stsb_spearman": 0.8533266005867981,
"step": 7625
},
{
"epoch": 0.5,
"eval_avg_sts": 0.8176977199916579,
"eval_sickr_spearman": 0.782115160734029,
"eval_stsb_spearman": 0.8532802792492867,
"step": 7750
},
{
"epoch": 0.5,
"eval_avg_sts": 0.8178800789250669,
"eval_sickr_spearman": 0.782127648820403,
"eval_stsb_spearman": 0.8536325090297309,
"step": 7875
},
{
"epoch": 0.51,
"learning_rate": 5.2081146806604376e-06,
"loss": 0.0001,
"step": 8000
},
{
"epoch": 0.51,
"eval_avg_sts": 0.8181362028628546,
"eval_sickr_spearman": 0.7824101677590619,
"eval_stsb_spearman": 0.8538622379666473,
"step": 8000
},
{
"epoch": 0.52,
"eval_avg_sts": 0.8182071435777255,
"eval_sickr_spearman": 0.7826502752351511,
"eval_stsb_spearman": 0.8537640119202999,
"step": 8125
},
{
"epoch": 0.53,
"eval_avg_sts": 0.8175148093264073,
"eval_sickr_spearman": 0.7809989179366073,
"eval_stsb_spearman": 0.8540307007162073,
"step": 8250
},
{
"epoch": 0.54,
"eval_avg_sts": 0.817271425771201,
"eval_sickr_spearman": 0.7809910408359715,
"eval_stsb_spearman": 0.8535518107064306,
"step": 8375
},
{
"epoch": 0.54,
"learning_rate": 5.096121848201715e-06,
"loss": 0.0,
"step": 8500
},
{
"epoch": 0.54,
"eval_avg_sts": 0.8169878861543607,
"eval_sickr_spearman": 0.7807656308769224,
"eval_stsb_spearman": 0.8532101414317989,
"step": 8500
},
{
"epoch": 0.55,
"eval_avg_sts": 0.8163714998445242,
"eval_sickr_spearman": 0.7799410809585343,
"eval_stsb_spearman": 0.852801918730514,
"step": 8625
},
{
"epoch": 0.56,
"eval_avg_sts": 0.814914066335918,
"eval_sickr_spearman": 0.7796482833641676,
"eval_stsb_spearman": 0.8501798493076684,
"step": 8750
},
{
"epoch": 0.57,
"eval_avg_sts": 0.8150768291940962,
"eval_sickr_spearman": 0.7799102930225125,
"eval_stsb_spearman": 0.8502433653656799,
"step": 8875
},
{
"epoch": 0.58,
"learning_rate": 4.984129015742992e-06,
"loss": 0.0001,
"step": 9000
},
{
"epoch": 0.58,
"eval_avg_sts": 0.8157444131185677,
"eval_sickr_spearman": 0.7805133715321694,
"eval_stsb_spearman": 0.850975454704966,
"step": 9000
},
{
"epoch": 0.58,
"eval_avg_sts": 0.8194025294491036,
"eval_sickr_spearman": 0.7869190393754633,
"eval_stsb_spearman": 0.851886019522744,
"step": 9125
},
{
"epoch": 0.59,
"eval_avg_sts": 0.6858142517829269,
"eval_sickr_spearman": 0.6164898018315937,
"eval_stsb_spearman": 0.7551387017342599,
"step": 9250
},
{
"epoch": 0.6,
"eval_avg_sts": 0.8177747035338222,
"eval_sickr_spearman": 0.783078280380066,
"eval_stsb_spearman": 0.8524711266875784,
"step": 9375
},
{
"epoch": 0.61,
"learning_rate": 4.872136183284269e-06,
"loss": 0.0015,
"step": 9500
},
{
"epoch": 0.61,
"eval_avg_sts": 0.819985242900733,
"eval_sickr_spearman": 0.7850574019148235,
"eval_stsb_spearman": 0.8549130838866427,
"step": 9500
},
{
"epoch": 0.62,
"eval_avg_sts": 0.820612467391125,
"eval_sickr_spearman": 0.7860280624437863,
"eval_stsb_spearman": 0.8551968723384636,
"step": 9625
},
{
"epoch": 0.62,
"eval_avg_sts": 0.8210179120381628,
"eval_sickr_spearman": 0.7866489124609753,
"eval_stsb_spearman": 0.8553869116153502,
"step": 9750
},
{
"epoch": 0.63,
"eval_avg_sts": 0.821463549997331,
"eval_sickr_spearman": 0.787914243797261,
"eval_stsb_spearman": 0.8550128561974009,
"step": 9875
},
{
"epoch": 0.64,
"learning_rate": 4.760143350825547e-06,
"loss": 0.0002,
"step": 10000
},
{
"epoch": 0.64,
"eval_avg_sts": 0.8220538798411258,
"eval_sickr_spearman": 0.7882646787133534,
"eval_stsb_spearman": 0.8558430809688982,
"step": 10000
},
{
"epoch": 0.65,
"eval_avg_sts": 0.8227053843456922,
"eval_sickr_spearman": 0.7892594508552383,
"eval_stsb_spearman": 0.856151317836146,
"step": 10125
},
{
"epoch": 0.66,
"eval_avg_sts": 0.8211210354889169,
"eval_sickr_spearman": 0.7858874273787755,
"eval_stsb_spearman": 0.8563546435990582,
"step": 10250
},
{
"epoch": 0.66,
"eval_avg_sts": 0.8217109523377687,
"eval_sickr_spearman": 0.7865405062650296,
"eval_stsb_spearman": 0.8568813984105078,
"step": 10375
},
{
"epoch": 0.67,
"learning_rate": 4.648150518366825e-06,
"loss": 0.0002,
"step": 10500
},
{
"epoch": 0.67,
"eval_avg_sts": 0.8231847712907092,
"eval_sickr_spearman": 0.7883226042216879,
"eval_stsb_spearman": 0.8580469383597307,
"step": 10500
},
{
"epoch": 0.68,
"eval_avg_sts": 0.8231833094531285,
"eval_sickr_spearman": 0.7886680439032306,
"eval_stsb_spearman": 0.8576985750030263,
"step": 10625
},
{
"epoch": 0.69,
"eval_avg_sts": 0.8235797750151058,
"eval_sickr_spearman": 0.7894692507063199,
"eval_stsb_spearman": 0.8576902993238917,
"step": 10750
},
{
"epoch": 0.7,
"eval_avg_sts": 0.8239802387430818,
"eval_sickr_spearman": 0.7900059982648908,
"eval_stsb_spearman": 0.8579544792212728,
"step": 10875
},
{
"epoch": 0.7,
"learning_rate": 4.536157685908102e-06,
"loss": 0.0001,
"step": 11000
},
{
"epoch": 0.7,
"eval_avg_sts": 0.8228846723006884,
"eval_sickr_spearman": 0.7878013707088813,
"eval_stsb_spearman": 0.8579679738924955,
"step": 11000
},
{
"epoch": 0.71,
"eval_avg_sts": 0.8233402178257747,
"eval_sickr_spearman": 0.788485765873273,
"eval_stsb_spearman": 0.8581946697782764,
"step": 11125
},
{
"epoch": 0.72,
"eval_avg_sts": 0.8233165033728497,
"eval_sickr_spearman": 0.788493306756199,
"eval_stsb_spearman": 0.8581396999895003,
"step": 11250
},
{
"epoch": 0.73,
"eval_avg_sts": 0.8211286933035429,
"eval_sickr_spearman": 0.787368274267214,
"eval_stsb_spearman": 0.8548891123398719,
"step": 11375
},
{
"epoch": 0.74,
"learning_rate": 4.424164853449379e-06,
"loss": 0.0002,
"step": 11500
},
{
"epoch": 0.74,
"eval_avg_sts": 0.8222354006770852,
"eval_sickr_spearman": 0.7882437371531265,
"eval_stsb_spearman": 0.856227064201044,
"step": 11500
},
{
"epoch": 0.74,
"eval_avg_sts": 0.823058736106017,
"eval_sickr_spearman": 0.7882230837795081,
"eval_stsb_spearman": 0.8578943884325259,
"step": 11625
},
{
"epoch": 0.75,
"eval_avg_sts": 0.8240623262398707,
"eval_sickr_spearman": 0.7903270861780045,
"eval_stsb_spearman": 0.8577975663017371,
"step": 11750
},
{
"epoch": 0.76,
"eval_avg_sts": 0.8193741224170432,
"eval_sickr_spearman": 0.7834559008995725,
"eval_stsb_spearman": 0.8552923439345139,
"step": 11875
},
{
"epoch": 0.77,
"learning_rate": 4.312172020990656e-06,
"loss": 0.0004,
"step": 12000
},
{
"epoch": 0.77,
"eval_avg_sts": 0.8219118427006455,
"eval_sickr_spearman": 0.785794199010884,
"eval_stsb_spearman": 0.8580294863904071,
"step": 12000
},
{
"epoch": 0.78,
"eval_avg_sts": 0.823098023008008,
"eval_sickr_spearman": 0.7879260114171134,
"eval_stsb_spearman": 0.8582700345989028,
"step": 12125
},
{
"epoch": 0.78,
"eval_avg_sts": 0.8227772117211238,
"eval_sickr_spearman": 0.7878058376013152,
"eval_stsb_spearman": 0.8577485858409325,
"step": 12250
},
{
"epoch": 0.79,
"eval_avg_sts": 0.8244800942376741,
"eval_sickr_spearman": 0.7899311658088503,
"eval_stsb_spearman": 0.8590290226664979,
"step": 12375
},
{
"epoch": 0.8,
"learning_rate": 4.2001791885319345e-06,
"loss": 0.0003,
"step": 12500
},
{
"epoch": 0.8,
"eval_avg_sts": 0.8252546537289246,
"eval_sickr_spearman": 0.7905314585146238,
"eval_stsb_spearman": 0.8599778489432254,
"step": 12500
},
{
"epoch": 0.81,
"eval_avg_sts": 0.8242515246774704,
"eval_sickr_spearman": 0.7934860436884877,
"eval_stsb_spearman": 0.855017005666453,
"step": 12625
},
{
"epoch": 0.82,
"eval_avg_sts": 0.8251886392831695,
"eval_sickr_spearman": 0.7935808570827266,
"eval_stsb_spearman": 0.8567964214836123,
"step": 12750
},
{
"epoch": 0.82,
"eval_avg_sts": 0.8255732979417849,
"eval_sickr_spearman": 0.7939037701776952,
"eval_stsb_spearman": 0.8572428257058746,
"step": 12875
},
{
"epoch": 0.83,
"learning_rate": 4.088186356073212e-06,
"loss": 0.0002,
"step": 13000
},
{
"epoch": 0.83,
"eval_avg_sts": 0.8272525514506217,
"eval_sickr_spearman": 0.7954193915835747,
"eval_stsb_spearman": 0.8590857113176686,
"step": 13000
},
{
"epoch": 0.84,
"eval_avg_sts": 0.8276110249953785,
"eval_sickr_spearman": 0.7955957617880555,
"eval_stsb_spearman": 0.8596262882027015,
"step": 13125
},
{
"epoch": 0.85,
"eval_avg_sts": 0.8262806808137206,
"eval_sickr_spearman": 0.792061729406442,
"eval_stsb_spearman": 0.8604996322209992,
"step": 13250
},
{
"epoch": 0.86,
"eval_avg_sts": 0.8270413161061019,
"eval_sickr_spearman": 0.7918599027181991,
"eval_stsb_spearman": 0.8622227294940048,
"step": 13375
},
{
"epoch": 0.86,
"learning_rate": 3.976193523614489e-06,
"loss": 0.0002,
"step": 13500
},
{
"epoch": 0.86,
"eval_avg_sts": 0.8277173388272963,
"eval_sickr_spearman": 0.7929541472711621,
"eval_stsb_spearman": 0.8624805303834304,
"step": 13500
},
{
"epoch": 0.87,
"eval_avg_sts": 0.8280371802211439,
"eval_sickr_spearman": 0.7936189937772684,
"eval_stsb_spearman": 0.8624553666650194,
"step": 13625
},
{
"epoch": 0.88,
"eval_avg_sts": 0.8280087430461096,
"eval_sickr_spearman": 0.7934894538966899,
"eval_stsb_spearman": 0.8625280321955292,
"step": 13750
},
{
"epoch": 0.89,
"eval_avg_sts": 0.8279846750031183,
"eval_sickr_spearman": 0.7941465193643633,
"eval_stsb_spearman": 0.8618228306418733,
"step": 13875
},
{
"epoch": 0.9,
"learning_rate": 3.864200691155766e-06,
"loss": 0.0001,
"step": 14000
},
{
"epoch": 0.9,
"eval_avg_sts": 0.8281003824811937,
"eval_sickr_spearman": 0.7943439752223754,
"eval_stsb_spearman": 0.8618567897400118,
"step": 14000
},
{
"epoch": 0.9,
"eval_avg_sts": 0.8280440185035953,
"eval_sickr_spearman": 0.792904915392188,
"eval_stsb_spearman": 0.8631831216150027,
"step": 14125
},
{
"epoch": 0.91,
"eval_avg_sts": 0.8279193239585301,
"eval_sickr_spearman": 0.7931221120328913,
"eval_stsb_spearman": 0.8627165358841689,
"step": 14250
},
{
"epoch": 0.92,
"eval_avg_sts": 0.8275099017452278,
"eval_sickr_spearman": 0.793065195177687,
"eval_stsb_spearman": 0.8619546083127685,
"step": 14375
},
{
"epoch": 0.93,
"learning_rate": 3.7522078586970435e-06,
"loss": 0.0001,
"step": 14500
},
{
"epoch": 0.93,
"eval_avg_sts": 0.8275982959975564,
"eval_sickr_spearman": 0.7935053521912658,
"eval_stsb_spearman": 0.861691239803847,
"step": 14500
},
{
"epoch": 0.94,
"eval_avg_sts": 0.8276150816017793,
"eval_sickr_spearman": 0.7940267778284781,
"eval_stsb_spearman": 0.8612033853750805,
"step": 14625
},
{
"epoch": 0.94,
"eval_avg_sts": 0.8277678050001869,
"eval_sickr_spearman": 0.7940122244047422,
"eval_stsb_spearman": 0.8615233855956315,
"step": 14750
},
{
"epoch": 0.95,
"eval_avg_sts": 0.827775044421294,
"eval_sickr_spearman": 0.79435247672733,
"eval_stsb_spearman": 0.861197612115258,
"step": 14875
},
{
"epoch": 0.96,
"learning_rate": 3.6402150262383203e-06,
"loss": 0.0002,
"step": 15000
},
{
"epoch": 0.96,
"eval_avg_sts": 0.8265288786526938,
"eval_sickr_spearman": 0.7941830230014563,
"eval_stsb_spearman": 0.8588747343039312,
"step": 15000
},
{
"epoch": 0.97,
"eval_avg_sts": 0.826595528411173,
"eval_sickr_spearman": 0.7947538726420482,
"eval_stsb_spearman": 0.8584371841802979,
"step": 15125
},
{
"epoch": 0.98,
"eval_avg_sts": 0.8271259707838263,
"eval_sickr_spearman": 0.7952840399397222,
"eval_stsb_spearman": 0.8589679016279306,
"step": 15250
},
{
"epoch": 0.98,
"eval_avg_sts": 0.8269049666463504,
"eval_sickr_spearman": 0.7927316191781993,
"eval_stsb_spearman": 0.8610783141145013,
"step": 15375
},
{
"epoch": 0.99,
"learning_rate": 3.5282221937795976e-06,
"loss": 0.0003,
"step": 15500
},
{
"epoch": 0.99,
"eval_avg_sts": 0.82737580758211,
"eval_sickr_spearman": 0.7935406550508229,
"eval_stsb_spearman": 0.8612109601133972,
"step": 15500
},
{
"epoch": 1.0,
"eval_avg_sts": 0.8264028870845463,
"eval_sickr_spearman": 0.7940738673657366,
"eval_stsb_spearman": 0.8587319068033561,
"step": 15625
},
{
"epoch": 1.01,
"eval_avg_sts": 0.8268441102829658,
"eval_sickr_spearman": 0.7937048253555384,
"eval_stsb_spearman": 0.8599833952103932,
"step": 15750
},
{
"epoch": 1.02,
"eval_avg_sts": 0.8275739286019619,
"eval_sickr_spearman": 0.7947639591733503,
"eval_stsb_spearman": 0.8603838980305735,
"step": 15875
},
{
"epoch": 1.02,
"learning_rate": 3.4162293613208757e-06,
"loss": 0.0001,
"step": 16000
},
{
"epoch": 1.02,
"eval_avg_sts": 0.8277768410299685,
"eval_sickr_spearman": 0.7952131460339995,
"eval_stsb_spearman": 0.8603405360259375,
"step": 16000
},
{
"epoch": 1.03,
"eval_avg_sts": 0.8282682698041279,
"eval_sickr_spearman": 0.7963400997670419,
"eval_stsb_spearman": 0.860196439841214,
"step": 16125
},
{
"epoch": 1.04,
"eval_avg_sts": 0.8264618348746703,
"eval_sickr_spearman": 0.7934643816617393,
"eval_stsb_spearman": 0.8594592880876013,
"step": 16250
},
{
"epoch": 1.05,
"eval_avg_sts": 0.8264717428559492,
"eval_sickr_spearman": 0.7932766280862176,
"eval_stsb_spearman": 0.8596668576256806,
"step": 16375
},
{
"epoch": 1.06,
"learning_rate": 3.304236528862153e-06,
"loss": 0.0002,
"step": 16500
},
{
"epoch": 1.06,
"eval_avg_sts": 0.8274883631622513,
"eval_sickr_spearman": 0.7946689056236043,
"eval_stsb_spearman": 0.8603078207008983,
"step": 16500
},
{
"epoch": 1.06,
"eval_avg_sts": 0.8285054599151072,
"eval_sickr_spearman": 0.7953375465867241,
"eval_stsb_spearman": 0.8616733732434904,
"step": 16625
},
{
"epoch": 1.07,
"eval_avg_sts": 0.8267040342845151,
"eval_sickr_spearman": 0.7930167317963359,
"eval_stsb_spearman": 0.8603913367726943,
"step": 16750
},
{
"epoch": 1.08,
"eval_avg_sts": 0.8254063226482575,
"eval_sickr_spearman": 0.7925604363326739,
"eval_stsb_spearman": 0.8582522089638411,
"step": 16875
},
{
"epoch": 1.09,
"learning_rate": 3.19224369640343e-06,
"loss": 0.0003,
"step": 17000
},
{
"epoch": 1.09,
"eval_avg_sts": 0.8263459648804743,
"eval_sickr_spearman": 0.7938006474029073,
"eval_stsb_spearman": 0.8588912823580412,
"step": 17000
},
{
"epoch": 1.1,
"eval_avg_sts": 0.8265585284525776,
"eval_sickr_spearman": 0.7938499273129829,
"eval_stsb_spearman": 0.8592671295921722,
"step": 17125
},
{
"epoch": 1.1,
"eval_avg_sts": 0.8275713806370856,
"eval_sickr_spearman": 0.795413819975808,
"eval_stsb_spearman": 0.8597289412983632,
"step": 17250
},
{
"epoch": 1.11,
"eval_avg_sts": 0.8278030720022054,
"eval_sickr_spearman": 0.7957596439061624,
"eval_stsb_spearman": 0.8598465000982485,
"step": 17375
},
{
"epoch": 1.12,
"learning_rate": 3.0802508639447074e-06,
"loss": 0.0003,
"step": 17500
},
{
"epoch": 1.12,
"eval_avg_sts": 0.828665230451958,
"eval_sickr_spearman": 0.7959547942713053,
"eval_stsb_spearman": 0.8613756666326104,
"step": 17500
},
{
"epoch": 1.13,
"eval_avg_sts": 0.8288773890103436,
"eval_sickr_spearman": 0.7964317911396872,
"eval_stsb_spearman": 0.861322986881,
"step": 17625
},
{
"epoch": 1.14,
"eval_avg_sts": 0.8287921576974288,
"eval_sickr_spearman": 0.7965225699214054,
"eval_stsb_spearman": 0.8610617454734522,
"step": 17750
},
{
"epoch": 1.14,
"eval_avg_sts": 0.8287755856452497,
"eval_sickr_spearman": 0.7967101794036225,
"eval_stsb_spearman": 0.8608409918868768,
"step": 17875
},
{
"epoch": 1.15,
"learning_rate": 2.9682580314859847e-06,
"loss": 0.0001,
"step": 18000
},
{
"epoch": 1.15,
"eval_avg_sts": 0.8292774010789281,
"eval_sickr_spearman": 0.7969440428365246,
"eval_stsb_spearman": 0.8616107593213317,
"step": 18000
},
{
"epoch": 1.16,
"eval_avg_sts": 0.8293137062967321,
"eval_sickr_spearman": 0.7971494238262741,
"eval_stsb_spearman": 0.8614779887671901,
"step": 18125
},
{
"epoch": 1.17,
"eval_avg_sts": 0.8293003591512393,
"eval_sickr_spearman": 0.7972976478053122,
"eval_stsb_spearman": 0.8613030704971664,
"step": 18250
},
{
"epoch": 1.18,
"eval_avg_sts": 0.8269276043107123,
"eval_sickr_spearman": 0.7936150552269506,
"eval_stsb_spearman": 0.8602401533944739,
"step": 18375
},
{
"epoch": 1.18,
"learning_rate": 2.8562651990272623e-06,
"loss": 0.0001,
"step": 18500
},
{
"epoch": 1.18,
"eval_avg_sts": 0.8271598852494388,
"eval_sickr_spearman": 0.7938677468516165,
"eval_stsb_spearman": 0.8604520236472611,
"step": 18500
},
{
"epoch": 1.19,
"eval_avg_sts": 0.8273011691673453,
"eval_sickr_spearman": 0.7941100157272702,
"eval_stsb_spearman": 0.8604923226074204,
"step": 18625
},
{
"epoch": 1.2,
"eval_avg_sts": 0.8274659412451935,
"eval_sickr_spearman": 0.7943473373994759,
"eval_stsb_spearman": 0.860584545090911,
"step": 18750
},
{
"epoch": 1.21,
"eval_avg_sts": 0.8273871753451842,
"eval_sickr_spearman": 0.7941770191137765,
"eval_stsb_spearman": 0.8605973315765919,
"step": 18875
},
{
"epoch": 1.22,
"learning_rate": 2.7442723665685396e-06,
"loss": 0.0002,
"step": 19000
},
{
"epoch": 1.22,
"eval_avg_sts": 0.8268924907436139,
"eval_sickr_spearman": 0.7941484406084208,
"eval_stsb_spearman": 0.859636540878807,
"step": 19000
},
{
"epoch": 1.22,
"eval_avg_sts": 0.8258034139625235,
"eval_sickr_spearman": 0.7932116900370734,
"eval_stsb_spearman": 0.8583951378879737,
"step": 19125
},
{
"epoch": 1.23,
"eval_avg_sts": 0.8252544789859086,
"eval_sickr_spearman": 0.7925500616147634,
"eval_stsb_spearman": 0.857958896357054,
"step": 19250
},
{
"epoch": 1.24,
"eval_avg_sts": 0.8253536873185088,
"eval_sickr_spearman": 0.7926197067118486,
"eval_stsb_spearman": 0.858087667925169,
"step": 19375
},
{
"epoch": 1.25,
"learning_rate": 2.632279534109817e-06,
"loss": 0.0002,
"step": 19500
},
{
"epoch": 1.25,
"eval_avg_sts": 0.8259692031147807,
"eval_sickr_spearman": 0.7942922457261266,
"eval_stsb_spearman": 0.8576461605034348,
"step": 19500
},
{
"epoch": 1.26,
"eval_avg_sts": 0.8262977896726795,
"eval_sickr_spearman": 0.7945857637870148,
"eval_stsb_spearman": 0.8580098155583442,
"step": 19625
},
{
"epoch": 1.26,
"eval_avg_sts": 0.8265435124446001,
"eval_sickr_spearman": 0.7949808676274447,
"eval_stsb_spearman": 0.8581061572617555,
"step": 19750
},
{
"epoch": 1.27,
"eval_avg_sts": 0.82660901551375,
"eval_sickr_spearman": 0.795241820601558,
"eval_stsb_spearman": 0.8579762104259421,
"step": 19875
},
{
"epoch": 1.28,
"learning_rate": 2.5202867016510945e-06,
"loss": 0.0001,
"step": 20000
},
{
"epoch": 1.28,
"eval_avg_sts": 0.8249759667991925,
"eval_sickr_spearman": 0.7929103429066506,
"eval_stsb_spearman": 0.8570415906917342,
"step": 20000
},
{
"epoch": 1.29,
"eval_avg_sts": 0.8252695158247048,
"eval_sickr_spearman": 0.7941818702550217,
"eval_stsb_spearman": 0.8563571613943879,
"step": 20125
},
{
"epoch": 1.3,
"eval_avg_sts": 0.8254168575586551,
"eval_sickr_spearman": 0.794336146152841,
"eval_stsb_spearman": 0.8564975689644694,
"step": 20250
},
{
"epoch": 1.3,
"eval_avg_sts": 0.8259865535716795,
"eval_sickr_spearman": 0.7950048831781639,
"eval_stsb_spearman": 0.8569682239651952,
"step": 20375
},
{
"epoch": 1.31,
"learning_rate": 2.4082938691923718e-06,
"loss": 0.0001,
"step": 20500
},
{
"epoch": 1.31,
"eval_avg_sts": 0.826209318888689,
"eval_sickr_spearman": 0.7952033957204077,
"eval_stsb_spearman": 0.8572152420569702,
"step": 20500
},
{
"epoch": 1.32,
"eval_avg_sts": 0.8259891403986184,
"eval_sickr_spearman": 0.7948762078574111,
"eval_stsb_spearman": 0.8571020729398255,
"step": 20625
},
{
"epoch": 1.33,
"eval_avg_sts": 0.8259890083537097,
"eval_sickr_spearman": 0.7947911447767642,
"eval_stsb_spearman": 0.8571868719306552,
"step": 20750
},
{
"epoch": 1.34,
"eval_avg_sts": 0.8261152907691348,
"eval_sickr_spearman": 0.7949135280232285,
"eval_stsb_spearman": 0.8573170535150412,
"step": 20875
},
{
"epoch": 1.34,
"learning_rate": 2.296301036733649e-06,
"loss": 0.0001,
"step": 21000
},
{
"epoch": 1.34,
"eval_avg_sts": 0.826274962054796,
"eval_sickr_spearman": 0.7950501284757184,
"eval_stsb_spearman": 0.8574997956338737,
"step": 21000
},
{
"epoch": 1.35,
"eval_avg_sts": 0.8260486313726075,
"eval_sickr_spearman": 0.794899647034913,
"eval_stsb_spearman": 0.8571976157103021,
"step": 21125
},
{
"epoch": 1.36,
"eval_avg_sts": 0.825587114078729,
"eval_sickr_spearman": 0.7946725559873136,
"eval_stsb_spearman": 0.8565016721701444,
"step": 21250
},
{
"epoch": 1.37,
"eval_avg_sts": 0.8256303672089018,
"eval_sickr_spearman": 0.7944853787850091,
"eval_stsb_spearman": 0.8567753556327944,
"step": 21375
},
{
"epoch": 1.38,
"learning_rate": 2.1843082042749267e-06,
"loss": 0.0002,
"step": 21500
},
{
"epoch": 1.38,
"eval_avg_sts": 0.8254654257169443,
"eval_sickr_spearman": 0.7936856129149631,
"eval_stsb_spearman": 0.8572452385189255,
"step": 21500
},
{
"epoch": 1.38,
"eval_avg_sts": 0.8257646791990041,
"eval_sickr_spearman": 0.7941317738162218,
"eval_stsb_spearman": 0.8573975845817864,
"step": 21625
},
{
"epoch": 1.39,
"eval_avg_sts": 0.8263390736725806,
"eval_sickr_spearman": 0.7947459955414125,
"eval_stsb_spearman": 0.8579321518037489,
"step": 21750
},
{
"epoch": 1.4,
"eval_avg_sts": 0.825957826826842,
"eval_sickr_spearman": 0.7945194808670303,
"eval_stsb_spearman": 0.8573961727866538,
"step": 21875
},
{
"epoch": 1.41,
"learning_rate": 2.072315371816204e-06,
"loss": 0.0001,
"step": 22000
},
{
"epoch": 1.41,
"eval_avg_sts": 0.8257198535359889,
"eval_sickr_spearman": 0.7936219236744562,
"eval_stsb_spearman": 0.8578177833975217,
"step": 22000
},
{
"epoch": 1.42,
"eval_avg_sts": 0.8270054813778303,
"eval_sickr_spearman": 0.7958380306637094,
"eval_stsb_spearman": 0.858172932091951,
"step": 22125
},
{
"epoch": 1.42,
"eval_avg_sts": 0.8270091578481822,
"eval_sickr_spearman": 0.7962583028012928,
"eval_stsb_spearman": 0.8577600128950715,
"step": 22250
},
{
"epoch": 1.43,
"eval_avg_sts": 0.8259725703398417,
"eval_sickr_spearman": 0.7959245346773993,
"eval_stsb_spearman": 0.8560206060022842,
"step": 22375
},
{
"epoch": 1.44,
"learning_rate": 1.9603225393574807e-06,
"loss": 0.0002,
"step": 22500
},
{
"epoch": 1.44,
"eval_avg_sts": 0.8254714237214871,
"eval_sickr_spearman": 0.7955676635937141,
"eval_stsb_spearman": 0.8553751838492601,
"step": 22500
},
{
"epoch": 1.45,
"eval_avg_sts": 0.8243312613565763,
"eval_sickr_spearman": 0.7926490056837258,
"eval_stsb_spearman": 0.8560135170294269,
"step": 22625
},
{
"epoch": 1.46,
"eval_avg_sts": 0.8244931271533935,
"eval_sickr_spearman": 0.7931114971594734,
"eval_stsb_spearman": 0.8558747571473136,
"step": 22750
},
{
"epoch": 1.46,
"eval_avg_sts": 0.8245178381258861,
"eval_sickr_spearman": 0.7931850518122927,
"eval_stsb_spearman": 0.8558506244394795,
"step": 22875
},
{
"epoch": 1.47,
"learning_rate": 1.8483297068987584e-06,
"loss": 0.0002,
"step": 23000
},
{
"epoch": 1.47,
"eval_avg_sts": 0.8250123369922542,
"eval_sickr_spearman": 0.7931228324994128,
"eval_stsb_spearman": 0.8569018414850956,
"step": 23000
},
{
"epoch": 1.48,
"eval_avg_sts": 0.8254867372327745,
"eval_sickr_spearman": 0.7938168819151935,
"eval_stsb_spearman": 0.8571565925503556,
"step": 23125
},
{
"epoch": 1.49,
"eval_avg_sts": 0.8256499116596692,
"eval_sickr_spearman": 0.7939716381240272,
"eval_stsb_spearman": 0.8573281851953113,
"step": 23250
},
{
"epoch": 1.5,
"eval_avg_sts": 0.8258346679802114,
"eval_sickr_spearman": 0.7940527146232547,
"eval_stsb_spearman": 0.8576166213371682,
"step": 23375
},
{
"epoch": 1.5,
"learning_rate": 1.7363368744400357e-06,
"loss": 0.0001,
"step": 23500
},
{
"epoch": 1.5,
"eval_avg_sts": 0.825945269207895,
"eval_sickr_spearman": 0.7943781253354978,
"eval_stsb_spearman": 0.8575124130802922,
"step": 23500
},
{
"epoch": 1.51,
"eval_avg_sts": 0.8258713568091718,
"eval_sickr_spearman": 0.794315540810324,
"eval_stsb_spearman": 0.8574271728080196,
"step": 23625
},
{
"epoch": 1.52,
"eval_avg_sts": 0.8258355435328646,
"eval_sickr_spearman": 0.7940151062708286,
"eval_stsb_spearman": 0.8576559807949005,
"step": 23750
},
{
"epoch": 1.53,
"eval_avg_sts": 0.8257865803230886,
"eval_sickr_spearman": 0.7940416194388225,
"eval_stsb_spearman": 0.8575315412073548,
"step": 23875
},
{
"epoch": 1.54,
"learning_rate": 1.6243440419813131e-06,
"loss": 0.0002,
"step": 24000
},
{
"epoch": 1.54,
"eval_avg_sts": 0.8258057571249391,
"eval_sickr_spearman": 0.7941539161539849,
"eval_stsb_spearman": 0.8574575980958933,
"step": 24000
},
{
"epoch": 1.54,
"eval_avg_sts": 0.8258599414659757,
"eval_sickr_spearman": 0.7942335517201692,
"eval_stsb_spearman": 0.8574863312117823,
"step": 24125
},
{
"epoch": 1.55,
"eval_avg_sts": 0.8259837419138151,
"eval_sickr_spearman": 0.7943245706573944,
"eval_stsb_spearman": 0.8576429131702358,
"step": 24250
},
{
"epoch": 1.56,
"eval_avg_sts": 0.8273046944370666,
"eval_sickr_spearman": 0.7953777005875265,
"eval_stsb_spearman": 0.8592316882866066,
"step": 24375
},
{
"epoch": 1.57,
"learning_rate": 1.5123512095225906e-06,
"loss": 0.0001,
"step": 24500
},
{
"epoch": 1.57,
"eval_avg_sts": 0.8270336322444836,
"eval_sickr_spearman": 0.7948833644915253,
"eval_stsb_spearman": 0.8591838999974419,
"step": 24500
},
{
"epoch": 1.58,
"eval_avg_sts": 0.8268251999183458,
"eval_sickr_spearman": 0.7944777418398805,
"eval_stsb_spearman": 0.8591726579968111,
"step": 24625
},
{
"epoch": 1.58,
"eval_avg_sts": 0.8267020534374147,
"eval_sickr_spearman": 0.7943936393812624,
"eval_stsb_spearman": 0.8590104674935669,
"step": 24750
},
{
"epoch": 1.59,
"eval_avg_sts": 0.825917107993902,
"eval_sickr_spearman": 0.7938579965380246,
"eval_stsb_spearman": 0.8579762194497796,
"step": 24875
},
{
"epoch": 1.6,
"learning_rate": 1.4003583770638678e-06,
"loss": 0.0002,
"step": 25000
},
{
"epoch": 1.6,
"eval_avg_sts": 0.8263527703022291,
"eval_sickr_spearman": 0.7941290360434399,
"eval_stsb_spearman": 0.8585765045610182,
"step": 25000
},
{
"epoch": 1.61,
"eval_avg_sts": 0.8269584920385149,
"eval_sickr_spearman": 0.7941601601971716,
"eval_stsb_spearman": 0.8597568238798581,
"step": 25125
},
{
"epoch": 1.62,
"eval_avg_sts": 0.8264998215853827,
"eval_sickr_spearman": 0.7927663936956405,
"eval_stsb_spearman": 0.8602332494751249,
"step": 25250
},
{
"epoch": 1.62,
"eval_avg_sts": 0.825942745088348,
"eval_sickr_spearman": 0.7922521246925426,
"eval_stsb_spearman": 0.8596333654841534,
"step": 25375
},
{
"epoch": 1.63,
"learning_rate": 1.2883655446051453e-06,
"loss": 0.0001,
"step": 25500
},
{
"epoch": 1.63,
"eval_avg_sts": 0.8259010696773026,
"eval_sickr_spearman": 0.7922646127789166,
"eval_stsb_spearman": 0.8595375265756887,
"step": 25500
},
{
"epoch": 1.64,
"eval_avg_sts": 0.8259285307896478,
"eval_sickr_spearman": 0.7926812825838921,
"eval_stsb_spearman": 0.8591757789954035,
"step": 25625
},
{
"epoch": 1.65,
"eval_avg_sts": 0.8258391793675839,
"eval_sickr_spearman": 0.7926954517588166,
"eval_stsb_spearman": 0.858982906976351,
"step": 25750
},
{
"epoch": 1.66,
"eval_avg_sts": 0.8258409312899861,
"eval_sickr_spearman": 0.7928338293620596,
"eval_stsb_spearman": 0.8588480332179126,
"step": 25875
},
{
"epoch": 1.66,
"learning_rate": 1.1763727121464225e-06,
"loss": 0.0001,
"step": 26000
},
{
"epoch": 1.66,
"eval_avg_sts": 0.8251984305884675,
"eval_sickr_spearman": 0.7933060231202977,
"eval_stsb_spearman": 0.8570908380566373,
"step": 26000
},
{
"epoch": 1.67,
"eval_avg_sts": 0.8253196217152283,
"eval_sickr_spearman": 0.7932125065657978,
"eval_stsb_spearman": 0.8574267368646588,
"step": 26125
},
{
"epoch": 1.68,
"eval_avg_sts": 0.8253745698430313,
"eval_sickr_spearman": 0.7933913263564519,
"eval_stsb_spearman": 0.8573578133296105,
"step": 26250
},
{
"epoch": 1.69,
"eval_avg_sts": 0.825411316540875,
"eval_sickr_spearman": 0.7934114513879544,
"eval_stsb_spearman": 0.8574111816937955,
"step": 26375
},
{
"epoch": 1.7,
"learning_rate": 1.0643798796877e-06,
"loss": 0.0001,
"step": 26500
},
{
"epoch": 1.7,
"eval_avg_sts": 0.8249370852399975,
"eval_sickr_spearman": 0.7937128945805799,
"eval_stsb_spearman": 0.8561612758994152,
"step": 26500
},
{
"epoch": 1.7,
"eval_avg_sts": 0.825459765367129,
"eval_sickr_spearman": 0.7933420944774778,
"eval_stsb_spearman": 0.8575774362567802,
"step": 26625
},
{
"epoch": 1.71,
"eval_avg_sts": 0.826427995376563,
"eval_sickr_spearman": 0.7947685701590883,
"eval_stsb_spearman": 0.8580874205940376,
"step": 26750
},
{
"epoch": 1.72,
"eval_avg_sts": 0.8258856380174763,
"eval_sickr_spearman": 0.7942930142237495,
"eval_stsb_spearman": 0.857478261811203,
"step": 26875
},
{
"epoch": 1.73,
"learning_rate": 9.523870472289774e-07,
"loss": 0.0002,
"step": 27000
},
{
"epoch": 1.73,
"eval_avg_sts": 0.8258593024414255,
"eval_sickr_spearman": 0.7941693821686479,
"eval_stsb_spearman": 0.8575492227142031,
"step": 27000
},
{
"epoch": 1.74,
"eval_avg_sts": 0.8258720619743833,
"eval_sickr_spearman": 0.7941788923267327,
"eval_stsb_spearman": 0.857565231622034,
"step": 27125
},
{
"epoch": 1.74,
"eval_avg_sts": 0.8259531389747516,
"eval_sickr_spearman": 0.7941532917496662,
"eval_stsb_spearman": 0.8577529861998372,
"step": 27250
},
{
"epoch": 1.75,
"eval_avg_sts": 0.825969657799255,
"eval_sickr_spearman": 0.7942109771024933,
"eval_stsb_spearman": 0.8577283384960166,
"step": 27375
},
{
"epoch": 1.76,
"learning_rate": 8.403942147702547e-07,
"loss": 0.0002,
"step": 27500
},
{
"epoch": 1.76,
"eval_avg_sts": 0.8259987251545413,
"eval_sickr_spearman": 0.7943161171835413,
"eval_stsb_spearman": 0.8576813331255413,
"step": 27500
},
{
"epoch": 1.77,
"eval_avg_sts": 0.8252131722274082,
"eval_sickr_spearman": 0.793231382788663,
"eval_stsb_spearman": 0.8571949616661534,
"step": 27625
},
{
"epoch": 1.78,
"eval_avg_sts": 0.8252604604270115,
"eval_sickr_spearman": 0.7933024207876899,
"eval_stsb_spearman": 0.857218500066333,
"step": 27750
},
{
"epoch": 1.78,
"eval_avg_sts": 0.8251969961170478,
"eval_sickr_spearman": 0.793198385421975,
"eval_stsb_spearman": 0.8571956068121205,
"step": 27875
},
{
"epoch": 1.79,
"learning_rate": 7.284013823115321e-07,
"loss": 0.0002,
"step": 28000
},
{
"epoch": 1.79,
"eval_avg_sts": 0.825311717070901,
"eval_sickr_spearman": 0.7931744179023573,
"eval_stsb_spearman": 0.8574490162394447,
"step": 28000
},
{
"epoch": 1.8,
"eval_avg_sts": 0.8256482381761492,
"eval_sickr_spearman": 0.7934648139416521,
"eval_stsb_spearman": 0.8578316624106462,
"step": 28125
},
{
"epoch": 1.81,
"eval_avg_sts": 0.8261129479959839,
"eval_sickr_spearman": 0.7939418588411357,
"eval_stsb_spearman": 0.858284037150832,
"step": 28250
},
{
"epoch": 1.82,
"eval_avg_sts": 0.8262712326490254,
"eval_sickr_spearman": 0.7933230261302068,
"eval_stsb_spearman": 0.8592194391678438,
"step": 28375
},
{
"epoch": 1.82,
"learning_rate": 6.164085498528094e-07,
"loss": 0.0002,
"step": 28500
},
{
"epoch": 1.82,
"eval_avg_sts": 0.8262943695062834,
"eval_sickr_spearman": 0.7934199048618075,
"eval_stsb_spearman": 0.8591688341507593,
"step": 28500
},
{
"epoch": 1.83,
"eval_avg_sts": 0.8260598340905722,
"eval_sickr_spearman": 0.7933951208134654,
"eval_stsb_spearman": 0.8587245473676789,
"step": 28625
},
{
"epoch": 1.84,
"eval_avg_sts": 0.8259360112469695,
"eval_sickr_spearman": 0.7933420944774778,
"eval_stsb_spearman": 0.8585299280164611,
"step": 28750
},
{
"epoch": 1.85,
"eval_avg_sts": 0.8258330858999741,
"eval_sickr_spearman": 0.7933054467470805,
"eval_stsb_spearman": 0.8583607250528676,
"step": 28875
},
{
"epoch": 1.86,
"learning_rate": 5.044157173940868e-07,
"loss": 0.0001,
"step": 29000
},
{
"epoch": 1.86,
"eval_avg_sts": 0.8258376969438936,
"eval_sickr_spearman": 0.7933141884075422,
"eval_stsb_spearman": 0.8583612054802452,
"step": 29000
},
{
"epoch": 1.86,
"eval_avg_sts": 0.8259136180644091,
"eval_sickr_spearman": 0.7933194718287004,
"eval_stsb_spearman": 0.8585077643001178,
"step": 29125
},
{
"epoch": 1.87,
"eval_avg_sts": 0.825910175107258,
"eval_sickr_spearman": 0.7933039097518345,
"eval_stsb_spearman": 0.8585164404626813,
"step": 29250
},
{
"epoch": 1.88,
"eval_avg_sts": 0.8258308833879402,
"eval_sickr_spearman": 0.7933173584602371,
"eval_stsb_spearman": 0.8583444083156432,
"step": 29375
},
{
"epoch": 1.89,
"learning_rate": 3.9242288493536413e-07,
"loss": 0.0001,
"step": 29500
},
{
"epoch": 1.89,
"eval_avg_sts": 0.8257221328599513,
"eval_sickr_spearman": 0.7931374819853514,
"eval_stsb_spearman": 0.8583067837345514,
"step": 29500
},
{
"epoch": 1.9,
"eval_avg_sts": 0.825786763719202,
"eval_sickr_spearman": 0.7932694234210019,
"eval_stsb_spearman": 0.858304104017402,
"step": 29625
},
{
"epoch": 1.9,
"eval_avg_sts": 0.8257681951340192,
"eval_sickr_spearman": 0.7932804705743327,
"eval_stsb_spearman": 0.8582559196937056,
"step": 29750
},
{
"epoch": 1.91,
"eval_avg_sts": 0.8258082608558808,
"eval_sickr_spearman": 0.7933519408532725,
"eval_stsb_spearman": 0.8582645808584891,
"step": 29875
},
{
"epoch": 1.92,
"learning_rate": 2.804300524766415e-07,
"loss": 0.0001,
"step": 30000
},
{
"epoch": 1.92,
"eval_avg_sts": 0.8258262861889483,
"eval_sickr_spearman": 0.7933999719547107,
"eval_stsb_spearman": 0.8582526004231857,
"step": 30000
},
{
"epoch": 1.93,
"eval_avg_sts": 0.8256086631585,
"eval_sickr_spearman": 0.7930556369885008,
"eval_stsb_spearman": 0.8581616893284993,
"step": 30125
},
{
"epoch": 1.94,
"eval_avg_sts": 0.8256480515518101,
"eval_sickr_spearman": 0.7931325828130048,
"eval_stsb_spearman": 0.8581635202906153,
"step": 30250
},
{
"epoch": 1.94,
"eval_avg_sts": 0.8258219208455879,
"eval_sickr_spearman": 0.7934267252782117,
"eval_stsb_spearman": 0.8582171164129642,
"step": 30375
},
{
"epoch": 1.95,
"learning_rate": 1.6843722001791884e-07,
"loss": 0.0002,
"step": 30500
},
{
"epoch": 1.95,
"eval_avg_sts": 0.8258322719939588,
"eval_sickr_spearman": 0.7934731233222009,
"eval_stsb_spearman": 0.8581914206657169,
"step": 30500
},
{
"epoch": 1.96,
"eval_avg_sts": 0.8258242424865203,
"eval_sickr_spearman": 0.7934302315486167,
"eval_stsb_spearman": 0.858218253424424,
"step": 30625
},
{
"epoch": 1.97,
"eval_avg_sts": 0.8258248316168127,
"eval_sickr_spearman": 0.7934435841948165,
"eval_stsb_spearman": 0.858206079038809,
"step": 30750
},
{
"epoch": 1.98,
"eval_avg_sts": 0.8257922895919085,
"eval_sickr_spearman": 0.7933790303944838,
"eval_stsb_spearman": 0.8582055487893332,
"step": 30875
},
{
"epoch": 1.98,
"learning_rate": 5.64443875591962e-08,
"loss": 0.0001,
"step": 31000
},
{
"epoch": 1.98,
"eval_avg_sts": 0.8257897415072173,
"eval_sickr_spearman": 0.7933720178536738,
"eval_stsb_spearman": 0.8582074651607609,
"step": 31000
},
{
"epoch": 1.99,
"eval_avg_sts": 0.8257977713308224,
"eval_sickr_spearman": 0.7933829209137002,
"eval_stsb_spearman": 0.8582126217479447,
"step": 31125
},
{
"epoch": 2.0,
"eval_avg_sts": 0.8258126560134551,
"eval_sickr_spearman": 0.7934017010743625,
"eval_stsb_spearman": 0.8582236109525477,
"step": 31250
},
{
"epoch": 2.0,
"step": 31252,
"train_runtime": 21163.9877,
"train_samples_per_second": 1.477
}
],
"max_steps": 31252,
"num_train_epochs": 2,
"total_flos": 776159526314354880,
"trial_name": null,
"trial_params": null
}