{ "best_metric": 0.8631831216150027, "best_model_checkpoint": "result/InfoCSE-bert-large", "epoch": 2.0, "global_step": 31252, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.01, "eval_avg_sts": 0.6667446229182062, "eval_sickr_spearman": 0.6627723790529534, "eval_stsb_spearman": 0.6707168667834591, "step": 125 }, { "epoch": 0.02, "eval_avg_sts": 0.7051305088963267, "eval_sickr_spearman": 0.6969365172570714, "eval_stsb_spearman": 0.713324500535582, "step": 250 }, { "epoch": 0.02, "eval_avg_sts": 0.725875395370044, "eval_sickr_spearman": 0.716654533206054, "eval_stsb_spearman": 0.735096257534034, "step": 375 }, { "epoch": 0.03, "learning_rate": 6.888007167541277e-06, "loss": 0.001, "step": 500 }, { "epoch": 0.03, "eval_avg_sts": 0.7357340574594278, "eval_sickr_spearman": 0.7235103965631273, "eval_stsb_spearman": 0.7479577183557282, "step": 500 }, { "epoch": 0.04, "eval_avg_sts": 0.7464037729944727, "eval_sickr_spearman": 0.7301059313504061, "eval_stsb_spearman": 0.7627016146385392, "step": 625 }, { "epoch": 0.05, "eval_avg_sts": 0.7591284137806686, "eval_sickr_spearman": 0.7344878567657066, "eval_stsb_spearman": 0.7837689707956308, "step": 750 }, { "epoch": 0.06, "eval_avg_sts": 0.7608889169495914, "eval_sickr_spearman": 0.7373875423906269, "eval_stsb_spearman": 0.7843902915085559, "step": 875 }, { "epoch": 0.06, "learning_rate": 6.776014335082554e-06, "loss": 0.0002, "step": 1000 }, { "epoch": 0.06, "eval_avg_sts": 0.7633437897321462, "eval_sickr_spearman": 0.7394359247736582, "eval_stsb_spearman": 0.7872516546906342, "step": 1000 }, { "epoch": 0.07, "eval_avg_sts": 0.7689886003242912, "eval_sickr_spearman": 0.7459672900094155, "eval_stsb_spearman": 0.7920099106391669, "step": 1125 }, { "epoch": 0.08, "eval_avg_sts": 0.7695141299706598, "eval_sickr_spearman": 0.749662274611948, "eval_stsb_spearman": 0.7893659853293715, "step": 1250 }, { "epoch": 0.09, "eval_avg_sts": 0.771575990947651, "eval_sickr_spearman": 0.7507335602984238, "eval_stsb_spearman": 0.7924184215968783, "step": 1375 }, { "epoch": 0.1, "learning_rate": 6.6640215026238325e-06, "loss": 0.0003, "step": 1500 }, { "epoch": 0.1, "eval_avg_sts": 0.7721249223821594, "eval_sickr_spearman": 0.7508546947362507, "eval_stsb_spearman": 0.7933951500280679, "step": 1500 }, { "epoch": 0.1, "eval_avg_sts": 0.7736414601237904, "eval_sickr_spearman": 0.7518223773369244, "eval_stsb_spearman": 0.7954605429106565, "step": 1625 }, { "epoch": 0.11, "eval_avg_sts": 0.7750895970401648, "eval_sickr_spearman": 0.7527568224154028, "eval_stsb_spearman": 0.7974223716649267, "step": 1750 }, { "epoch": 0.12, "eval_avg_sts": 0.7776564224610277, "eval_sickr_spearman": 0.7542352378193863, "eval_stsb_spearman": 0.8010776071026692, "step": 1875 }, { "epoch": 0.13, "learning_rate": 6.55202867016511e-06, "loss": 0.0001, "step": 2000 }, { "epoch": 0.13, "eval_avg_sts": 0.7785919822208553, "eval_sickr_spearman": 0.7546353668237488, "eval_stsb_spearman": 0.802548597617962, "step": 2000 }, { "epoch": 0.14, "eval_avg_sts": 0.7804785012417673, "eval_sickr_spearman": 0.7560601133857076, "eval_stsb_spearman": 0.8048968890978271, "step": 2125 }, { "epoch": 0.14, "eval_avg_sts": 0.7791958793390172, "eval_sickr_spearman": 0.7571627153503209, "eval_stsb_spearman": 0.8012290433277136, "step": 2250 }, { "epoch": 0.15, "eval_avg_sts": 0.7808643358009081, "eval_sickr_spearman": 0.757428807652288, "eval_stsb_spearman": 0.8042998639495281, "step": 2375 }, { "epoch": 0.16, "learning_rate": 6.440035837706387e-06, "loss": 0.0005, "step": 2500 }, { "epoch": 0.16, "eval_avg_sts": 0.7997499220712412, "eval_sickr_spearman": 0.7682156324132593, "eval_stsb_spearman": 0.8312842117292232, "step": 2500 }, { "epoch": 0.17, "eval_avg_sts": 0.8000945443564438, "eval_sickr_spearman": 0.769006603032424, "eval_stsb_spearman": 0.8311824856804637, "step": 2625 }, { "epoch": 0.18, "eval_avg_sts": 0.8015655863550484, "eval_sickr_spearman": 0.7697635307193054, "eval_stsb_spearman": 0.8333676419907914, "step": 2750 }, { "epoch": 0.18, "eval_avg_sts": 0.8020135971999303, "eval_sickr_spearman": 0.7738109675441908, "eval_stsb_spearman": 0.8302162268556699, "step": 2875 }, { "epoch": 0.19, "learning_rate": 6.328043005247664e-06, "loss": 0.0001, "step": 3000 }, { "epoch": 0.19, "eval_avg_sts": 0.8021055052889553, "eval_sickr_spearman": 0.7723527913356312, "eval_stsb_spearman": 0.8318582192422794, "step": 3000 }, { "epoch": 0.2, "eval_avg_sts": 0.8034828561746414, "eval_sickr_spearman": 0.7730187425570707, "eval_stsb_spearman": 0.8339469697922121, "step": 3125 }, { "epoch": 0.21, "eval_avg_sts": 0.809294388946485, "eval_sickr_spearman": 0.7739637544778655, "eval_stsb_spearman": 0.8446250234151045, "step": 3250 }, { "epoch": 0.22, "eval_avg_sts": 0.8095468267478854, "eval_sickr_spearman": 0.7742509804644655, "eval_stsb_spearman": 0.8448426730313053, "step": 3375 }, { "epoch": 0.22, "learning_rate": 6.2160501727889415e-06, "loss": 0.0001, "step": 3500 }, { "epoch": 0.22, "eval_avg_sts": 0.8075109934505635, "eval_sickr_spearman": 0.7709388998025974, "eval_stsb_spearman": 0.8440830870985296, "step": 3500 }, { "epoch": 0.23, "eval_avg_sts": 0.8072613664062491, "eval_sickr_spearman": 0.7727868483993274, "eval_stsb_spearman": 0.8417358844131708, "step": 3625 }, { "epoch": 0.24, "eval_avg_sts": 0.8035650181540979, "eval_sickr_spearman": 0.7687000741023642, "eval_stsb_spearman": 0.8384299622058315, "step": 3750 }, { "epoch": 0.25, "eval_avg_sts": 0.8060855472554131, "eval_sickr_spearman": 0.7709744428176617, "eval_stsb_spearman": 0.8411966516931645, "step": 3875 }, { "epoch": 0.26, "learning_rate": 6.104057340330219e-06, "loss": 0.0004, "step": 4000 }, { "epoch": 0.26, "eval_avg_sts": 0.803351813599069, "eval_sickr_spearman": 0.7677387500328843, "eval_stsb_spearman": 0.8389648771652538, "step": 4000 }, { "epoch": 0.26, "eval_avg_sts": 0.802660483963512, "eval_sickr_spearman": 0.7673760487601211, "eval_stsb_spearman": 0.8379449191669028, "step": 4125 }, { "epoch": 0.27, "eval_avg_sts": 0.8047314511229144, "eval_sickr_spearman": 0.7691939779184522, "eval_stsb_spearman": 0.8402689243273768, "step": 4250 }, { "epoch": 0.28, "eval_avg_sts": 0.8040567267552472, "eval_sickr_spearman": 0.7695367278583146, "eval_stsb_spearman": 0.8385767256521798, "step": 4375 }, { "epoch": 0.29, "learning_rate": 5.992064507871497e-06, "loss": 0.0003, "step": 4500 }, { "epoch": 0.29, "eval_avg_sts": 0.8031439674900422, "eval_sickr_spearman": 0.7708419250087939, "eval_stsb_spearman": 0.8354460099712906, "step": 4500 }, { "epoch": 0.3, "eval_avg_sts": 0.8016452961027151, "eval_sickr_spearman": 0.76836294380137, "eval_stsb_spearman": 0.8349276484040601, "step": 4625 }, { "epoch": 0.3, "eval_avg_sts": 0.8036856358976682, "eval_sickr_spearman": 0.7702216513648221, "eval_stsb_spearman": 0.8371496204305142, "step": 4750 }, { "epoch": 0.31, "eval_avg_sts": 0.8061976413597232, "eval_sickr_spearman": 0.7719798778640656, "eval_stsb_spearman": 0.8404154048553806, "step": 4875 }, { "epoch": 0.32, "learning_rate": 5.880071675412773e-06, "loss": 0.0001, "step": 5000 }, { "epoch": 0.32, "eval_avg_sts": 0.8067273899585344, "eval_sickr_spearman": 0.7723029350523384, "eval_stsb_spearman": 0.8411518448647305, "step": 5000 }, { "epoch": 0.33, "eval_avg_sts": 0.8078358230567408, "eval_sickr_spearman": 0.7726999601368258, "eval_stsb_spearman": 0.8429716859766557, "step": 5125 }, { "epoch": 0.34, "eval_avg_sts": 0.802548441043093, "eval_sickr_spearman": 0.7676195664444124, "eval_stsb_spearman": 0.8374773156417734, "step": 5250 }, { "epoch": 0.34, "eval_avg_sts": 0.800628830120568, "eval_sickr_spearman": 0.7634932625509655, "eval_stsb_spearman": 0.8377643976901704, "step": 5375 }, { "epoch": 0.35, "learning_rate": 5.7680788429540505e-06, "loss": 0.0002, "step": 5500 }, { "epoch": 0.35, "eval_avg_sts": 0.8020238168463023, "eval_sickr_spearman": 0.7652266089396642, "eval_stsb_spearman": 0.8388210247529404, "step": 5500 }, { "epoch": 0.36, "eval_avg_sts": 0.8040364434874829, "eval_sickr_spearman": 0.7675117846527851, "eval_stsb_spearman": 0.8405611023221807, "step": 5625 }, { "epoch": 0.37, "eval_avg_sts": 0.8016723711497669, "eval_sickr_spearman": 0.7650260310600586, "eval_stsb_spearman": 0.8383187112394752, "step": 5750 }, { "epoch": 0.38, "eval_avg_sts": 0.8020864629480828, "eval_sickr_spearman": 0.7653134972021658, "eval_stsb_spearman": 0.8388594286939999, "step": 5875 }, { "epoch": 0.38, "learning_rate": 5.656086010495328e-06, "loss": 0.0001, "step": 6000 }, { "epoch": 0.38, "eval_avg_sts": 0.8028151558848002, "eval_sickr_spearman": 0.7671768637824573, "eval_stsb_spearman": 0.838453447987143, "step": 6000 }, { "epoch": 0.39, "eval_avg_sts": 0.8049514040827435, "eval_sickr_spearman": 0.7685626571211498, "eval_stsb_spearman": 0.8413401510443372, "step": 6125 }, { "epoch": 0.4, "eval_avg_sts": 0.8059812583547672, "eval_sickr_spearman": 0.7690958503782142, "eval_stsb_spearman": 0.8428666663313202, "step": 6250 }, { "epoch": 0.41, "eval_avg_sts": 0.8063265220940947, "eval_sickr_spearman": 0.7693663135104123, "eval_stsb_spearman": 0.8432867306777773, "step": 6375 }, { "epoch": 0.42, "learning_rate": 5.544093178036605e-06, "loss": 0.0001, "step": 6500 }, { "epoch": 0.42, "eval_avg_sts": 0.8061105071256144, "eval_sickr_spearman": 0.769672271626573, "eval_stsb_spearman": 0.8425487426246557, "step": 6500 }, { "epoch": 0.42, "eval_avg_sts": 0.8069978292318387, "eval_sickr_spearman": 0.770697879735581, "eval_stsb_spearman": 0.8432977787280964, "step": 6625 }, { "epoch": 0.43, "eval_avg_sts": 0.8080712074218199, "eval_sickr_spearman": 0.7709677664945618, "eval_stsb_spearman": 0.8451746483490781, "step": 6750 }, { "epoch": 0.44, "eval_avg_sts": 0.808918715708319, "eval_sickr_spearman": 0.7720352577240238, "eval_stsb_spearman": 0.8458021736926141, "step": 6875 }, { "epoch": 0.45, "learning_rate": 5.432100345577883e-06, "loss": 0.0001, "step": 7000 }, { "epoch": 0.45, "eval_avg_sts": 0.8006026057334057, "eval_sickr_spearman": 0.7608432425913206, "eval_stsb_spearman": 0.8403619688754909, "step": 7000 }, { "epoch": 0.46, "eval_avg_sts": 0.8020612965823335, "eval_sickr_spearman": 0.7626692409746934, "eval_stsb_spearman": 0.8414533521899736, "step": 7125 }, { "epoch": 0.46, "eval_avg_sts": 0.810499992265102, "eval_sickr_spearman": 0.7673374317545649, "eval_stsb_spearman": 0.8536625527756392, "step": 7250 }, { "epoch": 0.47, "eval_avg_sts": 0.8112538171528675, "eval_sickr_spearman": 0.7687574232374812, "eval_stsb_spearman": 0.8537502110682538, "step": 7375 }, { "epoch": 0.48, "learning_rate": 5.32010751311916e-06, "loss": 0.0002, "step": 7500 }, { "epoch": 0.48, "eval_avg_sts": 0.8149817134253148, "eval_sickr_spearman": 0.7774900538521474, "eval_stsb_spearman": 0.852473372998482, "step": 7500 }, { "epoch": 0.49, "eval_avg_sts": 0.8174625453813287, "eval_sickr_spearman": 0.7815984901758593, "eval_stsb_spearman": 0.8533266005867981, "step": 7625 }, { "epoch": 0.5, "eval_avg_sts": 0.8176977199916579, "eval_sickr_spearman": 0.782115160734029, "eval_stsb_spearman": 0.8532802792492867, "step": 7750 }, { "epoch": 0.5, "eval_avg_sts": 0.8178800789250669, "eval_sickr_spearman": 0.782127648820403, "eval_stsb_spearman": 0.8536325090297309, "step": 7875 }, { "epoch": 0.51, "learning_rate": 5.2081146806604376e-06, "loss": 0.0001, "step": 8000 }, { "epoch": 0.51, "eval_avg_sts": 0.8181362028628546, "eval_sickr_spearman": 0.7824101677590619, "eval_stsb_spearman": 0.8538622379666473, "step": 8000 }, { "epoch": 0.52, "eval_avg_sts": 0.8182071435777255, "eval_sickr_spearman": 0.7826502752351511, "eval_stsb_spearman": 0.8537640119202999, "step": 8125 }, { "epoch": 0.53, "eval_avg_sts": 0.8175148093264073, "eval_sickr_spearman": 0.7809989179366073, "eval_stsb_spearman": 0.8540307007162073, "step": 8250 }, { "epoch": 0.54, "eval_avg_sts": 0.817271425771201, "eval_sickr_spearman": 0.7809910408359715, "eval_stsb_spearman": 0.8535518107064306, "step": 8375 }, { "epoch": 0.54, "learning_rate": 5.096121848201715e-06, "loss": 0.0, "step": 8500 }, { "epoch": 0.54, "eval_avg_sts": 0.8169878861543607, "eval_sickr_spearman": 0.7807656308769224, "eval_stsb_spearman": 0.8532101414317989, "step": 8500 }, { "epoch": 0.55, "eval_avg_sts": 0.8163714998445242, "eval_sickr_spearman": 0.7799410809585343, "eval_stsb_spearman": 0.852801918730514, "step": 8625 }, { "epoch": 0.56, "eval_avg_sts": 0.814914066335918, "eval_sickr_spearman": 0.7796482833641676, "eval_stsb_spearman": 0.8501798493076684, "step": 8750 }, { "epoch": 0.57, "eval_avg_sts": 0.8150768291940962, "eval_sickr_spearman": 0.7799102930225125, "eval_stsb_spearman": 0.8502433653656799, "step": 8875 }, { "epoch": 0.58, "learning_rate": 4.984129015742992e-06, "loss": 0.0001, "step": 9000 }, { "epoch": 0.58, "eval_avg_sts": 0.8157444131185677, "eval_sickr_spearman": 0.7805133715321694, "eval_stsb_spearman": 0.850975454704966, "step": 9000 }, { "epoch": 0.58, "eval_avg_sts": 0.8194025294491036, "eval_sickr_spearman": 0.7869190393754633, "eval_stsb_spearman": 0.851886019522744, "step": 9125 }, { "epoch": 0.59, "eval_avg_sts": 0.6858142517829269, "eval_sickr_spearman": 0.6164898018315937, "eval_stsb_spearman": 0.7551387017342599, "step": 9250 }, { "epoch": 0.6, "eval_avg_sts": 0.8177747035338222, "eval_sickr_spearman": 0.783078280380066, "eval_stsb_spearman": 0.8524711266875784, "step": 9375 }, { "epoch": 0.61, "learning_rate": 4.872136183284269e-06, "loss": 0.0015, "step": 9500 }, { "epoch": 0.61, "eval_avg_sts": 0.819985242900733, "eval_sickr_spearman": 0.7850574019148235, "eval_stsb_spearman": 0.8549130838866427, "step": 9500 }, { "epoch": 0.62, "eval_avg_sts": 0.820612467391125, "eval_sickr_spearman": 0.7860280624437863, "eval_stsb_spearman": 0.8551968723384636, "step": 9625 }, { "epoch": 0.62, "eval_avg_sts": 0.8210179120381628, "eval_sickr_spearman": 0.7866489124609753, "eval_stsb_spearman": 0.8553869116153502, "step": 9750 }, { "epoch": 0.63, "eval_avg_sts": 0.821463549997331, "eval_sickr_spearman": 0.787914243797261, "eval_stsb_spearman": 0.8550128561974009, "step": 9875 }, { "epoch": 0.64, "learning_rate": 4.760143350825547e-06, "loss": 0.0002, "step": 10000 }, { "epoch": 0.64, "eval_avg_sts": 0.8220538798411258, "eval_sickr_spearman": 0.7882646787133534, "eval_stsb_spearman": 0.8558430809688982, "step": 10000 }, { "epoch": 0.65, "eval_avg_sts": 0.8227053843456922, "eval_sickr_spearman": 0.7892594508552383, "eval_stsb_spearman": 0.856151317836146, "step": 10125 }, { "epoch": 0.66, "eval_avg_sts": 0.8211210354889169, "eval_sickr_spearman": 0.7858874273787755, "eval_stsb_spearman": 0.8563546435990582, "step": 10250 }, { "epoch": 0.66, "eval_avg_sts": 0.8217109523377687, "eval_sickr_spearman": 0.7865405062650296, "eval_stsb_spearman": 0.8568813984105078, "step": 10375 }, { "epoch": 0.67, "learning_rate": 4.648150518366825e-06, "loss": 0.0002, "step": 10500 }, { "epoch": 0.67, "eval_avg_sts": 0.8231847712907092, "eval_sickr_spearman": 0.7883226042216879, "eval_stsb_spearman": 0.8580469383597307, "step": 10500 }, { "epoch": 0.68, "eval_avg_sts": 0.8231833094531285, "eval_sickr_spearman": 0.7886680439032306, "eval_stsb_spearman": 0.8576985750030263, "step": 10625 }, { "epoch": 0.69, "eval_avg_sts": 0.8235797750151058, "eval_sickr_spearman": 0.7894692507063199, "eval_stsb_spearman": 0.8576902993238917, "step": 10750 }, { "epoch": 0.7, "eval_avg_sts": 0.8239802387430818, "eval_sickr_spearman": 0.7900059982648908, "eval_stsb_spearman": 0.8579544792212728, "step": 10875 }, { "epoch": 0.7, "learning_rate": 4.536157685908102e-06, "loss": 0.0001, "step": 11000 }, { "epoch": 0.7, "eval_avg_sts": 0.8228846723006884, "eval_sickr_spearman": 0.7878013707088813, "eval_stsb_spearman": 0.8579679738924955, "step": 11000 }, { "epoch": 0.71, "eval_avg_sts": 0.8233402178257747, "eval_sickr_spearman": 0.788485765873273, "eval_stsb_spearman": 0.8581946697782764, "step": 11125 }, { "epoch": 0.72, "eval_avg_sts": 0.8233165033728497, "eval_sickr_spearman": 0.788493306756199, "eval_stsb_spearman": 0.8581396999895003, "step": 11250 }, { "epoch": 0.73, "eval_avg_sts": 0.8211286933035429, "eval_sickr_spearman": 0.787368274267214, "eval_stsb_spearman": 0.8548891123398719, "step": 11375 }, { "epoch": 0.74, "learning_rate": 4.424164853449379e-06, "loss": 0.0002, "step": 11500 }, { "epoch": 0.74, "eval_avg_sts": 0.8222354006770852, "eval_sickr_spearman": 0.7882437371531265, "eval_stsb_spearman": 0.856227064201044, "step": 11500 }, { "epoch": 0.74, "eval_avg_sts": 0.823058736106017, "eval_sickr_spearman": 0.7882230837795081, "eval_stsb_spearman": 0.8578943884325259, "step": 11625 }, { "epoch": 0.75, "eval_avg_sts": 0.8240623262398707, "eval_sickr_spearman": 0.7903270861780045, "eval_stsb_spearman": 0.8577975663017371, "step": 11750 }, { "epoch": 0.76, "eval_avg_sts": 0.8193741224170432, "eval_sickr_spearman": 0.7834559008995725, "eval_stsb_spearman": 0.8552923439345139, "step": 11875 }, { "epoch": 0.77, "learning_rate": 4.312172020990656e-06, "loss": 0.0004, "step": 12000 }, { "epoch": 0.77, "eval_avg_sts": 0.8219118427006455, "eval_sickr_spearman": 0.785794199010884, "eval_stsb_spearman": 0.8580294863904071, "step": 12000 }, { "epoch": 0.78, "eval_avg_sts": 0.823098023008008, "eval_sickr_spearman": 0.7879260114171134, "eval_stsb_spearman": 0.8582700345989028, "step": 12125 }, { "epoch": 0.78, "eval_avg_sts": 0.8227772117211238, "eval_sickr_spearman": 0.7878058376013152, "eval_stsb_spearman": 0.8577485858409325, "step": 12250 }, { "epoch": 0.79, "eval_avg_sts": 0.8244800942376741, "eval_sickr_spearman": 0.7899311658088503, "eval_stsb_spearman": 0.8590290226664979, "step": 12375 }, { "epoch": 0.8, "learning_rate": 4.2001791885319345e-06, "loss": 0.0003, "step": 12500 }, { "epoch": 0.8, "eval_avg_sts": 0.8252546537289246, "eval_sickr_spearman": 0.7905314585146238, "eval_stsb_spearman": 0.8599778489432254, "step": 12500 }, { "epoch": 0.81, "eval_avg_sts": 0.8242515246774704, "eval_sickr_spearman": 0.7934860436884877, "eval_stsb_spearman": 0.855017005666453, "step": 12625 }, { "epoch": 0.82, "eval_avg_sts": 0.8251886392831695, "eval_sickr_spearman": 0.7935808570827266, "eval_stsb_spearman": 0.8567964214836123, "step": 12750 }, { "epoch": 0.82, "eval_avg_sts": 0.8255732979417849, "eval_sickr_spearman": 0.7939037701776952, "eval_stsb_spearman": 0.8572428257058746, "step": 12875 }, { "epoch": 0.83, "learning_rate": 4.088186356073212e-06, "loss": 0.0002, "step": 13000 }, { "epoch": 0.83, "eval_avg_sts": 0.8272525514506217, "eval_sickr_spearman": 0.7954193915835747, "eval_stsb_spearman": 0.8590857113176686, "step": 13000 }, { "epoch": 0.84, "eval_avg_sts": 0.8276110249953785, "eval_sickr_spearman": 0.7955957617880555, "eval_stsb_spearman": 0.8596262882027015, "step": 13125 }, { "epoch": 0.85, "eval_avg_sts": 0.8262806808137206, "eval_sickr_spearman": 0.792061729406442, "eval_stsb_spearman": 0.8604996322209992, "step": 13250 }, { "epoch": 0.86, "eval_avg_sts": 0.8270413161061019, "eval_sickr_spearman": 0.7918599027181991, "eval_stsb_spearman": 0.8622227294940048, "step": 13375 }, { "epoch": 0.86, "learning_rate": 3.976193523614489e-06, "loss": 0.0002, "step": 13500 }, { "epoch": 0.86, "eval_avg_sts": 0.8277173388272963, "eval_sickr_spearman": 0.7929541472711621, "eval_stsb_spearman": 0.8624805303834304, "step": 13500 }, { "epoch": 0.87, "eval_avg_sts": 0.8280371802211439, "eval_sickr_spearman": 0.7936189937772684, "eval_stsb_spearman": 0.8624553666650194, "step": 13625 }, { "epoch": 0.88, "eval_avg_sts": 0.8280087430461096, "eval_sickr_spearman": 0.7934894538966899, "eval_stsb_spearman": 0.8625280321955292, "step": 13750 }, { "epoch": 0.89, "eval_avg_sts": 0.8279846750031183, "eval_sickr_spearman": 0.7941465193643633, "eval_stsb_spearman": 0.8618228306418733, "step": 13875 }, { "epoch": 0.9, "learning_rate": 3.864200691155766e-06, "loss": 0.0001, "step": 14000 }, { "epoch": 0.9, "eval_avg_sts": 0.8281003824811937, "eval_sickr_spearman": 0.7943439752223754, "eval_stsb_spearman": 0.8618567897400118, "step": 14000 }, { "epoch": 0.9, "eval_avg_sts": 0.8280440185035953, "eval_sickr_spearman": 0.792904915392188, "eval_stsb_spearman": 0.8631831216150027, "step": 14125 }, { "epoch": 0.91, "eval_avg_sts": 0.8279193239585301, "eval_sickr_spearman": 0.7931221120328913, "eval_stsb_spearman": 0.8627165358841689, "step": 14250 }, { "epoch": 0.92, "eval_avg_sts": 0.8275099017452278, "eval_sickr_spearman": 0.793065195177687, "eval_stsb_spearman": 0.8619546083127685, "step": 14375 }, { "epoch": 0.93, "learning_rate": 3.7522078586970435e-06, "loss": 0.0001, "step": 14500 }, { "epoch": 0.93, "eval_avg_sts": 0.8275982959975564, "eval_sickr_spearman": 0.7935053521912658, "eval_stsb_spearman": 0.861691239803847, "step": 14500 }, { "epoch": 0.94, "eval_avg_sts": 0.8276150816017793, "eval_sickr_spearman": 0.7940267778284781, "eval_stsb_spearman": 0.8612033853750805, "step": 14625 }, { "epoch": 0.94, "eval_avg_sts": 0.8277678050001869, "eval_sickr_spearman": 0.7940122244047422, "eval_stsb_spearman": 0.8615233855956315, "step": 14750 }, { "epoch": 0.95, "eval_avg_sts": 0.827775044421294, "eval_sickr_spearman": 0.79435247672733, "eval_stsb_spearman": 0.861197612115258, "step": 14875 }, { "epoch": 0.96, "learning_rate": 3.6402150262383203e-06, "loss": 0.0002, "step": 15000 }, { "epoch": 0.96, "eval_avg_sts": 0.8265288786526938, "eval_sickr_spearman": 0.7941830230014563, "eval_stsb_spearman": 0.8588747343039312, "step": 15000 }, { "epoch": 0.97, "eval_avg_sts": 0.826595528411173, "eval_sickr_spearman": 0.7947538726420482, "eval_stsb_spearman": 0.8584371841802979, "step": 15125 }, { "epoch": 0.98, "eval_avg_sts": 0.8271259707838263, "eval_sickr_spearman": 0.7952840399397222, "eval_stsb_spearman": 0.8589679016279306, "step": 15250 }, { "epoch": 0.98, "eval_avg_sts": 0.8269049666463504, "eval_sickr_spearman": 0.7927316191781993, "eval_stsb_spearman": 0.8610783141145013, "step": 15375 }, { "epoch": 0.99, "learning_rate": 3.5282221937795976e-06, "loss": 0.0003, "step": 15500 }, { "epoch": 0.99, "eval_avg_sts": 0.82737580758211, "eval_sickr_spearman": 0.7935406550508229, "eval_stsb_spearman": 0.8612109601133972, "step": 15500 }, { "epoch": 1.0, "eval_avg_sts": 0.8264028870845463, "eval_sickr_spearman": 0.7940738673657366, "eval_stsb_spearman": 0.8587319068033561, "step": 15625 }, { "epoch": 1.01, "eval_avg_sts": 0.8268441102829658, "eval_sickr_spearman": 0.7937048253555384, "eval_stsb_spearman": 0.8599833952103932, "step": 15750 }, { "epoch": 1.02, "eval_avg_sts": 0.8275739286019619, "eval_sickr_spearman": 0.7947639591733503, "eval_stsb_spearman": 0.8603838980305735, "step": 15875 }, { "epoch": 1.02, "learning_rate": 3.4162293613208757e-06, "loss": 0.0001, "step": 16000 }, { "epoch": 1.02, "eval_avg_sts": 0.8277768410299685, "eval_sickr_spearman": 0.7952131460339995, "eval_stsb_spearman": 0.8603405360259375, "step": 16000 }, { "epoch": 1.03, "eval_avg_sts": 0.8282682698041279, "eval_sickr_spearman": 0.7963400997670419, "eval_stsb_spearman": 0.860196439841214, "step": 16125 }, { "epoch": 1.04, "eval_avg_sts": 0.8264618348746703, "eval_sickr_spearman": 0.7934643816617393, "eval_stsb_spearman": 0.8594592880876013, "step": 16250 }, { "epoch": 1.05, "eval_avg_sts": 0.8264717428559492, "eval_sickr_spearman": 0.7932766280862176, "eval_stsb_spearman": 0.8596668576256806, "step": 16375 }, { "epoch": 1.06, "learning_rate": 3.304236528862153e-06, "loss": 0.0002, "step": 16500 }, { "epoch": 1.06, "eval_avg_sts": 0.8274883631622513, "eval_sickr_spearman": 0.7946689056236043, "eval_stsb_spearman": 0.8603078207008983, "step": 16500 }, { "epoch": 1.06, "eval_avg_sts": 0.8285054599151072, "eval_sickr_spearman": 0.7953375465867241, "eval_stsb_spearman": 0.8616733732434904, "step": 16625 }, { "epoch": 1.07, "eval_avg_sts": 0.8267040342845151, "eval_sickr_spearman": 0.7930167317963359, "eval_stsb_spearman": 0.8603913367726943, "step": 16750 }, { "epoch": 1.08, "eval_avg_sts": 0.8254063226482575, "eval_sickr_spearman": 0.7925604363326739, "eval_stsb_spearman": 0.8582522089638411, "step": 16875 }, { "epoch": 1.09, "learning_rate": 3.19224369640343e-06, "loss": 0.0003, "step": 17000 }, { "epoch": 1.09, "eval_avg_sts": 0.8263459648804743, "eval_sickr_spearman": 0.7938006474029073, "eval_stsb_spearman": 0.8588912823580412, "step": 17000 }, { "epoch": 1.1, "eval_avg_sts": 0.8265585284525776, "eval_sickr_spearman": 0.7938499273129829, "eval_stsb_spearman": 0.8592671295921722, "step": 17125 }, { "epoch": 1.1, "eval_avg_sts": 0.8275713806370856, "eval_sickr_spearman": 0.795413819975808, "eval_stsb_spearman": 0.8597289412983632, "step": 17250 }, { "epoch": 1.11, "eval_avg_sts": 0.8278030720022054, "eval_sickr_spearman": 0.7957596439061624, "eval_stsb_spearman": 0.8598465000982485, "step": 17375 }, { "epoch": 1.12, "learning_rate": 3.0802508639447074e-06, "loss": 0.0003, "step": 17500 }, { "epoch": 1.12, "eval_avg_sts": 0.828665230451958, "eval_sickr_spearman": 0.7959547942713053, "eval_stsb_spearman": 0.8613756666326104, "step": 17500 }, { "epoch": 1.13, "eval_avg_sts": 0.8288773890103436, "eval_sickr_spearman": 0.7964317911396872, "eval_stsb_spearman": 0.861322986881, "step": 17625 }, { "epoch": 1.14, "eval_avg_sts": 0.8287921576974288, "eval_sickr_spearman": 0.7965225699214054, "eval_stsb_spearman": 0.8610617454734522, "step": 17750 }, { "epoch": 1.14, "eval_avg_sts": 0.8287755856452497, "eval_sickr_spearman": 0.7967101794036225, "eval_stsb_spearman": 0.8608409918868768, "step": 17875 }, { "epoch": 1.15, "learning_rate": 2.9682580314859847e-06, "loss": 0.0001, "step": 18000 }, { "epoch": 1.15, "eval_avg_sts": 0.8292774010789281, "eval_sickr_spearman": 0.7969440428365246, "eval_stsb_spearman": 0.8616107593213317, "step": 18000 }, { "epoch": 1.16, "eval_avg_sts": 0.8293137062967321, "eval_sickr_spearman": 0.7971494238262741, "eval_stsb_spearman": 0.8614779887671901, "step": 18125 }, { "epoch": 1.17, "eval_avg_sts": 0.8293003591512393, "eval_sickr_spearman": 0.7972976478053122, "eval_stsb_spearman": 0.8613030704971664, "step": 18250 }, { "epoch": 1.18, "eval_avg_sts": 0.8269276043107123, "eval_sickr_spearman": 0.7936150552269506, "eval_stsb_spearman": 0.8602401533944739, "step": 18375 }, { "epoch": 1.18, "learning_rate": 2.8562651990272623e-06, "loss": 0.0001, "step": 18500 }, { "epoch": 1.18, "eval_avg_sts": 0.8271598852494388, "eval_sickr_spearman": 0.7938677468516165, "eval_stsb_spearman": 0.8604520236472611, "step": 18500 }, { "epoch": 1.19, "eval_avg_sts": 0.8273011691673453, "eval_sickr_spearman": 0.7941100157272702, "eval_stsb_spearman": 0.8604923226074204, "step": 18625 }, { "epoch": 1.2, "eval_avg_sts": 0.8274659412451935, "eval_sickr_spearman": 0.7943473373994759, "eval_stsb_spearman": 0.860584545090911, "step": 18750 }, { "epoch": 1.21, "eval_avg_sts": 0.8273871753451842, "eval_sickr_spearman": 0.7941770191137765, "eval_stsb_spearman": 0.8605973315765919, "step": 18875 }, { "epoch": 1.22, "learning_rate": 2.7442723665685396e-06, "loss": 0.0002, "step": 19000 }, { "epoch": 1.22, "eval_avg_sts": 0.8268924907436139, "eval_sickr_spearman": 0.7941484406084208, "eval_stsb_spearman": 0.859636540878807, "step": 19000 }, { "epoch": 1.22, "eval_avg_sts": 0.8258034139625235, "eval_sickr_spearman": 0.7932116900370734, "eval_stsb_spearman": 0.8583951378879737, "step": 19125 }, { "epoch": 1.23, "eval_avg_sts": 0.8252544789859086, "eval_sickr_spearman": 0.7925500616147634, "eval_stsb_spearman": 0.857958896357054, "step": 19250 }, { "epoch": 1.24, "eval_avg_sts": 0.8253536873185088, "eval_sickr_spearman": 0.7926197067118486, "eval_stsb_spearman": 0.858087667925169, "step": 19375 }, { "epoch": 1.25, "learning_rate": 2.632279534109817e-06, "loss": 0.0002, "step": 19500 }, { "epoch": 1.25, "eval_avg_sts": 0.8259692031147807, "eval_sickr_spearman": 0.7942922457261266, "eval_stsb_spearman": 0.8576461605034348, "step": 19500 }, { "epoch": 1.26, "eval_avg_sts": 0.8262977896726795, "eval_sickr_spearman": 0.7945857637870148, "eval_stsb_spearman": 0.8580098155583442, "step": 19625 }, { "epoch": 1.26, "eval_avg_sts": 0.8265435124446001, "eval_sickr_spearman": 0.7949808676274447, "eval_stsb_spearman": 0.8581061572617555, "step": 19750 }, { "epoch": 1.27, "eval_avg_sts": 0.82660901551375, "eval_sickr_spearman": 0.795241820601558, "eval_stsb_spearman": 0.8579762104259421, "step": 19875 }, { "epoch": 1.28, "learning_rate": 2.5202867016510945e-06, "loss": 0.0001, "step": 20000 }, { "epoch": 1.28, "eval_avg_sts": 0.8249759667991925, "eval_sickr_spearman": 0.7929103429066506, "eval_stsb_spearman": 0.8570415906917342, "step": 20000 }, { "epoch": 1.29, "eval_avg_sts": 0.8252695158247048, "eval_sickr_spearman": 0.7941818702550217, "eval_stsb_spearman": 0.8563571613943879, "step": 20125 }, { "epoch": 1.3, "eval_avg_sts": 0.8254168575586551, "eval_sickr_spearman": 0.794336146152841, "eval_stsb_spearman": 0.8564975689644694, "step": 20250 }, { "epoch": 1.3, "eval_avg_sts": 0.8259865535716795, "eval_sickr_spearman": 0.7950048831781639, "eval_stsb_spearman": 0.8569682239651952, "step": 20375 }, { "epoch": 1.31, "learning_rate": 2.4082938691923718e-06, "loss": 0.0001, "step": 20500 }, { "epoch": 1.31, "eval_avg_sts": 0.826209318888689, "eval_sickr_spearman": 0.7952033957204077, "eval_stsb_spearman": 0.8572152420569702, "step": 20500 }, { "epoch": 1.32, "eval_avg_sts": 0.8259891403986184, "eval_sickr_spearman": 0.7948762078574111, "eval_stsb_spearman": 0.8571020729398255, "step": 20625 }, { "epoch": 1.33, "eval_avg_sts": 0.8259890083537097, "eval_sickr_spearman": 0.7947911447767642, "eval_stsb_spearman": 0.8571868719306552, "step": 20750 }, { "epoch": 1.34, "eval_avg_sts": 0.8261152907691348, "eval_sickr_spearman": 0.7949135280232285, "eval_stsb_spearman": 0.8573170535150412, "step": 20875 }, { "epoch": 1.34, "learning_rate": 2.296301036733649e-06, "loss": 0.0001, "step": 21000 }, { "epoch": 1.34, "eval_avg_sts": 0.826274962054796, "eval_sickr_spearman": 0.7950501284757184, "eval_stsb_spearman": 0.8574997956338737, "step": 21000 }, { "epoch": 1.35, "eval_avg_sts": 0.8260486313726075, "eval_sickr_spearman": 0.794899647034913, "eval_stsb_spearman": 0.8571976157103021, "step": 21125 }, { "epoch": 1.36, "eval_avg_sts": 0.825587114078729, "eval_sickr_spearman": 0.7946725559873136, "eval_stsb_spearman": 0.8565016721701444, "step": 21250 }, { "epoch": 1.37, "eval_avg_sts": 0.8256303672089018, "eval_sickr_spearman": 0.7944853787850091, "eval_stsb_spearman": 0.8567753556327944, "step": 21375 }, { "epoch": 1.38, "learning_rate": 2.1843082042749267e-06, "loss": 0.0002, "step": 21500 }, { "epoch": 1.38, "eval_avg_sts": 0.8254654257169443, "eval_sickr_spearman": 0.7936856129149631, "eval_stsb_spearman": 0.8572452385189255, "step": 21500 }, { "epoch": 1.38, "eval_avg_sts": 0.8257646791990041, "eval_sickr_spearman": 0.7941317738162218, "eval_stsb_spearman": 0.8573975845817864, "step": 21625 }, { "epoch": 1.39, "eval_avg_sts": 0.8263390736725806, "eval_sickr_spearman": 0.7947459955414125, "eval_stsb_spearman": 0.8579321518037489, "step": 21750 }, { "epoch": 1.4, "eval_avg_sts": 0.825957826826842, "eval_sickr_spearman": 0.7945194808670303, "eval_stsb_spearman": 0.8573961727866538, "step": 21875 }, { "epoch": 1.41, "learning_rate": 2.072315371816204e-06, "loss": 0.0001, "step": 22000 }, { "epoch": 1.41, "eval_avg_sts": 0.8257198535359889, "eval_sickr_spearman": 0.7936219236744562, "eval_stsb_spearman": 0.8578177833975217, "step": 22000 }, { "epoch": 1.42, "eval_avg_sts": 0.8270054813778303, "eval_sickr_spearman": 0.7958380306637094, "eval_stsb_spearman": 0.858172932091951, "step": 22125 }, { "epoch": 1.42, "eval_avg_sts": 0.8270091578481822, "eval_sickr_spearman": 0.7962583028012928, "eval_stsb_spearman": 0.8577600128950715, "step": 22250 }, { "epoch": 1.43, "eval_avg_sts": 0.8259725703398417, "eval_sickr_spearman": 0.7959245346773993, "eval_stsb_spearman": 0.8560206060022842, "step": 22375 }, { "epoch": 1.44, "learning_rate": 1.9603225393574807e-06, "loss": 0.0002, "step": 22500 }, { "epoch": 1.44, "eval_avg_sts": 0.8254714237214871, "eval_sickr_spearman": 0.7955676635937141, "eval_stsb_spearman": 0.8553751838492601, "step": 22500 }, { "epoch": 1.45, "eval_avg_sts": 0.8243312613565763, "eval_sickr_spearman": 0.7926490056837258, "eval_stsb_spearman": 0.8560135170294269, "step": 22625 }, { "epoch": 1.46, "eval_avg_sts": 0.8244931271533935, "eval_sickr_spearman": 0.7931114971594734, "eval_stsb_spearman": 0.8558747571473136, "step": 22750 }, { "epoch": 1.46, "eval_avg_sts": 0.8245178381258861, "eval_sickr_spearman": 0.7931850518122927, "eval_stsb_spearman": 0.8558506244394795, "step": 22875 }, { "epoch": 1.47, "learning_rate": 1.8483297068987584e-06, "loss": 0.0002, "step": 23000 }, { "epoch": 1.47, "eval_avg_sts": 0.8250123369922542, "eval_sickr_spearman": 0.7931228324994128, "eval_stsb_spearman": 0.8569018414850956, "step": 23000 }, { "epoch": 1.48, "eval_avg_sts": 0.8254867372327745, "eval_sickr_spearman": 0.7938168819151935, "eval_stsb_spearman": 0.8571565925503556, "step": 23125 }, { "epoch": 1.49, "eval_avg_sts": 0.8256499116596692, "eval_sickr_spearman": 0.7939716381240272, "eval_stsb_spearman": 0.8573281851953113, "step": 23250 }, { "epoch": 1.5, "eval_avg_sts": 0.8258346679802114, "eval_sickr_spearman": 0.7940527146232547, "eval_stsb_spearman": 0.8576166213371682, "step": 23375 }, { "epoch": 1.5, "learning_rate": 1.7363368744400357e-06, "loss": 0.0001, "step": 23500 }, { "epoch": 1.5, "eval_avg_sts": 0.825945269207895, "eval_sickr_spearman": 0.7943781253354978, "eval_stsb_spearman": 0.8575124130802922, "step": 23500 }, { "epoch": 1.51, "eval_avg_sts": 0.8258713568091718, "eval_sickr_spearman": 0.794315540810324, "eval_stsb_spearman": 0.8574271728080196, "step": 23625 }, { "epoch": 1.52, "eval_avg_sts": 0.8258355435328646, "eval_sickr_spearman": 0.7940151062708286, "eval_stsb_spearman": 0.8576559807949005, "step": 23750 }, { "epoch": 1.53, "eval_avg_sts": 0.8257865803230886, "eval_sickr_spearman": 0.7940416194388225, "eval_stsb_spearman": 0.8575315412073548, "step": 23875 }, { "epoch": 1.54, "learning_rate": 1.6243440419813131e-06, "loss": 0.0002, "step": 24000 }, { "epoch": 1.54, "eval_avg_sts": 0.8258057571249391, "eval_sickr_spearman": 0.7941539161539849, "eval_stsb_spearman": 0.8574575980958933, "step": 24000 }, { "epoch": 1.54, "eval_avg_sts": 0.8258599414659757, "eval_sickr_spearman": 0.7942335517201692, "eval_stsb_spearman": 0.8574863312117823, "step": 24125 }, { "epoch": 1.55, "eval_avg_sts": 0.8259837419138151, "eval_sickr_spearman": 0.7943245706573944, "eval_stsb_spearman": 0.8576429131702358, "step": 24250 }, { "epoch": 1.56, "eval_avg_sts": 0.8273046944370666, "eval_sickr_spearman": 0.7953777005875265, "eval_stsb_spearman": 0.8592316882866066, "step": 24375 }, { "epoch": 1.57, "learning_rate": 1.5123512095225906e-06, "loss": 0.0001, "step": 24500 }, { "epoch": 1.57, "eval_avg_sts": 0.8270336322444836, "eval_sickr_spearman": 0.7948833644915253, "eval_stsb_spearman": 0.8591838999974419, "step": 24500 }, { "epoch": 1.58, "eval_avg_sts": 0.8268251999183458, "eval_sickr_spearman": 0.7944777418398805, "eval_stsb_spearman": 0.8591726579968111, "step": 24625 }, { "epoch": 1.58, "eval_avg_sts": 0.8267020534374147, "eval_sickr_spearman": 0.7943936393812624, "eval_stsb_spearman": 0.8590104674935669, "step": 24750 }, { "epoch": 1.59, "eval_avg_sts": 0.825917107993902, "eval_sickr_spearman": 0.7938579965380246, "eval_stsb_spearman": 0.8579762194497796, "step": 24875 }, { "epoch": 1.6, "learning_rate": 1.4003583770638678e-06, "loss": 0.0002, "step": 25000 }, { "epoch": 1.6, "eval_avg_sts": 0.8263527703022291, "eval_sickr_spearman": 0.7941290360434399, "eval_stsb_spearman": 0.8585765045610182, "step": 25000 }, { "epoch": 1.61, "eval_avg_sts": 0.8269584920385149, "eval_sickr_spearman": 0.7941601601971716, "eval_stsb_spearman": 0.8597568238798581, "step": 25125 }, { "epoch": 1.62, "eval_avg_sts": 0.8264998215853827, "eval_sickr_spearman": 0.7927663936956405, "eval_stsb_spearman": 0.8602332494751249, "step": 25250 }, { "epoch": 1.62, "eval_avg_sts": 0.825942745088348, "eval_sickr_spearman": 0.7922521246925426, "eval_stsb_spearman": 0.8596333654841534, "step": 25375 }, { "epoch": 1.63, "learning_rate": 1.2883655446051453e-06, "loss": 0.0001, "step": 25500 }, { "epoch": 1.63, "eval_avg_sts": 0.8259010696773026, "eval_sickr_spearman": 0.7922646127789166, "eval_stsb_spearman": 0.8595375265756887, "step": 25500 }, { "epoch": 1.64, "eval_avg_sts": 0.8259285307896478, "eval_sickr_spearman": 0.7926812825838921, "eval_stsb_spearman": 0.8591757789954035, "step": 25625 }, { "epoch": 1.65, "eval_avg_sts": 0.8258391793675839, "eval_sickr_spearman": 0.7926954517588166, "eval_stsb_spearman": 0.858982906976351, "step": 25750 }, { "epoch": 1.66, "eval_avg_sts": 0.8258409312899861, "eval_sickr_spearman": 0.7928338293620596, "eval_stsb_spearman": 0.8588480332179126, "step": 25875 }, { "epoch": 1.66, "learning_rate": 1.1763727121464225e-06, "loss": 0.0001, "step": 26000 }, { "epoch": 1.66, "eval_avg_sts": 0.8251984305884675, "eval_sickr_spearman": 0.7933060231202977, "eval_stsb_spearman": 0.8570908380566373, "step": 26000 }, { "epoch": 1.67, "eval_avg_sts": 0.8253196217152283, "eval_sickr_spearman": 0.7932125065657978, "eval_stsb_spearman": 0.8574267368646588, "step": 26125 }, { "epoch": 1.68, "eval_avg_sts": 0.8253745698430313, "eval_sickr_spearman": 0.7933913263564519, "eval_stsb_spearman": 0.8573578133296105, "step": 26250 }, { "epoch": 1.69, "eval_avg_sts": 0.825411316540875, "eval_sickr_spearman": 0.7934114513879544, "eval_stsb_spearman": 0.8574111816937955, "step": 26375 }, { "epoch": 1.7, "learning_rate": 1.0643798796877e-06, "loss": 0.0001, "step": 26500 }, { "epoch": 1.7, "eval_avg_sts": 0.8249370852399975, "eval_sickr_spearman": 0.7937128945805799, "eval_stsb_spearman": 0.8561612758994152, "step": 26500 }, { "epoch": 1.7, "eval_avg_sts": 0.825459765367129, "eval_sickr_spearman": 0.7933420944774778, "eval_stsb_spearman": 0.8575774362567802, "step": 26625 }, { "epoch": 1.71, "eval_avg_sts": 0.826427995376563, "eval_sickr_spearman": 0.7947685701590883, "eval_stsb_spearman": 0.8580874205940376, "step": 26750 }, { "epoch": 1.72, "eval_avg_sts": 0.8258856380174763, "eval_sickr_spearman": 0.7942930142237495, "eval_stsb_spearman": 0.857478261811203, "step": 26875 }, { "epoch": 1.73, "learning_rate": 9.523870472289774e-07, "loss": 0.0002, "step": 27000 }, { "epoch": 1.73, "eval_avg_sts": 0.8258593024414255, "eval_sickr_spearman": 0.7941693821686479, "eval_stsb_spearman": 0.8575492227142031, "step": 27000 }, { "epoch": 1.74, "eval_avg_sts": 0.8258720619743833, "eval_sickr_spearman": 0.7941788923267327, "eval_stsb_spearman": 0.857565231622034, "step": 27125 }, { "epoch": 1.74, "eval_avg_sts": 0.8259531389747516, "eval_sickr_spearman": 0.7941532917496662, "eval_stsb_spearman": 0.8577529861998372, "step": 27250 }, { "epoch": 1.75, "eval_avg_sts": 0.825969657799255, "eval_sickr_spearman": 0.7942109771024933, "eval_stsb_spearman": 0.8577283384960166, "step": 27375 }, { "epoch": 1.76, "learning_rate": 8.403942147702547e-07, "loss": 0.0002, "step": 27500 }, { "epoch": 1.76, "eval_avg_sts": 0.8259987251545413, "eval_sickr_spearman": 0.7943161171835413, "eval_stsb_spearman": 0.8576813331255413, "step": 27500 }, { "epoch": 1.77, "eval_avg_sts": 0.8252131722274082, "eval_sickr_spearman": 0.793231382788663, "eval_stsb_spearman": 0.8571949616661534, "step": 27625 }, { "epoch": 1.78, "eval_avg_sts": 0.8252604604270115, "eval_sickr_spearman": 0.7933024207876899, "eval_stsb_spearman": 0.857218500066333, "step": 27750 }, { "epoch": 1.78, "eval_avg_sts": 0.8251969961170478, "eval_sickr_spearman": 0.793198385421975, "eval_stsb_spearman": 0.8571956068121205, "step": 27875 }, { "epoch": 1.79, "learning_rate": 7.284013823115321e-07, "loss": 0.0002, "step": 28000 }, { "epoch": 1.79, "eval_avg_sts": 0.825311717070901, "eval_sickr_spearman": 0.7931744179023573, "eval_stsb_spearman": 0.8574490162394447, "step": 28000 }, { "epoch": 1.8, "eval_avg_sts": 0.8256482381761492, "eval_sickr_spearman": 0.7934648139416521, "eval_stsb_spearman": 0.8578316624106462, "step": 28125 }, { "epoch": 1.81, "eval_avg_sts": 0.8261129479959839, "eval_sickr_spearman": 0.7939418588411357, "eval_stsb_spearman": 0.858284037150832, "step": 28250 }, { "epoch": 1.82, "eval_avg_sts": 0.8262712326490254, "eval_sickr_spearman": 0.7933230261302068, "eval_stsb_spearman": 0.8592194391678438, "step": 28375 }, { "epoch": 1.82, "learning_rate": 6.164085498528094e-07, "loss": 0.0002, "step": 28500 }, { "epoch": 1.82, "eval_avg_sts": 0.8262943695062834, "eval_sickr_spearman": 0.7934199048618075, "eval_stsb_spearman": 0.8591688341507593, "step": 28500 }, { "epoch": 1.83, "eval_avg_sts": 0.8260598340905722, "eval_sickr_spearman": 0.7933951208134654, "eval_stsb_spearman": 0.8587245473676789, "step": 28625 }, { "epoch": 1.84, "eval_avg_sts": 0.8259360112469695, "eval_sickr_spearman": 0.7933420944774778, "eval_stsb_spearman": 0.8585299280164611, "step": 28750 }, { "epoch": 1.85, "eval_avg_sts": 0.8258330858999741, "eval_sickr_spearman": 0.7933054467470805, "eval_stsb_spearman": 0.8583607250528676, "step": 28875 }, { "epoch": 1.86, "learning_rate": 5.044157173940868e-07, "loss": 0.0001, "step": 29000 }, { "epoch": 1.86, "eval_avg_sts": 0.8258376969438936, "eval_sickr_spearman": 0.7933141884075422, "eval_stsb_spearman": 0.8583612054802452, "step": 29000 }, { "epoch": 1.86, "eval_avg_sts": 0.8259136180644091, "eval_sickr_spearman": 0.7933194718287004, "eval_stsb_spearman": 0.8585077643001178, "step": 29125 }, { "epoch": 1.87, "eval_avg_sts": 0.825910175107258, "eval_sickr_spearman": 0.7933039097518345, "eval_stsb_spearman": 0.8585164404626813, "step": 29250 }, { "epoch": 1.88, "eval_avg_sts": 0.8258308833879402, "eval_sickr_spearman": 0.7933173584602371, "eval_stsb_spearman": 0.8583444083156432, "step": 29375 }, { "epoch": 1.89, "learning_rate": 3.9242288493536413e-07, "loss": 0.0001, "step": 29500 }, { "epoch": 1.89, "eval_avg_sts": 0.8257221328599513, "eval_sickr_spearman": 0.7931374819853514, "eval_stsb_spearman": 0.8583067837345514, "step": 29500 }, { "epoch": 1.9, "eval_avg_sts": 0.825786763719202, "eval_sickr_spearman": 0.7932694234210019, "eval_stsb_spearman": 0.858304104017402, "step": 29625 }, { "epoch": 1.9, "eval_avg_sts": 0.8257681951340192, "eval_sickr_spearman": 0.7932804705743327, "eval_stsb_spearman": 0.8582559196937056, "step": 29750 }, { "epoch": 1.91, "eval_avg_sts": 0.8258082608558808, "eval_sickr_spearman": 0.7933519408532725, "eval_stsb_spearman": 0.8582645808584891, "step": 29875 }, { "epoch": 1.92, "learning_rate": 2.804300524766415e-07, "loss": 0.0001, "step": 30000 }, { "epoch": 1.92, "eval_avg_sts": 0.8258262861889483, "eval_sickr_spearman": 0.7933999719547107, "eval_stsb_spearman": 0.8582526004231857, "step": 30000 }, { "epoch": 1.93, "eval_avg_sts": 0.8256086631585, "eval_sickr_spearman": 0.7930556369885008, "eval_stsb_spearman": 0.8581616893284993, "step": 30125 }, { "epoch": 1.94, "eval_avg_sts": 0.8256480515518101, "eval_sickr_spearman": 0.7931325828130048, "eval_stsb_spearman": 0.8581635202906153, "step": 30250 }, { "epoch": 1.94, "eval_avg_sts": 0.8258219208455879, "eval_sickr_spearman": 0.7934267252782117, "eval_stsb_spearman": 0.8582171164129642, "step": 30375 }, { "epoch": 1.95, "learning_rate": 1.6843722001791884e-07, "loss": 0.0002, "step": 30500 }, { "epoch": 1.95, "eval_avg_sts": 0.8258322719939588, "eval_sickr_spearman": 0.7934731233222009, "eval_stsb_spearman": 0.8581914206657169, "step": 30500 }, { "epoch": 1.96, "eval_avg_sts": 0.8258242424865203, "eval_sickr_spearman": 0.7934302315486167, "eval_stsb_spearman": 0.858218253424424, "step": 30625 }, { "epoch": 1.97, "eval_avg_sts": 0.8258248316168127, "eval_sickr_spearman": 0.7934435841948165, "eval_stsb_spearman": 0.858206079038809, "step": 30750 }, { "epoch": 1.98, "eval_avg_sts": 0.8257922895919085, "eval_sickr_spearman": 0.7933790303944838, "eval_stsb_spearman": 0.8582055487893332, "step": 30875 }, { "epoch": 1.98, "learning_rate": 5.64443875591962e-08, "loss": 0.0001, "step": 31000 }, { "epoch": 1.98, "eval_avg_sts": 0.8257897415072173, "eval_sickr_spearman": 0.7933720178536738, "eval_stsb_spearman": 0.8582074651607609, "step": 31000 }, { "epoch": 1.99, "eval_avg_sts": 0.8257977713308224, "eval_sickr_spearman": 0.7933829209137002, "eval_stsb_spearman": 0.8582126217479447, "step": 31125 }, { "epoch": 2.0, "eval_avg_sts": 0.8258126560134551, "eval_sickr_spearman": 0.7934017010743625, "eval_stsb_spearman": 0.8582236109525477, "step": 31250 }, { "epoch": 2.0, "step": 31252, "train_runtime": 21163.9877, "train_samples_per_second": 1.477 } ], "max_steps": 31252, "num_train_epochs": 2, "total_flos": 776159526314354880, "trial_name": null, "trial_params": null }