|
{ |
|
"best_metric": 0.8631831216150027, |
|
"best_model_checkpoint": "result/InfoCSE-bert-large", |
|
"epoch": 2.0, |
|
"global_step": 31252, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.01, |
|
"eval_avg_sts": 0.6667446229182062, |
|
"eval_sickr_spearman": 0.6627723790529534, |
|
"eval_stsb_spearman": 0.6707168667834591, |
|
"step": 125 |
|
}, |
|
{ |
|
"epoch": 0.02, |
|
"eval_avg_sts": 0.7051305088963267, |
|
"eval_sickr_spearman": 0.6969365172570714, |
|
"eval_stsb_spearman": 0.713324500535582, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 0.02, |
|
"eval_avg_sts": 0.725875395370044, |
|
"eval_sickr_spearman": 0.716654533206054, |
|
"eval_stsb_spearman": 0.735096257534034, |
|
"step": 375 |
|
}, |
|
{ |
|
"epoch": 0.03, |
|
"learning_rate": 6.888007167541277e-06, |
|
"loss": 0.001, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.03, |
|
"eval_avg_sts": 0.7357340574594278, |
|
"eval_sickr_spearman": 0.7235103965631273, |
|
"eval_stsb_spearman": 0.7479577183557282, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.04, |
|
"eval_avg_sts": 0.7464037729944727, |
|
"eval_sickr_spearman": 0.7301059313504061, |
|
"eval_stsb_spearman": 0.7627016146385392, |
|
"step": 625 |
|
}, |
|
{ |
|
"epoch": 0.05, |
|
"eval_avg_sts": 0.7591284137806686, |
|
"eval_sickr_spearman": 0.7344878567657066, |
|
"eval_stsb_spearman": 0.7837689707956308, |
|
"step": 750 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"eval_avg_sts": 0.7608889169495914, |
|
"eval_sickr_spearman": 0.7373875423906269, |
|
"eval_stsb_spearman": 0.7843902915085559, |
|
"step": 875 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"learning_rate": 6.776014335082554e-06, |
|
"loss": 0.0002, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"eval_avg_sts": 0.7633437897321462, |
|
"eval_sickr_spearman": 0.7394359247736582, |
|
"eval_stsb_spearman": 0.7872516546906342, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.07, |
|
"eval_avg_sts": 0.7689886003242912, |
|
"eval_sickr_spearman": 0.7459672900094155, |
|
"eval_stsb_spearman": 0.7920099106391669, |
|
"step": 1125 |
|
}, |
|
{ |
|
"epoch": 0.08, |
|
"eval_avg_sts": 0.7695141299706598, |
|
"eval_sickr_spearman": 0.749662274611948, |
|
"eval_stsb_spearman": 0.7893659853293715, |
|
"step": 1250 |
|
}, |
|
{ |
|
"epoch": 0.09, |
|
"eval_avg_sts": 0.771575990947651, |
|
"eval_sickr_spearman": 0.7507335602984238, |
|
"eval_stsb_spearman": 0.7924184215968783, |
|
"step": 1375 |
|
}, |
|
{ |
|
"epoch": 0.1, |
|
"learning_rate": 6.6640215026238325e-06, |
|
"loss": 0.0003, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 0.1, |
|
"eval_avg_sts": 0.7721249223821594, |
|
"eval_sickr_spearman": 0.7508546947362507, |
|
"eval_stsb_spearman": 0.7933951500280679, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 0.1, |
|
"eval_avg_sts": 0.7736414601237904, |
|
"eval_sickr_spearman": 0.7518223773369244, |
|
"eval_stsb_spearman": 0.7954605429106565, |
|
"step": 1625 |
|
}, |
|
{ |
|
"epoch": 0.11, |
|
"eval_avg_sts": 0.7750895970401648, |
|
"eval_sickr_spearman": 0.7527568224154028, |
|
"eval_stsb_spearman": 0.7974223716649267, |
|
"step": 1750 |
|
}, |
|
{ |
|
"epoch": 0.12, |
|
"eval_avg_sts": 0.7776564224610277, |
|
"eval_sickr_spearman": 0.7542352378193863, |
|
"eval_stsb_spearman": 0.8010776071026692, |
|
"step": 1875 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"learning_rate": 6.55202867016511e-06, |
|
"loss": 0.0001, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"eval_avg_sts": 0.7785919822208553, |
|
"eval_sickr_spearman": 0.7546353668237488, |
|
"eval_stsb_spearman": 0.802548597617962, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 0.14, |
|
"eval_avg_sts": 0.7804785012417673, |
|
"eval_sickr_spearman": 0.7560601133857076, |
|
"eval_stsb_spearman": 0.8048968890978271, |
|
"step": 2125 |
|
}, |
|
{ |
|
"epoch": 0.14, |
|
"eval_avg_sts": 0.7791958793390172, |
|
"eval_sickr_spearman": 0.7571627153503209, |
|
"eval_stsb_spearman": 0.8012290433277136, |
|
"step": 2250 |
|
}, |
|
{ |
|
"epoch": 0.15, |
|
"eval_avg_sts": 0.7808643358009081, |
|
"eval_sickr_spearman": 0.757428807652288, |
|
"eval_stsb_spearman": 0.8042998639495281, |
|
"step": 2375 |
|
}, |
|
{ |
|
"epoch": 0.16, |
|
"learning_rate": 6.440035837706387e-06, |
|
"loss": 0.0005, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 0.16, |
|
"eval_avg_sts": 0.7997499220712412, |
|
"eval_sickr_spearman": 0.7682156324132593, |
|
"eval_stsb_spearman": 0.8312842117292232, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 0.17, |
|
"eval_avg_sts": 0.8000945443564438, |
|
"eval_sickr_spearman": 0.769006603032424, |
|
"eval_stsb_spearman": 0.8311824856804637, |
|
"step": 2625 |
|
}, |
|
{ |
|
"epoch": 0.18, |
|
"eval_avg_sts": 0.8015655863550484, |
|
"eval_sickr_spearman": 0.7697635307193054, |
|
"eval_stsb_spearman": 0.8333676419907914, |
|
"step": 2750 |
|
}, |
|
{ |
|
"epoch": 0.18, |
|
"eval_avg_sts": 0.8020135971999303, |
|
"eval_sickr_spearman": 0.7738109675441908, |
|
"eval_stsb_spearman": 0.8302162268556699, |
|
"step": 2875 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"learning_rate": 6.328043005247664e-06, |
|
"loss": 0.0001, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"eval_avg_sts": 0.8021055052889553, |
|
"eval_sickr_spearman": 0.7723527913356312, |
|
"eval_stsb_spearman": 0.8318582192422794, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"eval_avg_sts": 0.8034828561746414, |
|
"eval_sickr_spearman": 0.7730187425570707, |
|
"eval_stsb_spearman": 0.8339469697922121, |
|
"step": 3125 |
|
}, |
|
{ |
|
"epoch": 0.21, |
|
"eval_avg_sts": 0.809294388946485, |
|
"eval_sickr_spearman": 0.7739637544778655, |
|
"eval_stsb_spearman": 0.8446250234151045, |
|
"step": 3250 |
|
}, |
|
{ |
|
"epoch": 0.22, |
|
"eval_avg_sts": 0.8095468267478854, |
|
"eval_sickr_spearman": 0.7742509804644655, |
|
"eval_stsb_spearman": 0.8448426730313053, |
|
"step": 3375 |
|
}, |
|
{ |
|
"epoch": 0.22, |
|
"learning_rate": 6.2160501727889415e-06, |
|
"loss": 0.0001, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 0.22, |
|
"eval_avg_sts": 0.8075109934505635, |
|
"eval_sickr_spearman": 0.7709388998025974, |
|
"eval_stsb_spearman": 0.8440830870985296, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 0.23, |
|
"eval_avg_sts": 0.8072613664062491, |
|
"eval_sickr_spearman": 0.7727868483993274, |
|
"eval_stsb_spearman": 0.8417358844131708, |
|
"step": 3625 |
|
}, |
|
{ |
|
"epoch": 0.24, |
|
"eval_avg_sts": 0.8035650181540979, |
|
"eval_sickr_spearman": 0.7687000741023642, |
|
"eval_stsb_spearman": 0.8384299622058315, |
|
"step": 3750 |
|
}, |
|
{ |
|
"epoch": 0.25, |
|
"eval_avg_sts": 0.8060855472554131, |
|
"eval_sickr_spearman": 0.7709744428176617, |
|
"eval_stsb_spearman": 0.8411966516931645, |
|
"step": 3875 |
|
}, |
|
{ |
|
"epoch": 0.26, |
|
"learning_rate": 6.104057340330219e-06, |
|
"loss": 0.0004, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 0.26, |
|
"eval_avg_sts": 0.803351813599069, |
|
"eval_sickr_spearman": 0.7677387500328843, |
|
"eval_stsb_spearman": 0.8389648771652538, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 0.26, |
|
"eval_avg_sts": 0.802660483963512, |
|
"eval_sickr_spearman": 0.7673760487601211, |
|
"eval_stsb_spearman": 0.8379449191669028, |
|
"step": 4125 |
|
}, |
|
{ |
|
"epoch": 0.27, |
|
"eval_avg_sts": 0.8047314511229144, |
|
"eval_sickr_spearman": 0.7691939779184522, |
|
"eval_stsb_spearman": 0.8402689243273768, |
|
"step": 4250 |
|
}, |
|
{ |
|
"epoch": 0.28, |
|
"eval_avg_sts": 0.8040567267552472, |
|
"eval_sickr_spearman": 0.7695367278583146, |
|
"eval_stsb_spearman": 0.8385767256521798, |
|
"step": 4375 |
|
}, |
|
{ |
|
"epoch": 0.29, |
|
"learning_rate": 5.992064507871497e-06, |
|
"loss": 0.0003, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 0.29, |
|
"eval_avg_sts": 0.8031439674900422, |
|
"eval_sickr_spearman": 0.7708419250087939, |
|
"eval_stsb_spearman": 0.8354460099712906, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"eval_avg_sts": 0.8016452961027151, |
|
"eval_sickr_spearman": 0.76836294380137, |
|
"eval_stsb_spearman": 0.8349276484040601, |
|
"step": 4625 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"eval_avg_sts": 0.8036856358976682, |
|
"eval_sickr_spearman": 0.7702216513648221, |
|
"eval_stsb_spearman": 0.8371496204305142, |
|
"step": 4750 |
|
}, |
|
{ |
|
"epoch": 0.31, |
|
"eval_avg_sts": 0.8061976413597232, |
|
"eval_sickr_spearman": 0.7719798778640656, |
|
"eval_stsb_spearman": 0.8404154048553806, |
|
"step": 4875 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"learning_rate": 5.880071675412773e-06, |
|
"loss": 0.0001, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"eval_avg_sts": 0.8067273899585344, |
|
"eval_sickr_spearman": 0.7723029350523384, |
|
"eval_stsb_spearman": 0.8411518448647305, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 0.33, |
|
"eval_avg_sts": 0.8078358230567408, |
|
"eval_sickr_spearman": 0.7726999601368258, |
|
"eval_stsb_spearman": 0.8429716859766557, |
|
"step": 5125 |
|
}, |
|
{ |
|
"epoch": 0.34, |
|
"eval_avg_sts": 0.802548441043093, |
|
"eval_sickr_spearman": 0.7676195664444124, |
|
"eval_stsb_spearman": 0.8374773156417734, |
|
"step": 5250 |
|
}, |
|
{ |
|
"epoch": 0.34, |
|
"eval_avg_sts": 0.800628830120568, |
|
"eval_sickr_spearman": 0.7634932625509655, |
|
"eval_stsb_spearman": 0.8377643976901704, |
|
"step": 5375 |
|
}, |
|
{ |
|
"epoch": 0.35, |
|
"learning_rate": 5.7680788429540505e-06, |
|
"loss": 0.0002, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 0.35, |
|
"eval_avg_sts": 0.8020238168463023, |
|
"eval_sickr_spearman": 0.7652266089396642, |
|
"eval_stsb_spearman": 0.8388210247529404, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 0.36, |
|
"eval_avg_sts": 0.8040364434874829, |
|
"eval_sickr_spearman": 0.7675117846527851, |
|
"eval_stsb_spearman": 0.8405611023221807, |
|
"step": 5625 |
|
}, |
|
{ |
|
"epoch": 0.37, |
|
"eval_avg_sts": 0.8016723711497669, |
|
"eval_sickr_spearman": 0.7650260310600586, |
|
"eval_stsb_spearman": 0.8383187112394752, |
|
"step": 5750 |
|
}, |
|
{ |
|
"epoch": 0.38, |
|
"eval_avg_sts": 0.8020864629480828, |
|
"eval_sickr_spearman": 0.7653134972021658, |
|
"eval_stsb_spearman": 0.8388594286939999, |
|
"step": 5875 |
|
}, |
|
{ |
|
"epoch": 0.38, |
|
"learning_rate": 5.656086010495328e-06, |
|
"loss": 0.0001, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 0.38, |
|
"eval_avg_sts": 0.8028151558848002, |
|
"eval_sickr_spearman": 0.7671768637824573, |
|
"eval_stsb_spearman": 0.838453447987143, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"eval_avg_sts": 0.8049514040827435, |
|
"eval_sickr_spearman": 0.7685626571211498, |
|
"eval_stsb_spearman": 0.8413401510443372, |
|
"step": 6125 |
|
}, |
|
{ |
|
"epoch": 0.4, |
|
"eval_avg_sts": 0.8059812583547672, |
|
"eval_sickr_spearman": 0.7690958503782142, |
|
"eval_stsb_spearman": 0.8428666663313202, |
|
"step": 6250 |
|
}, |
|
{ |
|
"epoch": 0.41, |
|
"eval_avg_sts": 0.8063265220940947, |
|
"eval_sickr_spearman": 0.7693663135104123, |
|
"eval_stsb_spearman": 0.8432867306777773, |
|
"step": 6375 |
|
}, |
|
{ |
|
"epoch": 0.42, |
|
"learning_rate": 5.544093178036605e-06, |
|
"loss": 0.0001, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 0.42, |
|
"eval_avg_sts": 0.8061105071256144, |
|
"eval_sickr_spearman": 0.769672271626573, |
|
"eval_stsb_spearman": 0.8425487426246557, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 0.42, |
|
"eval_avg_sts": 0.8069978292318387, |
|
"eval_sickr_spearman": 0.770697879735581, |
|
"eval_stsb_spearman": 0.8432977787280964, |
|
"step": 6625 |
|
}, |
|
{ |
|
"epoch": 0.43, |
|
"eval_avg_sts": 0.8080712074218199, |
|
"eval_sickr_spearman": 0.7709677664945618, |
|
"eval_stsb_spearman": 0.8451746483490781, |
|
"step": 6750 |
|
}, |
|
{ |
|
"epoch": 0.44, |
|
"eval_avg_sts": 0.808918715708319, |
|
"eval_sickr_spearman": 0.7720352577240238, |
|
"eval_stsb_spearman": 0.8458021736926141, |
|
"step": 6875 |
|
}, |
|
{ |
|
"epoch": 0.45, |
|
"learning_rate": 5.432100345577883e-06, |
|
"loss": 0.0001, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 0.45, |
|
"eval_avg_sts": 0.8006026057334057, |
|
"eval_sickr_spearman": 0.7608432425913206, |
|
"eval_stsb_spearman": 0.8403619688754909, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 0.46, |
|
"eval_avg_sts": 0.8020612965823335, |
|
"eval_sickr_spearman": 0.7626692409746934, |
|
"eval_stsb_spearman": 0.8414533521899736, |
|
"step": 7125 |
|
}, |
|
{ |
|
"epoch": 0.46, |
|
"eval_avg_sts": 0.810499992265102, |
|
"eval_sickr_spearman": 0.7673374317545649, |
|
"eval_stsb_spearman": 0.8536625527756392, |
|
"step": 7250 |
|
}, |
|
{ |
|
"epoch": 0.47, |
|
"eval_avg_sts": 0.8112538171528675, |
|
"eval_sickr_spearman": 0.7687574232374812, |
|
"eval_stsb_spearman": 0.8537502110682538, |
|
"step": 7375 |
|
}, |
|
{ |
|
"epoch": 0.48, |
|
"learning_rate": 5.32010751311916e-06, |
|
"loss": 0.0002, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 0.48, |
|
"eval_avg_sts": 0.8149817134253148, |
|
"eval_sickr_spearman": 0.7774900538521474, |
|
"eval_stsb_spearman": 0.852473372998482, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 0.49, |
|
"eval_avg_sts": 0.8174625453813287, |
|
"eval_sickr_spearman": 0.7815984901758593, |
|
"eval_stsb_spearman": 0.8533266005867981, |
|
"step": 7625 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"eval_avg_sts": 0.8176977199916579, |
|
"eval_sickr_spearman": 0.782115160734029, |
|
"eval_stsb_spearman": 0.8532802792492867, |
|
"step": 7750 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"eval_avg_sts": 0.8178800789250669, |
|
"eval_sickr_spearman": 0.782127648820403, |
|
"eval_stsb_spearman": 0.8536325090297309, |
|
"step": 7875 |
|
}, |
|
{ |
|
"epoch": 0.51, |
|
"learning_rate": 5.2081146806604376e-06, |
|
"loss": 0.0001, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 0.51, |
|
"eval_avg_sts": 0.8181362028628546, |
|
"eval_sickr_spearman": 0.7824101677590619, |
|
"eval_stsb_spearman": 0.8538622379666473, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 0.52, |
|
"eval_avg_sts": 0.8182071435777255, |
|
"eval_sickr_spearman": 0.7826502752351511, |
|
"eval_stsb_spearman": 0.8537640119202999, |
|
"step": 8125 |
|
}, |
|
{ |
|
"epoch": 0.53, |
|
"eval_avg_sts": 0.8175148093264073, |
|
"eval_sickr_spearman": 0.7809989179366073, |
|
"eval_stsb_spearman": 0.8540307007162073, |
|
"step": 8250 |
|
}, |
|
{ |
|
"epoch": 0.54, |
|
"eval_avg_sts": 0.817271425771201, |
|
"eval_sickr_spearman": 0.7809910408359715, |
|
"eval_stsb_spearman": 0.8535518107064306, |
|
"step": 8375 |
|
}, |
|
{ |
|
"epoch": 0.54, |
|
"learning_rate": 5.096121848201715e-06, |
|
"loss": 0.0, |
|
"step": 8500 |
|
}, |
|
{ |
|
"epoch": 0.54, |
|
"eval_avg_sts": 0.8169878861543607, |
|
"eval_sickr_spearman": 0.7807656308769224, |
|
"eval_stsb_spearman": 0.8532101414317989, |
|
"step": 8500 |
|
}, |
|
{ |
|
"epoch": 0.55, |
|
"eval_avg_sts": 0.8163714998445242, |
|
"eval_sickr_spearman": 0.7799410809585343, |
|
"eval_stsb_spearman": 0.852801918730514, |
|
"step": 8625 |
|
}, |
|
{ |
|
"epoch": 0.56, |
|
"eval_avg_sts": 0.814914066335918, |
|
"eval_sickr_spearman": 0.7796482833641676, |
|
"eval_stsb_spearman": 0.8501798493076684, |
|
"step": 8750 |
|
}, |
|
{ |
|
"epoch": 0.57, |
|
"eval_avg_sts": 0.8150768291940962, |
|
"eval_sickr_spearman": 0.7799102930225125, |
|
"eval_stsb_spearman": 0.8502433653656799, |
|
"step": 8875 |
|
}, |
|
{ |
|
"epoch": 0.58, |
|
"learning_rate": 4.984129015742992e-06, |
|
"loss": 0.0001, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 0.58, |
|
"eval_avg_sts": 0.8157444131185677, |
|
"eval_sickr_spearman": 0.7805133715321694, |
|
"eval_stsb_spearman": 0.850975454704966, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 0.58, |
|
"eval_avg_sts": 0.8194025294491036, |
|
"eval_sickr_spearman": 0.7869190393754633, |
|
"eval_stsb_spearman": 0.851886019522744, |
|
"step": 9125 |
|
}, |
|
{ |
|
"epoch": 0.59, |
|
"eval_avg_sts": 0.6858142517829269, |
|
"eval_sickr_spearman": 0.6164898018315937, |
|
"eval_stsb_spearman": 0.7551387017342599, |
|
"step": 9250 |
|
}, |
|
{ |
|
"epoch": 0.6, |
|
"eval_avg_sts": 0.8177747035338222, |
|
"eval_sickr_spearman": 0.783078280380066, |
|
"eval_stsb_spearman": 0.8524711266875784, |
|
"step": 9375 |
|
}, |
|
{ |
|
"epoch": 0.61, |
|
"learning_rate": 4.872136183284269e-06, |
|
"loss": 0.0015, |
|
"step": 9500 |
|
}, |
|
{ |
|
"epoch": 0.61, |
|
"eval_avg_sts": 0.819985242900733, |
|
"eval_sickr_spearman": 0.7850574019148235, |
|
"eval_stsb_spearman": 0.8549130838866427, |
|
"step": 9500 |
|
}, |
|
{ |
|
"epoch": 0.62, |
|
"eval_avg_sts": 0.820612467391125, |
|
"eval_sickr_spearman": 0.7860280624437863, |
|
"eval_stsb_spearman": 0.8551968723384636, |
|
"step": 9625 |
|
}, |
|
{ |
|
"epoch": 0.62, |
|
"eval_avg_sts": 0.8210179120381628, |
|
"eval_sickr_spearman": 0.7866489124609753, |
|
"eval_stsb_spearman": 0.8553869116153502, |
|
"step": 9750 |
|
}, |
|
{ |
|
"epoch": 0.63, |
|
"eval_avg_sts": 0.821463549997331, |
|
"eval_sickr_spearman": 0.787914243797261, |
|
"eval_stsb_spearman": 0.8550128561974009, |
|
"step": 9875 |
|
}, |
|
{ |
|
"epoch": 0.64, |
|
"learning_rate": 4.760143350825547e-06, |
|
"loss": 0.0002, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 0.64, |
|
"eval_avg_sts": 0.8220538798411258, |
|
"eval_sickr_spearman": 0.7882646787133534, |
|
"eval_stsb_spearman": 0.8558430809688982, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 0.65, |
|
"eval_avg_sts": 0.8227053843456922, |
|
"eval_sickr_spearman": 0.7892594508552383, |
|
"eval_stsb_spearman": 0.856151317836146, |
|
"step": 10125 |
|
}, |
|
{ |
|
"epoch": 0.66, |
|
"eval_avg_sts": 0.8211210354889169, |
|
"eval_sickr_spearman": 0.7858874273787755, |
|
"eval_stsb_spearman": 0.8563546435990582, |
|
"step": 10250 |
|
}, |
|
{ |
|
"epoch": 0.66, |
|
"eval_avg_sts": 0.8217109523377687, |
|
"eval_sickr_spearman": 0.7865405062650296, |
|
"eval_stsb_spearman": 0.8568813984105078, |
|
"step": 10375 |
|
}, |
|
{ |
|
"epoch": 0.67, |
|
"learning_rate": 4.648150518366825e-06, |
|
"loss": 0.0002, |
|
"step": 10500 |
|
}, |
|
{ |
|
"epoch": 0.67, |
|
"eval_avg_sts": 0.8231847712907092, |
|
"eval_sickr_spearman": 0.7883226042216879, |
|
"eval_stsb_spearman": 0.8580469383597307, |
|
"step": 10500 |
|
}, |
|
{ |
|
"epoch": 0.68, |
|
"eval_avg_sts": 0.8231833094531285, |
|
"eval_sickr_spearman": 0.7886680439032306, |
|
"eval_stsb_spearman": 0.8576985750030263, |
|
"step": 10625 |
|
}, |
|
{ |
|
"epoch": 0.69, |
|
"eval_avg_sts": 0.8235797750151058, |
|
"eval_sickr_spearman": 0.7894692507063199, |
|
"eval_stsb_spearman": 0.8576902993238917, |
|
"step": 10750 |
|
}, |
|
{ |
|
"epoch": 0.7, |
|
"eval_avg_sts": 0.8239802387430818, |
|
"eval_sickr_spearman": 0.7900059982648908, |
|
"eval_stsb_spearman": 0.8579544792212728, |
|
"step": 10875 |
|
}, |
|
{ |
|
"epoch": 0.7, |
|
"learning_rate": 4.536157685908102e-06, |
|
"loss": 0.0001, |
|
"step": 11000 |
|
}, |
|
{ |
|
"epoch": 0.7, |
|
"eval_avg_sts": 0.8228846723006884, |
|
"eval_sickr_spearman": 0.7878013707088813, |
|
"eval_stsb_spearman": 0.8579679738924955, |
|
"step": 11000 |
|
}, |
|
{ |
|
"epoch": 0.71, |
|
"eval_avg_sts": 0.8233402178257747, |
|
"eval_sickr_spearman": 0.788485765873273, |
|
"eval_stsb_spearman": 0.8581946697782764, |
|
"step": 11125 |
|
}, |
|
{ |
|
"epoch": 0.72, |
|
"eval_avg_sts": 0.8233165033728497, |
|
"eval_sickr_spearman": 0.788493306756199, |
|
"eval_stsb_spearman": 0.8581396999895003, |
|
"step": 11250 |
|
}, |
|
{ |
|
"epoch": 0.73, |
|
"eval_avg_sts": 0.8211286933035429, |
|
"eval_sickr_spearman": 0.787368274267214, |
|
"eval_stsb_spearman": 0.8548891123398719, |
|
"step": 11375 |
|
}, |
|
{ |
|
"epoch": 0.74, |
|
"learning_rate": 4.424164853449379e-06, |
|
"loss": 0.0002, |
|
"step": 11500 |
|
}, |
|
{ |
|
"epoch": 0.74, |
|
"eval_avg_sts": 0.8222354006770852, |
|
"eval_sickr_spearman": 0.7882437371531265, |
|
"eval_stsb_spearman": 0.856227064201044, |
|
"step": 11500 |
|
}, |
|
{ |
|
"epoch": 0.74, |
|
"eval_avg_sts": 0.823058736106017, |
|
"eval_sickr_spearman": 0.7882230837795081, |
|
"eval_stsb_spearman": 0.8578943884325259, |
|
"step": 11625 |
|
}, |
|
{ |
|
"epoch": 0.75, |
|
"eval_avg_sts": 0.8240623262398707, |
|
"eval_sickr_spearman": 0.7903270861780045, |
|
"eval_stsb_spearman": 0.8577975663017371, |
|
"step": 11750 |
|
}, |
|
{ |
|
"epoch": 0.76, |
|
"eval_avg_sts": 0.8193741224170432, |
|
"eval_sickr_spearman": 0.7834559008995725, |
|
"eval_stsb_spearman": 0.8552923439345139, |
|
"step": 11875 |
|
}, |
|
{ |
|
"epoch": 0.77, |
|
"learning_rate": 4.312172020990656e-06, |
|
"loss": 0.0004, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 0.77, |
|
"eval_avg_sts": 0.8219118427006455, |
|
"eval_sickr_spearman": 0.785794199010884, |
|
"eval_stsb_spearman": 0.8580294863904071, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 0.78, |
|
"eval_avg_sts": 0.823098023008008, |
|
"eval_sickr_spearman": 0.7879260114171134, |
|
"eval_stsb_spearman": 0.8582700345989028, |
|
"step": 12125 |
|
}, |
|
{ |
|
"epoch": 0.78, |
|
"eval_avg_sts": 0.8227772117211238, |
|
"eval_sickr_spearman": 0.7878058376013152, |
|
"eval_stsb_spearman": 0.8577485858409325, |
|
"step": 12250 |
|
}, |
|
{ |
|
"epoch": 0.79, |
|
"eval_avg_sts": 0.8244800942376741, |
|
"eval_sickr_spearman": 0.7899311658088503, |
|
"eval_stsb_spearman": 0.8590290226664979, |
|
"step": 12375 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"learning_rate": 4.2001791885319345e-06, |
|
"loss": 0.0003, |
|
"step": 12500 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"eval_avg_sts": 0.8252546537289246, |
|
"eval_sickr_spearman": 0.7905314585146238, |
|
"eval_stsb_spearman": 0.8599778489432254, |
|
"step": 12500 |
|
}, |
|
{ |
|
"epoch": 0.81, |
|
"eval_avg_sts": 0.8242515246774704, |
|
"eval_sickr_spearman": 0.7934860436884877, |
|
"eval_stsb_spearman": 0.855017005666453, |
|
"step": 12625 |
|
}, |
|
{ |
|
"epoch": 0.82, |
|
"eval_avg_sts": 0.8251886392831695, |
|
"eval_sickr_spearman": 0.7935808570827266, |
|
"eval_stsb_spearman": 0.8567964214836123, |
|
"step": 12750 |
|
}, |
|
{ |
|
"epoch": 0.82, |
|
"eval_avg_sts": 0.8255732979417849, |
|
"eval_sickr_spearman": 0.7939037701776952, |
|
"eval_stsb_spearman": 0.8572428257058746, |
|
"step": 12875 |
|
}, |
|
{ |
|
"epoch": 0.83, |
|
"learning_rate": 4.088186356073212e-06, |
|
"loss": 0.0002, |
|
"step": 13000 |
|
}, |
|
{ |
|
"epoch": 0.83, |
|
"eval_avg_sts": 0.8272525514506217, |
|
"eval_sickr_spearman": 0.7954193915835747, |
|
"eval_stsb_spearman": 0.8590857113176686, |
|
"step": 13000 |
|
}, |
|
{ |
|
"epoch": 0.84, |
|
"eval_avg_sts": 0.8276110249953785, |
|
"eval_sickr_spearman": 0.7955957617880555, |
|
"eval_stsb_spearman": 0.8596262882027015, |
|
"step": 13125 |
|
}, |
|
{ |
|
"epoch": 0.85, |
|
"eval_avg_sts": 0.8262806808137206, |
|
"eval_sickr_spearman": 0.792061729406442, |
|
"eval_stsb_spearman": 0.8604996322209992, |
|
"step": 13250 |
|
}, |
|
{ |
|
"epoch": 0.86, |
|
"eval_avg_sts": 0.8270413161061019, |
|
"eval_sickr_spearman": 0.7918599027181991, |
|
"eval_stsb_spearman": 0.8622227294940048, |
|
"step": 13375 |
|
}, |
|
{ |
|
"epoch": 0.86, |
|
"learning_rate": 3.976193523614489e-06, |
|
"loss": 0.0002, |
|
"step": 13500 |
|
}, |
|
{ |
|
"epoch": 0.86, |
|
"eval_avg_sts": 0.8277173388272963, |
|
"eval_sickr_spearman": 0.7929541472711621, |
|
"eval_stsb_spearman": 0.8624805303834304, |
|
"step": 13500 |
|
}, |
|
{ |
|
"epoch": 0.87, |
|
"eval_avg_sts": 0.8280371802211439, |
|
"eval_sickr_spearman": 0.7936189937772684, |
|
"eval_stsb_spearman": 0.8624553666650194, |
|
"step": 13625 |
|
}, |
|
{ |
|
"epoch": 0.88, |
|
"eval_avg_sts": 0.8280087430461096, |
|
"eval_sickr_spearman": 0.7934894538966899, |
|
"eval_stsb_spearman": 0.8625280321955292, |
|
"step": 13750 |
|
}, |
|
{ |
|
"epoch": 0.89, |
|
"eval_avg_sts": 0.8279846750031183, |
|
"eval_sickr_spearman": 0.7941465193643633, |
|
"eval_stsb_spearman": 0.8618228306418733, |
|
"step": 13875 |
|
}, |
|
{ |
|
"epoch": 0.9, |
|
"learning_rate": 3.864200691155766e-06, |
|
"loss": 0.0001, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 0.9, |
|
"eval_avg_sts": 0.8281003824811937, |
|
"eval_sickr_spearman": 0.7943439752223754, |
|
"eval_stsb_spearman": 0.8618567897400118, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 0.9, |
|
"eval_avg_sts": 0.8280440185035953, |
|
"eval_sickr_spearman": 0.792904915392188, |
|
"eval_stsb_spearman": 0.8631831216150027, |
|
"step": 14125 |
|
}, |
|
{ |
|
"epoch": 0.91, |
|
"eval_avg_sts": 0.8279193239585301, |
|
"eval_sickr_spearman": 0.7931221120328913, |
|
"eval_stsb_spearman": 0.8627165358841689, |
|
"step": 14250 |
|
}, |
|
{ |
|
"epoch": 0.92, |
|
"eval_avg_sts": 0.8275099017452278, |
|
"eval_sickr_spearman": 0.793065195177687, |
|
"eval_stsb_spearman": 0.8619546083127685, |
|
"step": 14375 |
|
}, |
|
{ |
|
"epoch": 0.93, |
|
"learning_rate": 3.7522078586970435e-06, |
|
"loss": 0.0001, |
|
"step": 14500 |
|
}, |
|
{ |
|
"epoch": 0.93, |
|
"eval_avg_sts": 0.8275982959975564, |
|
"eval_sickr_spearman": 0.7935053521912658, |
|
"eval_stsb_spearman": 0.861691239803847, |
|
"step": 14500 |
|
}, |
|
{ |
|
"epoch": 0.94, |
|
"eval_avg_sts": 0.8276150816017793, |
|
"eval_sickr_spearman": 0.7940267778284781, |
|
"eval_stsb_spearman": 0.8612033853750805, |
|
"step": 14625 |
|
}, |
|
{ |
|
"epoch": 0.94, |
|
"eval_avg_sts": 0.8277678050001869, |
|
"eval_sickr_spearman": 0.7940122244047422, |
|
"eval_stsb_spearman": 0.8615233855956315, |
|
"step": 14750 |
|
}, |
|
{ |
|
"epoch": 0.95, |
|
"eval_avg_sts": 0.827775044421294, |
|
"eval_sickr_spearman": 0.79435247672733, |
|
"eval_stsb_spearman": 0.861197612115258, |
|
"step": 14875 |
|
}, |
|
{ |
|
"epoch": 0.96, |
|
"learning_rate": 3.6402150262383203e-06, |
|
"loss": 0.0002, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 0.96, |
|
"eval_avg_sts": 0.8265288786526938, |
|
"eval_sickr_spearman": 0.7941830230014563, |
|
"eval_stsb_spearman": 0.8588747343039312, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 0.97, |
|
"eval_avg_sts": 0.826595528411173, |
|
"eval_sickr_spearman": 0.7947538726420482, |
|
"eval_stsb_spearman": 0.8584371841802979, |
|
"step": 15125 |
|
}, |
|
{ |
|
"epoch": 0.98, |
|
"eval_avg_sts": 0.8271259707838263, |
|
"eval_sickr_spearman": 0.7952840399397222, |
|
"eval_stsb_spearman": 0.8589679016279306, |
|
"step": 15250 |
|
}, |
|
{ |
|
"epoch": 0.98, |
|
"eval_avg_sts": 0.8269049666463504, |
|
"eval_sickr_spearman": 0.7927316191781993, |
|
"eval_stsb_spearman": 0.8610783141145013, |
|
"step": 15375 |
|
}, |
|
{ |
|
"epoch": 0.99, |
|
"learning_rate": 3.5282221937795976e-06, |
|
"loss": 0.0003, |
|
"step": 15500 |
|
}, |
|
{ |
|
"epoch": 0.99, |
|
"eval_avg_sts": 0.82737580758211, |
|
"eval_sickr_spearman": 0.7935406550508229, |
|
"eval_stsb_spearman": 0.8612109601133972, |
|
"step": 15500 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_avg_sts": 0.8264028870845463, |
|
"eval_sickr_spearman": 0.7940738673657366, |
|
"eval_stsb_spearman": 0.8587319068033561, |
|
"step": 15625 |
|
}, |
|
{ |
|
"epoch": 1.01, |
|
"eval_avg_sts": 0.8268441102829658, |
|
"eval_sickr_spearman": 0.7937048253555384, |
|
"eval_stsb_spearman": 0.8599833952103932, |
|
"step": 15750 |
|
}, |
|
{ |
|
"epoch": 1.02, |
|
"eval_avg_sts": 0.8275739286019619, |
|
"eval_sickr_spearman": 0.7947639591733503, |
|
"eval_stsb_spearman": 0.8603838980305735, |
|
"step": 15875 |
|
}, |
|
{ |
|
"epoch": 1.02, |
|
"learning_rate": 3.4162293613208757e-06, |
|
"loss": 0.0001, |
|
"step": 16000 |
|
}, |
|
{ |
|
"epoch": 1.02, |
|
"eval_avg_sts": 0.8277768410299685, |
|
"eval_sickr_spearman": 0.7952131460339995, |
|
"eval_stsb_spearman": 0.8603405360259375, |
|
"step": 16000 |
|
}, |
|
{ |
|
"epoch": 1.03, |
|
"eval_avg_sts": 0.8282682698041279, |
|
"eval_sickr_spearman": 0.7963400997670419, |
|
"eval_stsb_spearman": 0.860196439841214, |
|
"step": 16125 |
|
}, |
|
{ |
|
"epoch": 1.04, |
|
"eval_avg_sts": 0.8264618348746703, |
|
"eval_sickr_spearman": 0.7934643816617393, |
|
"eval_stsb_spearman": 0.8594592880876013, |
|
"step": 16250 |
|
}, |
|
{ |
|
"epoch": 1.05, |
|
"eval_avg_sts": 0.8264717428559492, |
|
"eval_sickr_spearman": 0.7932766280862176, |
|
"eval_stsb_spearman": 0.8596668576256806, |
|
"step": 16375 |
|
}, |
|
{ |
|
"epoch": 1.06, |
|
"learning_rate": 3.304236528862153e-06, |
|
"loss": 0.0002, |
|
"step": 16500 |
|
}, |
|
{ |
|
"epoch": 1.06, |
|
"eval_avg_sts": 0.8274883631622513, |
|
"eval_sickr_spearman": 0.7946689056236043, |
|
"eval_stsb_spearman": 0.8603078207008983, |
|
"step": 16500 |
|
}, |
|
{ |
|
"epoch": 1.06, |
|
"eval_avg_sts": 0.8285054599151072, |
|
"eval_sickr_spearman": 0.7953375465867241, |
|
"eval_stsb_spearman": 0.8616733732434904, |
|
"step": 16625 |
|
}, |
|
{ |
|
"epoch": 1.07, |
|
"eval_avg_sts": 0.8267040342845151, |
|
"eval_sickr_spearman": 0.7930167317963359, |
|
"eval_stsb_spearman": 0.8603913367726943, |
|
"step": 16750 |
|
}, |
|
{ |
|
"epoch": 1.08, |
|
"eval_avg_sts": 0.8254063226482575, |
|
"eval_sickr_spearman": 0.7925604363326739, |
|
"eval_stsb_spearman": 0.8582522089638411, |
|
"step": 16875 |
|
}, |
|
{ |
|
"epoch": 1.09, |
|
"learning_rate": 3.19224369640343e-06, |
|
"loss": 0.0003, |
|
"step": 17000 |
|
}, |
|
{ |
|
"epoch": 1.09, |
|
"eval_avg_sts": 0.8263459648804743, |
|
"eval_sickr_spearman": 0.7938006474029073, |
|
"eval_stsb_spearman": 0.8588912823580412, |
|
"step": 17000 |
|
}, |
|
{ |
|
"epoch": 1.1, |
|
"eval_avg_sts": 0.8265585284525776, |
|
"eval_sickr_spearman": 0.7938499273129829, |
|
"eval_stsb_spearman": 0.8592671295921722, |
|
"step": 17125 |
|
}, |
|
{ |
|
"epoch": 1.1, |
|
"eval_avg_sts": 0.8275713806370856, |
|
"eval_sickr_spearman": 0.795413819975808, |
|
"eval_stsb_spearman": 0.8597289412983632, |
|
"step": 17250 |
|
}, |
|
{ |
|
"epoch": 1.11, |
|
"eval_avg_sts": 0.8278030720022054, |
|
"eval_sickr_spearman": 0.7957596439061624, |
|
"eval_stsb_spearman": 0.8598465000982485, |
|
"step": 17375 |
|
}, |
|
{ |
|
"epoch": 1.12, |
|
"learning_rate": 3.0802508639447074e-06, |
|
"loss": 0.0003, |
|
"step": 17500 |
|
}, |
|
{ |
|
"epoch": 1.12, |
|
"eval_avg_sts": 0.828665230451958, |
|
"eval_sickr_spearman": 0.7959547942713053, |
|
"eval_stsb_spearman": 0.8613756666326104, |
|
"step": 17500 |
|
}, |
|
{ |
|
"epoch": 1.13, |
|
"eval_avg_sts": 0.8288773890103436, |
|
"eval_sickr_spearman": 0.7964317911396872, |
|
"eval_stsb_spearman": 0.861322986881, |
|
"step": 17625 |
|
}, |
|
{ |
|
"epoch": 1.14, |
|
"eval_avg_sts": 0.8287921576974288, |
|
"eval_sickr_spearman": 0.7965225699214054, |
|
"eval_stsb_spearman": 0.8610617454734522, |
|
"step": 17750 |
|
}, |
|
{ |
|
"epoch": 1.14, |
|
"eval_avg_sts": 0.8287755856452497, |
|
"eval_sickr_spearman": 0.7967101794036225, |
|
"eval_stsb_spearman": 0.8608409918868768, |
|
"step": 17875 |
|
}, |
|
{ |
|
"epoch": 1.15, |
|
"learning_rate": 2.9682580314859847e-06, |
|
"loss": 0.0001, |
|
"step": 18000 |
|
}, |
|
{ |
|
"epoch": 1.15, |
|
"eval_avg_sts": 0.8292774010789281, |
|
"eval_sickr_spearman": 0.7969440428365246, |
|
"eval_stsb_spearman": 0.8616107593213317, |
|
"step": 18000 |
|
}, |
|
{ |
|
"epoch": 1.16, |
|
"eval_avg_sts": 0.8293137062967321, |
|
"eval_sickr_spearman": 0.7971494238262741, |
|
"eval_stsb_spearman": 0.8614779887671901, |
|
"step": 18125 |
|
}, |
|
{ |
|
"epoch": 1.17, |
|
"eval_avg_sts": 0.8293003591512393, |
|
"eval_sickr_spearman": 0.7972976478053122, |
|
"eval_stsb_spearman": 0.8613030704971664, |
|
"step": 18250 |
|
}, |
|
{ |
|
"epoch": 1.18, |
|
"eval_avg_sts": 0.8269276043107123, |
|
"eval_sickr_spearman": 0.7936150552269506, |
|
"eval_stsb_spearman": 0.8602401533944739, |
|
"step": 18375 |
|
}, |
|
{ |
|
"epoch": 1.18, |
|
"learning_rate": 2.8562651990272623e-06, |
|
"loss": 0.0001, |
|
"step": 18500 |
|
}, |
|
{ |
|
"epoch": 1.18, |
|
"eval_avg_sts": 0.8271598852494388, |
|
"eval_sickr_spearman": 0.7938677468516165, |
|
"eval_stsb_spearman": 0.8604520236472611, |
|
"step": 18500 |
|
}, |
|
{ |
|
"epoch": 1.19, |
|
"eval_avg_sts": 0.8273011691673453, |
|
"eval_sickr_spearman": 0.7941100157272702, |
|
"eval_stsb_spearman": 0.8604923226074204, |
|
"step": 18625 |
|
}, |
|
{ |
|
"epoch": 1.2, |
|
"eval_avg_sts": 0.8274659412451935, |
|
"eval_sickr_spearman": 0.7943473373994759, |
|
"eval_stsb_spearman": 0.860584545090911, |
|
"step": 18750 |
|
}, |
|
{ |
|
"epoch": 1.21, |
|
"eval_avg_sts": 0.8273871753451842, |
|
"eval_sickr_spearman": 0.7941770191137765, |
|
"eval_stsb_spearman": 0.8605973315765919, |
|
"step": 18875 |
|
}, |
|
{ |
|
"epoch": 1.22, |
|
"learning_rate": 2.7442723665685396e-06, |
|
"loss": 0.0002, |
|
"step": 19000 |
|
}, |
|
{ |
|
"epoch": 1.22, |
|
"eval_avg_sts": 0.8268924907436139, |
|
"eval_sickr_spearman": 0.7941484406084208, |
|
"eval_stsb_spearman": 0.859636540878807, |
|
"step": 19000 |
|
}, |
|
{ |
|
"epoch": 1.22, |
|
"eval_avg_sts": 0.8258034139625235, |
|
"eval_sickr_spearman": 0.7932116900370734, |
|
"eval_stsb_spearman": 0.8583951378879737, |
|
"step": 19125 |
|
}, |
|
{ |
|
"epoch": 1.23, |
|
"eval_avg_sts": 0.8252544789859086, |
|
"eval_sickr_spearman": 0.7925500616147634, |
|
"eval_stsb_spearman": 0.857958896357054, |
|
"step": 19250 |
|
}, |
|
{ |
|
"epoch": 1.24, |
|
"eval_avg_sts": 0.8253536873185088, |
|
"eval_sickr_spearman": 0.7926197067118486, |
|
"eval_stsb_spearman": 0.858087667925169, |
|
"step": 19375 |
|
}, |
|
{ |
|
"epoch": 1.25, |
|
"learning_rate": 2.632279534109817e-06, |
|
"loss": 0.0002, |
|
"step": 19500 |
|
}, |
|
{ |
|
"epoch": 1.25, |
|
"eval_avg_sts": 0.8259692031147807, |
|
"eval_sickr_spearman": 0.7942922457261266, |
|
"eval_stsb_spearman": 0.8576461605034348, |
|
"step": 19500 |
|
}, |
|
{ |
|
"epoch": 1.26, |
|
"eval_avg_sts": 0.8262977896726795, |
|
"eval_sickr_spearman": 0.7945857637870148, |
|
"eval_stsb_spearman": 0.8580098155583442, |
|
"step": 19625 |
|
}, |
|
{ |
|
"epoch": 1.26, |
|
"eval_avg_sts": 0.8265435124446001, |
|
"eval_sickr_spearman": 0.7949808676274447, |
|
"eval_stsb_spearman": 0.8581061572617555, |
|
"step": 19750 |
|
}, |
|
{ |
|
"epoch": 1.27, |
|
"eval_avg_sts": 0.82660901551375, |
|
"eval_sickr_spearman": 0.795241820601558, |
|
"eval_stsb_spearman": 0.8579762104259421, |
|
"step": 19875 |
|
}, |
|
{ |
|
"epoch": 1.28, |
|
"learning_rate": 2.5202867016510945e-06, |
|
"loss": 0.0001, |
|
"step": 20000 |
|
}, |
|
{ |
|
"epoch": 1.28, |
|
"eval_avg_sts": 0.8249759667991925, |
|
"eval_sickr_spearman": 0.7929103429066506, |
|
"eval_stsb_spearman": 0.8570415906917342, |
|
"step": 20000 |
|
}, |
|
{ |
|
"epoch": 1.29, |
|
"eval_avg_sts": 0.8252695158247048, |
|
"eval_sickr_spearman": 0.7941818702550217, |
|
"eval_stsb_spearman": 0.8563571613943879, |
|
"step": 20125 |
|
}, |
|
{ |
|
"epoch": 1.3, |
|
"eval_avg_sts": 0.8254168575586551, |
|
"eval_sickr_spearman": 0.794336146152841, |
|
"eval_stsb_spearman": 0.8564975689644694, |
|
"step": 20250 |
|
}, |
|
{ |
|
"epoch": 1.3, |
|
"eval_avg_sts": 0.8259865535716795, |
|
"eval_sickr_spearman": 0.7950048831781639, |
|
"eval_stsb_spearman": 0.8569682239651952, |
|
"step": 20375 |
|
}, |
|
{ |
|
"epoch": 1.31, |
|
"learning_rate": 2.4082938691923718e-06, |
|
"loss": 0.0001, |
|
"step": 20500 |
|
}, |
|
{ |
|
"epoch": 1.31, |
|
"eval_avg_sts": 0.826209318888689, |
|
"eval_sickr_spearman": 0.7952033957204077, |
|
"eval_stsb_spearman": 0.8572152420569702, |
|
"step": 20500 |
|
}, |
|
{ |
|
"epoch": 1.32, |
|
"eval_avg_sts": 0.8259891403986184, |
|
"eval_sickr_spearman": 0.7948762078574111, |
|
"eval_stsb_spearman": 0.8571020729398255, |
|
"step": 20625 |
|
}, |
|
{ |
|
"epoch": 1.33, |
|
"eval_avg_sts": 0.8259890083537097, |
|
"eval_sickr_spearman": 0.7947911447767642, |
|
"eval_stsb_spearman": 0.8571868719306552, |
|
"step": 20750 |
|
}, |
|
{ |
|
"epoch": 1.34, |
|
"eval_avg_sts": 0.8261152907691348, |
|
"eval_sickr_spearman": 0.7949135280232285, |
|
"eval_stsb_spearman": 0.8573170535150412, |
|
"step": 20875 |
|
}, |
|
{ |
|
"epoch": 1.34, |
|
"learning_rate": 2.296301036733649e-06, |
|
"loss": 0.0001, |
|
"step": 21000 |
|
}, |
|
{ |
|
"epoch": 1.34, |
|
"eval_avg_sts": 0.826274962054796, |
|
"eval_sickr_spearman": 0.7950501284757184, |
|
"eval_stsb_spearman": 0.8574997956338737, |
|
"step": 21000 |
|
}, |
|
{ |
|
"epoch": 1.35, |
|
"eval_avg_sts": 0.8260486313726075, |
|
"eval_sickr_spearman": 0.794899647034913, |
|
"eval_stsb_spearman": 0.8571976157103021, |
|
"step": 21125 |
|
}, |
|
{ |
|
"epoch": 1.36, |
|
"eval_avg_sts": 0.825587114078729, |
|
"eval_sickr_spearman": 0.7946725559873136, |
|
"eval_stsb_spearman": 0.8565016721701444, |
|
"step": 21250 |
|
}, |
|
{ |
|
"epoch": 1.37, |
|
"eval_avg_sts": 0.8256303672089018, |
|
"eval_sickr_spearman": 0.7944853787850091, |
|
"eval_stsb_spearman": 0.8567753556327944, |
|
"step": 21375 |
|
}, |
|
{ |
|
"epoch": 1.38, |
|
"learning_rate": 2.1843082042749267e-06, |
|
"loss": 0.0002, |
|
"step": 21500 |
|
}, |
|
{ |
|
"epoch": 1.38, |
|
"eval_avg_sts": 0.8254654257169443, |
|
"eval_sickr_spearman": 0.7936856129149631, |
|
"eval_stsb_spearman": 0.8572452385189255, |
|
"step": 21500 |
|
}, |
|
{ |
|
"epoch": 1.38, |
|
"eval_avg_sts": 0.8257646791990041, |
|
"eval_sickr_spearman": 0.7941317738162218, |
|
"eval_stsb_spearman": 0.8573975845817864, |
|
"step": 21625 |
|
}, |
|
{ |
|
"epoch": 1.39, |
|
"eval_avg_sts": 0.8263390736725806, |
|
"eval_sickr_spearman": 0.7947459955414125, |
|
"eval_stsb_spearman": 0.8579321518037489, |
|
"step": 21750 |
|
}, |
|
{ |
|
"epoch": 1.4, |
|
"eval_avg_sts": 0.825957826826842, |
|
"eval_sickr_spearman": 0.7945194808670303, |
|
"eval_stsb_spearman": 0.8573961727866538, |
|
"step": 21875 |
|
}, |
|
{ |
|
"epoch": 1.41, |
|
"learning_rate": 2.072315371816204e-06, |
|
"loss": 0.0001, |
|
"step": 22000 |
|
}, |
|
{ |
|
"epoch": 1.41, |
|
"eval_avg_sts": 0.8257198535359889, |
|
"eval_sickr_spearman": 0.7936219236744562, |
|
"eval_stsb_spearman": 0.8578177833975217, |
|
"step": 22000 |
|
}, |
|
{ |
|
"epoch": 1.42, |
|
"eval_avg_sts": 0.8270054813778303, |
|
"eval_sickr_spearman": 0.7958380306637094, |
|
"eval_stsb_spearman": 0.858172932091951, |
|
"step": 22125 |
|
}, |
|
{ |
|
"epoch": 1.42, |
|
"eval_avg_sts": 0.8270091578481822, |
|
"eval_sickr_spearman": 0.7962583028012928, |
|
"eval_stsb_spearman": 0.8577600128950715, |
|
"step": 22250 |
|
}, |
|
{ |
|
"epoch": 1.43, |
|
"eval_avg_sts": 0.8259725703398417, |
|
"eval_sickr_spearman": 0.7959245346773993, |
|
"eval_stsb_spearman": 0.8560206060022842, |
|
"step": 22375 |
|
}, |
|
{ |
|
"epoch": 1.44, |
|
"learning_rate": 1.9603225393574807e-06, |
|
"loss": 0.0002, |
|
"step": 22500 |
|
}, |
|
{ |
|
"epoch": 1.44, |
|
"eval_avg_sts": 0.8254714237214871, |
|
"eval_sickr_spearman": 0.7955676635937141, |
|
"eval_stsb_spearman": 0.8553751838492601, |
|
"step": 22500 |
|
}, |
|
{ |
|
"epoch": 1.45, |
|
"eval_avg_sts": 0.8243312613565763, |
|
"eval_sickr_spearman": 0.7926490056837258, |
|
"eval_stsb_spearman": 0.8560135170294269, |
|
"step": 22625 |
|
}, |
|
{ |
|
"epoch": 1.46, |
|
"eval_avg_sts": 0.8244931271533935, |
|
"eval_sickr_spearman": 0.7931114971594734, |
|
"eval_stsb_spearman": 0.8558747571473136, |
|
"step": 22750 |
|
}, |
|
{ |
|
"epoch": 1.46, |
|
"eval_avg_sts": 0.8245178381258861, |
|
"eval_sickr_spearman": 0.7931850518122927, |
|
"eval_stsb_spearman": 0.8558506244394795, |
|
"step": 22875 |
|
}, |
|
{ |
|
"epoch": 1.47, |
|
"learning_rate": 1.8483297068987584e-06, |
|
"loss": 0.0002, |
|
"step": 23000 |
|
}, |
|
{ |
|
"epoch": 1.47, |
|
"eval_avg_sts": 0.8250123369922542, |
|
"eval_sickr_spearman": 0.7931228324994128, |
|
"eval_stsb_spearman": 0.8569018414850956, |
|
"step": 23000 |
|
}, |
|
{ |
|
"epoch": 1.48, |
|
"eval_avg_sts": 0.8254867372327745, |
|
"eval_sickr_spearman": 0.7938168819151935, |
|
"eval_stsb_spearman": 0.8571565925503556, |
|
"step": 23125 |
|
}, |
|
{ |
|
"epoch": 1.49, |
|
"eval_avg_sts": 0.8256499116596692, |
|
"eval_sickr_spearman": 0.7939716381240272, |
|
"eval_stsb_spearman": 0.8573281851953113, |
|
"step": 23250 |
|
}, |
|
{ |
|
"epoch": 1.5, |
|
"eval_avg_sts": 0.8258346679802114, |
|
"eval_sickr_spearman": 0.7940527146232547, |
|
"eval_stsb_spearman": 0.8576166213371682, |
|
"step": 23375 |
|
}, |
|
{ |
|
"epoch": 1.5, |
|
"learning_rate": 1.7363368744400357e-06, |
|
"loss": 0.0001, |
|
"step": 23500 |
|
}, |
|
{ |
|
"epoch": 1.5, |
|
"eval_avg_sts": 0.825945269207895, |
|
"eval_sickr_spearman": 0.7943781253354978, |
|
"eval_stsb_spearman": 0.8575124130802922, |
|
"step": 23500 |
|
}, |
|
{ |
|
"epoch": 1.51, |
|
"eval_avg_sts": 0.8258713568091718, |
|
"eval_sickr_spearman": 0.794315540810324, |
|
"eval_stsb_spearman": 0.8574271728080196, |
|
"step": 23625 |
|
}, |
|
{ |
|
"epoch": 1.52, |
|
"eval_avg_sts": 0.8258355435328646, |
|
"eval_sickr_spearman": 0.7940151062708286, |
|
"eval_stsb_spearman": 0.8576559807949005, |
|
"step": 23750 |
|
}, |
|
{ |
|
"epoch": 1.53, |
|
"eval_avg_sts": 0.8257865803230886, |
|
"eval_sickr_spearman": 0.7940416194388225, |
|
"eval_stsb_spearman": 0.8575315412073548, |
|
"step": 23875 |
|
}, |
|
{ |
|
"epoch": 1.54, |
|
"learning_rate": 1.6243440419813131e-06, |
|
"loss": 0.0002, |
|
"step": 24000 |
|
}, |
|
{ |
|
"epoch": 1.54, |
|
"eval_avg_sts": 0.8258057571249391, |
|
"eval_sickr_spearman": 0.7941539161539849, |
|
"eval_stsb_spearman": 0.8574575980958933, |
|
"step": 24000 |
|
}, |
|
{ |
|
"epoch": 1.54, |
|
"eval_avg_sts": 0.8258599414659757, |
|
"eval_sickr_spearman": 0.7942335517201692, |
|
"eval_stsb_spearman": 0.8574863312117823, |
|
"step": 24125 |
|
}, |
|
{ |
|
"epoch": 1.55, |
|
"eval_avg_sts": 0.8259837419138151, |
|
"eval_sickr_spearman": 0.7943245706573944, |
|
"eval_stsb_spearman": 0.8576429131702358, |
|
"step": 24250 |
|
}, |
|
{ |
|
"epoch": 1.56, |
|
"eval_avg_sts": 0.8273046944370666, |
|
"eval_sickr_spearman": 0.7953777005875265, |
|
"eval_stsb_spearman": 0.8592316882866066, |
|
"step": 24375 |
|
}, |
|
{ |
|
"epoch": 1.57, |
|
"learning_rate": 1.5123512095225906e-06, |
|
"loss": 0.0001, |
|
"step": 24500 |
|
}, |
|
{ |
|
"epoch": 1.57, |
|
"eval_avg_sts": 0.8270336322444836, |
|
"eval_sickr_spearman": 0.7948833644915253, |
|
"eval_stsb_spearman": 0.8591838999974419, |
|
"step": 24500 |
|
}, |
|
{ |
|
"epoch": 1.58, |
|
"eval_avg_sts": 0.8268251999183458, |
|
"eval_sickr_spearman": 0.7944777418398805, |
|
"eval_stsb_spearman": 0.8591726579968111, |
|
"step": 24625 |
|
}, |
|
{ |
|
"epoch": 1.58, |
|
"eval_avg_sts": 0.8267020534374147, |
|
"eval_sickr_spearman": 0.7943936393812624, |
|
"eval_stsb_spearman": 0.8590104674935669, |
|
"step": 24750 |
|
}, |
|
{ |
|
"epoch": 1.59, |
|
"eval_avg_sts": 0.825917107993902, |
|
"eval_sickr_spearman": 0.7938579965380246, |
|
"eval_stsb_spearman": 0.8579762194497796, |
|
"step": 24875 |
|
}, |
|
{ |
|
"epoch": 1.6, |
|
"learning_rate": 1.4003583770638678e-06, |
|
"loss": 0.0002, |
|
"step": 25000 |
|
}, |
|
{ |
|
"epoch": 1.6, |
|
"eval_avg_sts": 0.8263527703022291, |
|
"eval_sickr_spearman": 0.7941290360434399, |
|
"eval_stsb_spearman": 0.8585765045610182, |
|
"step": 25000 |
|
}, |
|
{ |
|
"epoch": 1.61, |
|
"eval_avg_sts": 0.8269584920385149, |
|
"eval_sickr_spearman": 0.7941601601971716, |
|
"eval_stsb_spearman": 0.8597568238798581, |
|
"step": 25125 |
|
}, |
|
{ |
|
"epoch": 1.62, |
|
"eval_avg_sts": 0.8264998215853827, |
|
"eval_sickr_spearman": 0.7927663936956405, |
|
"eval_stsb_spearman": 0.8602332494751249, |
|
"step": 25250 |
|
}, |
|
{ |
|
"epoch": 1.62, |
|
"eval_avg_sts": 0.825942745088348, |
|
"eval_sickr_spearman": 0.7922521246925426, |
|
"eval_stsb_spearman": 0.8596333654841534, |
|
"step": 25375 |
|
}, |
|
{ |
|
"epoch": 1.63, |
|
"learning_rate": 1.2883655446051453e-06, |
|
"loss": 0.0001, |
|
"step": 25500 |
|
}, |
|
{ |
|
"epoch": 1.63, |
|
"eval_avg_sts": 0.8259010696773026, |
|
"eval_sickr_spearman": 0.7922646127789166, |
|
"eval_stsb_spearman": 0.8595375265756887, |
|
"step": 25500 |
|
}, |
|
{ |
|
"epoch": 1.64, |
|
"eval_avg_sts": 0.8259285307896478, |
|
"eval_sickr_spearman": 0.7926812825838921, |
|
"eval_stsb_spearman": 0.8591757789954035, |
|
"step": 25625 |
|
}, |
|
{ |
|
"epoch": 1.65, |
|
"eval_avg_sts": 0.8258391793675839, |
|
"eval_sickr_spearman": 0.7926954517588166, |
|
"eval_stsb_spearman": 0.858982906976351, |
|
"step": 25750 |
|
}, |
|
{ |
|
"epoch": 1.66, |
|
"eval_avg_sts": 0.8258409312899861, |
|
"eval_sickr_spearman": 0.7928338293620596, |
|
"eval_stsb_spearman": 0.8588480332179126, |
|
"step": 25875 |
|
}, |
|
{ |
|
"epoch": 1.66, |
|
"learning_rate": 1.1763727121464225e-06, |
|
"loss": 0.0001, |
|
"step": 26000 |
|
}, |
|
{ |
|
"epoch": 1.66, |
|
"eval_avg_sts": 0.8251984305884675, |
|
"eval_sickr_spearman": 0.7933060231202977, |
|
"eval_stsb_spearman": 0.8570908380566373, |
|
"step": 26000 |
|
}, |
|
{ |
|
"epoch": 1.67, |
|
"eval_avg_sts": 0.8253196217152283, |
|
"eval_sickr_spearman": 0.7932125065657978, |
|
"eval_stsb_spearman": 0.8574267368646588, |
|
"step": 26125 |
|
}, |
|
{ |
|
"epoch": 1.68, |
|
"eval_avg_sts": 0.8253745698430313, |
|
"eval_sickr_spearman": 0.7933913263564519, |
|
"eval_stsb_spearman": 0.8573578133296105, |
|
"step": 26250 |
|
}, |
|
{ |
|
"epoch": 1.69, |
|
"eval_avg_sts": 0.825411316540875, |
|
"eval_sickr_spearman": 0.7934114513879544, |
|
"eval_stsb_spearman": 0.8574111816937955, |
|
"step": 26375 |
|
}, |
|
{ |
|
"epoch": 1.7, |
|
"learning_rate": 1.0643798796877e-06, |
|
"loss": 0.0001, |
|
"step": 26500 |
|
}, |
|
{ |
|
"epoch": 1.7, |
|
"eval_avg_sts": 0.8249370852399975, |
|
"eval_sickr_spearman": 0.7937128945805799, |
|
"eval_stsb_spearman": 0.8561612758994152, |
|
"step": 26500 |
|
}, |
|
{ |
|
"epoch": 1.7, |
|
"eval_avg_sts": 0.825459765367129, |
|
"eval_sickr_spearman": 0.7933420944774778, |
|
"eval_stsb_spearman": 0.8575774362567802, |
|
"step": 26625 |
|
}, |
|
{ |
|
"epoch": 1.71, |
|
"eval_avg_sts": 0.826427995376563, |
|
"eval_sickr_spearman": 0.7947685701590883, |
|
"eval_stsb_spearman": 0.8580874205940376, |
|
"step": 26750 |
|
}, |
|
{ |
|
"epoch": 1.72, |
|
"eval_avg_sts": 0.8258856380174763, |
|
"eval_sickr_spearman": 0.7942930142237495, |
|
"eval_stsb_spearman": 0.857478261811203, |
|
"step": 26875 |
|
}, |
|
{ |
|
"epoch": 1.73, |
|
"learning_rate": 9.523870472289774e-07, |
|
"loss": 0.0002, |
|
"step": 27000 |
|
}, |
|
{ |
|
"epoch": 1.73, |
|
"eval_avg_sts": 0.8258593024414255, |
|
"eval_sickr_spearman": 0.7941693821686479, |
|
"eval_stsb_spearman": 0.8575492227142031, |
|
"step": 27000 |
|
}, |
|
{ |
|
"epoch": 1.74, |
|
"eval_avg_sts": 0.8258720619743833, |
|
"eval_sickr_spearman": 0.7941788923267327, |
|
"eval_stsb_spearman": 0.857565231622034, |
|
"step": 27125 |
|
}, |
|
{ |
|
"epoch": 1.74, |
|
"eval_avg_sts": 0.8259531389747516, |
|
"eval_sickr_spearman": 0.7941532917496662, |
|
"eval_stsb_spearman": 0.8577529861998372, |
|
"step": 27250 |
|
}, |
|
{ |
|
"epoch": 1.75, |
|
"eval_avg_sts": 0.825969657799255, |
|
"eval_sickr_spearman": 0.7942109771024933, |
|
"eval_stsb_spearman": 0.8577283384960166, |
|
"step": 27375 |
|
}, |
|
{ |
|
"epoch": 1.76, |
|
"learning_rate": 8.403942147702547e-07, |
|
"loss": 0.0002, |
|
"step": 27500 |
|
}, |
|
{ |
|
"epoch": 1.76, |
|
"eval_avg_sts": 0.8259987251545413, |
|
"eval_sickr_spearman": 0.7943161171835413, |
|
"eval_stsb_spearman": 0.8576813331255413, |
|
"step": 27500 |
|
}, |
|
{ |
|
"epoch": 1.77, |
|
"eval_avg_sts": 0.8252131722274082, |
|
"eval_sickr_spearman": 0.793231382788663, |
|
"eval_stsb_spearman": 0.8571949616661534, |
|
"step": 27625 |
|
}, |
|
{ |
|
"epoch": 1.78, |
|
"eval_avg_sts": 0.8252604604270115, |
|
"eval_sickr_spearman": 0.7933024207876899, |
|
"eval_stsb_spearman": 0.857218500066333, |
|
"step": 27750 |
|
}, |
|
{ |
|
"epoch": 1.78, |
|
"eval_avg_sts": 0.8251969961170478, |
|
"eval_sickr_spearman": 0.793198385421975, |
|
"eval_stsb_spearman": 0.8571956068121205, |
|
"step": 27875 |
|
}, |
|
{ |
|
"epoch": 1.79, |
|
"learning_rate": 7.284013823115321e-07, |
|
"loss": 0.0002, |
|
"step": 28000 |
|
}, |
|
{ |
|
"epoch": 1.79, |
|
"eval_avg_sts": 0.825311717070901, |
|
"eval_sickr_spearman": 0.7931744179023573, |
|
"eval_stsb_spearman": 0.8574490162394447, |
|
"step": 28000 |
|
}, |
|
{ |
|
"epoch": 1.8, |
|
"eval_avg_sts": 0.8256482381761492, |
|
"eval_sickr_spearman": 0.7934648139416521, |
|
"eval_stsb_spearman": 0.8578316624106462, |
|
"step": 28125 |
|
}, |
|
{ |
|
"epoch": 1.81, |
|
"eval_avg_sts": 0.8261129479959839, |
|
"eval_sickr_spearman": 0.7939418588411357, |
|
"eval_stsb_spearman": 0.858284037150832, |
|
"step": 28250 |
|
}, |
|
{ |
|
"epoch": 1.82, |
|
"eval_avg_sts": 0.8262712326490254, |
|
"eval_sickr_spearman": 0.7933230261302068, |
|
"eval_stsb_spearman": 0.8592194391678438, |
|
"step": 28375 |
|
}, |
|
{ |
|
"epoch": 1.82, |
|
"learning_rate": 6.164085498528094e-07, |
|
"loss": 0.0002, |
|
"step": 28500 |
|
}, |
|
{ |
|
"epoch": 1.82, |
|
"eval_avg_sts": 0.8262943695062834, |
|
"eval_sickr_spearman": 0.7934199048618075, |
|
"eval_stsb_spearman": 0.8591688341507593, |
|
"step": 28500 |
|
}, |
|
{ |
|
"epoch": 1.83, |
|
"eval_avg_sts": 0.8260598340905722, |
|
"eval_sickr_spearman": 0.7933951208134654, |
|
"eval_stsb_spearman": 0.8587245473676789, |
|
"step": 28625 |
|
}, |
|
{ |
|
"epoch": 1.84, |
|
"eval_avg_sts": 0.8259360112469695, |
|
"eval_sickr_spearman": 0.7933420944774778, |
|
"eval_stsb_spearman": 0.8585299280164611, |
|
"step": 28750 |
|
}, |
|
{ |
|
"epoch": 1.85, |
|
"eval_avg_sts": 0.8258330858999741, |
|
"eval_sickr_spearman": 0.7933054467470805, |
|
"eval_stsb_spearman": 0.8583607250528676, |
|
"step": 28875 |
|
}, |
|
{ |
|
"epoch": 1.86, |
|
"learning_rate": 5.044157173940868e-07, |
|
"loss": 0.0001, |
|
"step": 29000 |
|
}, |
|
{ |
|
"epoch": 1.86, |
|
"eval_avg_sts": 0.8258376969438936, |
|
"eval_sickr_spearman": 0.7933141884075422, |
|
"eval_stsb_spearman": 0.8583612054802452, |
|
"step": 29000 |
|
}, |
|
{ |
|
"epoch": 1.86, |
|
"eval_avg_sts": 0.8259136180644091, |
|
"eval_sickr_spearman": 0.7933194718287004, |
|
"eval_stsb_spearman": 0.8585077643001178, |
|
"step": 29125 |
|
}, |
|
{ |
|
"epoch": 1.87, |
|
"eval_avg_sts": 0.825910175107258, |
|
"eval_sickr_spearman": 0.7933039097518345, |
|
"eval_stsb_spearman": 0.8585164404626813, |
|
"step": 29250 |
|
}, |
|
{ |
|
"epoch": 1.88, |
|
"eval_avg_sts": 0.8258308833879402, |
|
"eval_sickr_spearman": 0.7933173584602371, |
|
"eval_stsb_spearman": 0.8583444083156432, |
|
"step": 29375 |
|
}, |
|
{ |
|
"epoch": 1.89, |
|
"learning_rate": 3.9242288493536413e-07, |
|
"loss": 0.0001, |
|
"step": 29500 |
|
}, |
|
{ |
|
"epoch": 1.89, |
|
"eval_avg_sts": 0.8257221328599513, |
|
"eval_sickr_spearman": 0.7931374819853514, |
|
"eval_stsb_spearman": 0.8583067837345514, |
|
"step": 29500 |
|
}, |
|
{ |
|
"epoch": 1.9, |
|
"eval_avg_sts": 0.825786763719202, |
|
"eval_sickr_spearman": 0.7932694234210019, |
|
"eval_stsb_spearman": 0.858304104017402, |
|
"step": 29625 |
|
}, |
|
{ |
|
"epoch": 1.9, |
|
"eval_avg_sts": 0.8257681951340192, |
|
"eval_sickr_spearman": 0.7932804705743327, |
|
"eval_stsb_spearman": 0.8582559196937056, |
|
"step": 29750 |
|
}, |
|
{ |
|
"epoch": 1.91, |
|
"eval_avg_sts": 0.8258082608558808, |
|
"eval_sickr_spearman": 0.7933519408532725, |
|
"eval_stsb_spearman": 0.8582645808584891, |
|
"step": 29875 |
|
}, |
|
{ |
|
"epoch": 1.92, |
|
"learning_rate": 2.804300524766415e-07, |
|
"loss": 0.0001, |
|
"step": 30000 |
|
}, |
|
{ |
|
"epoch": 1.92, |
|
"eval_avg_sts": 0.8258262861889483, |
|
"eval_sickr_spearman": 0.7933999719547107, |
|
"eval_stsb_spearman": 0.8582526004231857, |
|
"step": 30000 |
|
}, |
|
{ |
|
"epoch": 1.93, |
|
"eval_avg_sts": 0.8256086631585, |
|
"eval_sickr_spearman": 0.7930556369885008, |
|
"eval_stsb_spearman": 0.8581616893284993, |
|
"step": 30125 |
|
}, |
|
{ |
|
"epoch": 1.94, |
|
"eval_avg_sts": 0.8256480515518101, |
|
"eval_sickr_spearman": 0.7931325828130048, |
|
"eval_stsb_spearman": 0.8581635202906153, |
|
"step": 30250 |
|
}, |
|
{ |
|
"epoch": 1.94, |
|
"eval_avg_sts": 0.8258219208455879, |
|
"eval_sickr_spearman": 0.7934267252782117, |
|
"eval_stsb_spearman": 0.8582171164129642, |
|
"step": 30375 |
|
}, |
|
{ |
|
"epoch": 1.95, |
|
"learning_rate": 1.6843722001791884e-07, |
|
"loss": 0.0002, |
|
"step": 30500 |
|
}, |
|
{ |
|
"epoch": 1.95, |
|
"eval_avg_sts": 0.8258322719939588, |
|
"eval_sickr_spearman": 0.7934731233222009, |
|
"eval_stsb_spearman": 0.8581914206657169, |
|
"step": 30500 |
|
}, |
|
{ |
|
"epoch": 1.96, |
|
"eval_avg_sts": 0.8258242424865203, |
|
"eval_sickr_spearman": 0.7934302315486167, |
|
"eval_stsb_spearman": 0.858218253424424, |
|
"step": 30625 |
|
}, |
|
{ |
|
"epoch": 1.97, |
|
"eval_avg_sts": 0.8258248316168127, |
|
"eval_sickr_spearman": 0.7934435841948165, |
|
"eval_stsb_spearman": 0.858206079038809, |
|
"step": 30750 |
|
}, |
|
{ |
|
"epoch": 1.98, |
|
"eval_avg_sts": 0.8257922895919085, |
|
"eval_sickr_spearman": 0.7933790303944838, |
|
"eval_stsb_spearman": 0.8582055487893332, |
|
"step": 30875 |
|
}, |
|
{ |
|
"epoch": 1.98, |
|
"learning_rate": 5.64443875591962e-08, |
|
"loss": 0.0001, |
|
"step": 31000 |
|
}, |
|
{ |
|
"epoch": 1.98, |
|
"eval_avg_sts": 0.8257897415072173, |
|
"eval_sickr_spearman": 0.7933720178536738, |
|
"eval_stsb_spearman": 0.8582074651607609, |
|
"step": 31000 |
|
}, |
|
{ |
|
"epoch": 1.99, |
|
"eval_avg_sts": 0.8257977713308224, |
|
"eval_sickr_spearman": 0.7933829209137002, |
|
"eval_stsb_spearman": 0.8582126217479447, |
|
"step": 31125 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_avg_sts": 0.8258126560134551, |
|
"eval_sickr_spearman": 0.7934017010743625, |
|
"eval_stsb_spearman": 0.8582236109525477, |
|
"step": 31250 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"step": 31252, |
|
"train_runtime": 21163.9877, |
|
"train_samples_per_second": 1.477 |
|
} |
|
], |
|
"max_steps": 31252, |
|
"num_train_epochs": 2, |
|
"total_flos": 776159526314354880, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|