|
{ |
|
"best_metric": 0.624123043712898, |
|
"best_model_checkpoint": "/tmp/test-ner1_/checkpoint-52109", |
|
"epoch": 120.0, |
|
"global_step": 58440, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.741183488427583, |
|
"eval_f1": 0.46964064436183395, |
|
"eval_loss": 0.8133957386016846, |
|
"eval_precision": 0.4221430162619737, |
|
"eval_recall": 0.5291817927953085, |
|
"eval_runtime": 2.7713, |
|
"eval_samples_per_second": 401.25, |
|
"eval_steps_per_second": 25.259, |
|
"step": 487 |
|
}, |
|
{ |
|
"epoch": 1.03, |
|
"learning_rate": 2.9743326488706367e-05, |
|
"loss": 1.0691, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.7599856836077309, |
|
"eval_f1": 0.5087176950661556, |
|
"eval_loss": 0.7439278960227966, |
|
"eval_precision": 0.4565024411895251, |
|
"eval_recall": 0.5744205529181793, |
|
"eval_runtime": 2.7397, |
|
"eval_samples_per_second": 405.878, |
|
"eval_steps_per_second": 25.55, |
|
"step": 974 |
|
}, |
|
{ |
|
"epoch": 2.05, |
|
"learning_rate": 2.9486652977412733e-05, |
|
"loss": 0.6796, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.7499642090193271, |
|
"eval_f1": 0.5268402042595591, |
|
"eval_loss": 0.8020838499069214, |
|
"eval_precision": 0.4754946043165468, |
|
"eval_recall": 0.5906171460485897, |
|
"eval_runtime": 2.7638, |
|
"eval_samples_per_second": 402.346, |
|
"eval_steps_per_second": 25.328, |
|
"step": 1461 |
|
}, |
|
{ |
|
"epoch": 3.08, |
|
"learning_rate": 2.9229979466119096e-05, |
|
"loss": 0.5266, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.7569315199236459, |
|
"eval_f1": 0.5452078450721599, |
|
"eval_loss": 0.826590895652771, |
|
"eval_precision": 0.4882898806893504, |
|
"eval_recall": 0.6171460485897794, |
|
"eval_runtime": 2.7581, |
|
"eval_samples_per_second": 403.178, |
|
"eval_steps_per_second": 25.38, |
|
"step": 1948 |
|
}, |
|
{ |
|
"epoch": 4.11, |
|
"learning_rate": 2.8973305954825462e-05, |
|
"loss": 0.4087, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.7584347411119065, |
|
"eval_f1": 0.5577331169641744, |
|
"eval_loss": 0.8819655776023865, |
|
"eval_precision": 0.5042889390519187, |
|
"eval_recall": 0.623848087126501, |
|
"eval_runtime": 2.7608, |
|
"eval_samples_per_second": 402.775, |
|
"eval_steps_per_second": 25.355, |
|
"step": 2435 |
|
}, |
|
{ |
|
"epoch": 5.13, |
|
"learning_rate": 2.8716632443531828e-05, |
|
"loss": 0.314, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.7587687902648532, |
|
"eval_f1": 0.5619107479572597, |
|
"eval_loss": 0.8884239196777344, |
|
"eval_precision": 0.5109739368998628, |
|
"eval_recall": 0.6241273387321977, |
|
"eval_runtime": 2.7416, |
|
"eval_samples_per_second": 405.6, |
|
"eval_steps_per_second": 25.532, |
|
"step": 2922 |
|
}, |
|
{ |
|
"epoch": 6.16, |
|
"learning_rate": 2.8459958932238194e-05, |
|
"loss": 0.254, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.7592937246480553, |
|
"eval_f1": 0.5628216392619556, |
|
"eval_loss": 0.9709771275520325, |
|
"eval_precision": 0.511171910624715, |
|
"eval_recall": 0.6260820999720749, |
|
"eval_runtime": 2.7411, |
|
"eval_samples_per_second": 405.673, |
|
"eval_steps_per_second": 25.537, |
|
"step": 3409 |
|
}, |
|
{ |
|
"epoch": 7.19, |
|
"learning_rate": 2.8203285420944557e-05, |
|
"loss": 0.2096, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.7622285850632308, |
|
"eval_f1": 0.5648183075568968, |
|
"eval_loss": 1.0743454694747925, |
|
"eval_precision": 0.5137236962488564, |
|
"eval_recall": 0.6271991063948618, |
|
"eval_runtime": 2.7561, |
|
"eval_samples_per_second": 403.467, |
|
"eval_steps_per_second": 25.398, |
|
"step": 3896 |
|
}, |
|
{ |
|
"epoch": 8.21, |
|
"learning_rate": 2.7946611909650923e-05, |
|
"loss": 0.1786, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.7570985445001193, |
|
"eval_f1": 0.5668016194331984, |
|
"eval_loss": 1.1285585165023804, |
|
"eval_precision": 0.5181586860976174, |
|
"eval_recall": 0.6255235967606814, |
|
"eval_runtime": 2.7449, |
|
"eval_samples_per_second": 405.112, |
|
"eval_steps_per_second": 25.502, |
|
"step": 4383 |
|
}, |
|
{ |
|
"epoch": 9.24, |
|
"learning_rate": 2.7689938398357292e-05, |
|
"loss": 0.1486, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.7544738725841088, |
|
"eval_f1": 0.5723700887198986, |
|
"eval_loss": 1.1630432605743408, |
|
"eval_precision": 0.5240194940821536, |
|
"eval_recall": 0.6305501256632225, |
|
"eval_runtime": 2.8838, |
|
"eval_samples_per_second": 385.605, |
|
"eval_steps_per_second": 24.274, |
|
"step": 4870 |
|
}, |
|
{ |
|
"epoch": 10.27, |
|
"learning_rate": 2.743326488706366e-05, |
|
"loss": 0.132, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_accuracy": 0.7605821999522787, |
|
"eval_f1": 0.5760409993593851, |
|
"eval_loss": 1.1933799982070923, |
|
"eval_precision": 0.5321969696969697, |
|
"eval_recall": 0.6277576096062553, |
|
"eval_runtime": 2.7538, |
|
"eval_samples_per_second": 403.799, |
|
"eval_steps_per_second": 25.419, |
|
"step": 5357 |
|
}, |
|
{ |
|
"epoch": 11.29, |
|
"learning_rate": 2.717659137577002e-05, |
|
"loss": 0.1098, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_accuracy": 0.760200429491768, |
|
"eval_f1": 0.5755844155844156, |
|
"eval_loss": 1.1861658096313477, |
|
"eval_precision": 0.5379946588977907, |
|
"eval_recall": 0.6188215582239598, |
|
"eval_runtime": 2.7422, |
|
"eval_samples_per_second": 405.52, |
|
"eval_steps_per_second": 25.527, |
|
"step": 5844 |
|
}, |
|
{ |
|
"epoch": 12.32, |
|
"learning_rate": 2.6919917864476387e-05, |
|
"loss": 0.094, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_accuracy": 0.7506084466714388, |
|
"eval_f1": 0.5764092123679858, |
|
"eval_loss": 1.3724055290222168, |
|
"eval_precision": 0.52945301542777, |
|
"eval_recall": 0.6325048869030997, |
|
"eval_runtime": 2.7524, |
|
"eval_samples_per_second": 404.018, |
|
"eval_steps_per_second": 25.433, |
|
"step": 6331 |
|
}, |
|
{ |
|
"epoch": 13.35, |
|
"learning_rate": 2.6663244353182754e-05, |
|
"loss": 0.084, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_accuracy": 0.7531615366261035, |
|
"eval_f1": 0.574173712528824, |
|
"eval_loss": 1.374582290649414, |
|
"eval_precision": 0.530414201183432, |
|
"eval_recall": 0.6258028483663781, |
|
"eval_runtime": 2.7617, |
|
"eval_samples_per_second": 402.648, |
|
"eval_steps_per_second": 25.347, |
|
"step": 6818 |
|
}, |
|
{ |
|
"epoch": 14.37, |
|
"learning_rate": 2.640657084188912e-05, |
|
"loss": 0.0758, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_accuracy": 0.7581245526127416, |
|
"eval_f1": 0.5684922922672014, |
|
"eval_loss": 1.3000197410583496, |
|
"eval_precision": 0.5156889495225102, |
|
"eval_recall": 0.6333426417201898, |
|
"eval_runtime": 2.7658, |
|
"eval_samples_per_second": 402.06, |
|
"eval_steps_per_second": 25.31, |
|
"step": 7305 |
|
}, |
|
{ |
|
"epoch": 15.4, |
|
"learning_rate": 2.6149897330595482e-05, |
|
"loss": 0.0694, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_accuracy": 0.7593175853018372, |
|
"eval_f1": 0.5867220995192932, |
|
"eval_loss": 1.4194592237472534, |
|
"eval_precision": 0.5485908649173955, |
|
"eval_recall": 0.6305501256632225, |
|
"eval_runtime": 2.7493, |
|
"eval_samples_per_second": 404.466, |
|
"eval_steps_per_second": 25.461, |
|
"step": 7792 |
|
}, |
|
{ |
|
"epoch": 16.43, |
|
"learning_rate": 2.589322381930185e-05, |
|
"loss": 0.062, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_accuracy": 0.7465521355285135, |
|
"eval_f1": 0.5717906475731847, |
|
"eval_loss": 1.4974385499954224, |
|
"eval_precision": 0.5234338747099768, |
|
"eval_recall": 0.629991622451829, |
|
"eval_runtime": 2.7551, |
|
"eval_samples_per_second": 403.608, |
|
"eval_steps_per_second": 25.407, |
|
"step": 8279 |
|
}, |
|
{ |
|
"epoch": 17.45, |
|
"learning_rate": 2.5636550308008215e-05, |
|
"loss": 0.0543, |
|
"step": 8500 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_accuracy": 0.7567644953471725, |
|
"eval_f1": 0.5741626794258373, |
|
"eval_loss": 1.5013597011566162, |
|
"eval_precision": 0.5346820809248555, |
|
"eval_recall": 0.6199385646467467, |
|
"eval_runtime": 2.7536, |
|
"eval_samples_per_second": 403.832, |
|
"eval_steps_per_second": 25.421, |
|
"step": 8766 |
|
}, |
|
{ |
|
"epoch": 18.48, |
|
"learning_rate": 2.537987679671458e-05, |
|
"loss": 0.0471, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_accuracy": 0.7546408971605822, |
|
"eval_f1": 0.5768982020437201, |
|
"eval_loss": 1.5164920091629028, |
|
"eval_precision": 0.5373493975903615, |
|
"eval_recall": 0.6227310807037141, |
|
"eval_runtime": 2.7556, |
|
"eval_samples_per_second": 403.547, |
|
"eval_steps_per_second": 25.403, |
|
"step": 9253 |
|
}, |
|
{ |
|
"epoch": 19.51, |
|
"learning_rate": 2.5123203285420943e-05, |
|
"loss": 0.0449, |
|
"step": 9500 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_accuracy": 0.7568122166547363, |
|
"eval_f1": 0.5733962504782553, |
|
"eval_loss": 1.5718824863433838, |
|
"eval_precision": 0.5276995305164319, |
|
"eval_recall": 0.6277576096062553, |
|
"eval_runtime": 2.7667, |
|
"eval_samples_per_second": 401.921, |
|
"eval_steps_per_second": 25.301, |
|
"step": 9740 |
|
}, |
|
{ |
|
"epoch": 20.53, |
|
"learning_rate": 2.486652977412731e-05, |
|
"loss": 0.0451, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_accuracy": 0.7607253638749701, |
|
"eval_f1": 0.5917858548746885, |
|
"eval_loss": 1.5306912660598755, |
|
"eval_precision": 0.5581683168316832, |
|
"eval_recall": 0.6297123708461324, |
|
"eval_runtime": 2.7618, |
|
"eval_samples_per_second": 402.633, |
|
"eval_steps_per_second": 25.346, |
|
"step": 10227 |
|
}, |
|
{ |
|
"epoch": 21.56, |
|
"learning_rate": 2.4609856262833676e-05, |
|
"loss": 0.039, |
|
"step": 10500 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_accuracy": 0.7572417084228108, |
|
"eval_f1": 0.5844206174912802, |
|
"eval_loss": 1.5783377885818481, |
|
"eval_precision": 0.54375, |
|
"eval_recall": 0.6316671320860094, |
|
"eval_runtime": 2.7632, |
|
"eval_samples_per_second": 402.427, |
|
"eval_steps_per_second": 25.333, |
|
"step": 10714 |
|
}, |
|
{ |
|
"epoch": 22.59, |
|
"learning_rate": 2.4353182751540042e-05, |
|
"loss": 0.0363, |
|
"step": 11000 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_accuracy": 0.7541875447387258, |
|
"eval_f1": 0.5802802416763081, |
|
"eval_loss": 1.6342318058013916, |
|
"eval_precision": 0.5376369699857074, |
|
"eval_recall": 0.6302708740575258, |
|
"eval_runtime": 2.7447, |
|
"eval_samples_per_second": 405.151, |
|
"eval_steps_per_second": 25.504, |
|
"step": 11201 |
|
}, |
|
{ |
|
"epoch": 23.61, |
|
"learning_rate": 2.4096509240246405e-05, |
|
"loss": 0.0326, |
|
"step": 11500 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_accuracy": 0.7596993557623479, |
|
"eval_f1": 0.5911304118963022, |
|
"eval_loss": 1.641722321510315, |
|
"eval_precision": 0.5589845694375312, |
|
"eval_recall": 0.6271991063948618, |
|
"eval_runtime": 2.7546, |
|
"eval_samples_per_second": 403.689, |
|
"eval_steps_per_second": 25.412, |
|
"step": 11688 |
|
}, |
|
{ |
|
"epoch": 24.64, |
|
"learning_rate": 2.383983572895277e-05, |
|
"loss": 0.0296, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_accuracy": 0.7586733476497256, |
|
"eval_f1": 0.5861406430126809, |
|
"eval_loss": 1.6684845685958862, |
|
"eval_precision": 0.5414103170847137, |
|
"eval_recall": 0.6389276738341245, |
|
"eval_runtime": 2.8726, |
|
"eval_samples_per_second": 387.108, |
|
"eval_steps_per_second": 24.368, |
|
"step": 12175 |
|
}, |
|
{ |
|
"epoch": 25.67, |
|
"learning_rate": 2.3583162217659137e-05, |
|
"loss": 0.0283, |
|
"step": 12500 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_accuracy": 0.760200429491768, |
|
"eval_f1": 0.5926797385620914, |
|
"eval_loss": 1.7346807718276978, |
|
"eval_precision": 0.5571393462767265, |
|
"eval_recall": 0.6330633901144932, |
|
"eval_runtime": 2.7525, |
|
"eval_samples_per_second": 404.0, |
|
"eval_steps_per_second": 25.432, |
|
"step": 12662 |
|
}, |
|
{ |
|
"epoch": 26.69, |
|
"learning_rate": 2.3326488706365506e-05, |
|
"loss": 0.0277, |
|
"step": 13000 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_accuracy": 0.7632068718682892, |
|
"eval_f1": 0.6025674613570867, |
|
"eval_loss": 1.6559849977493286, |
|
"eval_precision": 0.5674808783617074, |
|
"eval_recall": 0.6422786931024853, |
|
"eval_runtime": 2.7331, |
|
"eval_samples_per_second": 406.857, |
|
"eval_steps_per_second": 25.612, |
|
"step": 13149 |
|
}, |
|
{ |
|
"epoch": 27.72, |
|
"learning_rate": 2.306981519507187e-05, |
|
"loss": 0.025, |
|
"step": 13500 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_accuracy": 0.7613934621808638, |
|
"eval_f1": 0.6024861147844485, |
|
"eval_loss": 1.7496830224990845, |
|
"eval_precision": 0.5722180356694297, |
|
"eval_recall": 0.6361351577771572, |
|
"eval_runtime": 2.7227, |
|
"eval_samples_per_second": 408.425, |
|
"eval_steps_per_second": 25.71, |
|
"step": 13636 |
|
}, |
|
{ |
|
"epoch": 28.75, |
|
"learning_rate": 2.2813141683778235e-05, |
|
"loss": 0.0241, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_accuracy": 0.7637795275590551, |
|
"eval_f1": 0.5988181221273802, |
|
"eval_loss": 1.710971474647522, |
|
"eval_precision": 0.5651958353991076, |
|
"eval_recall": 0.6366936609885507, |
|
"eval_runtime": 2.7599, |
|
"eval_samples_per_second": 402.917, |
|
"eval_steps_per_second": 25.363, |
|
"step": 14123 |
|
}, |
|
{ |
|
"epoch": 29.77, |
|
"learning_rate": 2.25564681724846e-05, |
|
"loss": 0.0242, |
|
"step": 14500 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_accuracy": 0.7647339537103317, |
|
"eval_f1": 0.5951438374241224, |
|
"eval_loss": 1.794677734375, |
|
"eval_precision": 0.5641731298473855, |
|
"eval_recall": 0.6297123708461324, |
|
"eval_runtime": 2.7628, |
|
"eval_samples_per_second": 402.492, |
|
"eval_steps_per_second": 25.337, |
|
"step": 14610 |
|
}, |
|
{ |
|
"epoch": 30.8, |
|
"learning_rate": 2.2299794661190967e-05, |
|
"loss": 0.0219, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_accuracy": 0.7565258888093533, |
|
"eval_f1": 0.592573084013695, |
|
"eval_loss": 1.8282643556594849, |
|
"eval_precision": 0.5606777971592325, |
|
"eval_recall": 0.6283161128176487, |
|
"eval_runtime": 2.7362, |
|
"eval_samples_per_second": 406.407, |
|
"eval_steps_per_second": 25.583, |
|
"step": 15097 |
|
}, |
|
{ |
|
"epoch": 31.83, |
|
"learning_rate": 2.204312114989733e-05, |
|
"loss": 0.0193, |
|
"step": 15500 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_accuracy": 0.7648293963254593, |
|
"eval_f1": 0.5969198088157196, |
|
"eval_loss": 1.8161470890045166, |
|
"eval_precision": 0.568969881042774, |
|
"eval_recall": 0.6277576096062553, |
|
"eval_runtime": 2.7545, |
|
"eval_samples_per_second": 403.709, |
|
"eval_steps_per_second": 25.413, |
|
"step": 15584 |
|
}, |
|
{ |
|
"epoch": 32.85, |
|
"learning_rate": 2.1786447638603696e-05, |
|
"loss": 0.0185, |
|
"step": 16000 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_accuracy": 0.7608685277976617, |
|
"eval_f1": 0.5930080876597965, |
|
"eval_loss": 1.846176028251648, |
|
"eval_precision": 0.5564259485924112, |
|
"eval_recall": 0.6347388997486736, |
|
"eval_runtime": 2.7276, |
|
"eval_samples_per_second": 407.69, |
|
"eval_steps_per_second": 25.664, |
|
"step": 16071 |
|
}, |
|
{ |
|
"epoch": 33.88, |
|
"learning_rate": 2.1529774127310062e-05, |
|
"loss": 0.0195, |
|
"step": 16500 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_accuracy": 0.755810069195896, |
|
"eval_f1": 0.5868997912317329, |
|
"eval_loss": 1.9018374681472778, |
|
"eval_precision": 0.5508204751408278, |
|
"eval_recall": 0.628036861211952, |
|
"eval_runtime": 2.7537, |
|
"eval_samples_per_second": 403.819, |
|
"eval_steps_per_second": 25.42, |
|
"step": 16558 |
|
}, |
|
{ |
|
"epoch": 34.91, |
|
"learning_rate": 2.127310061601643e-05, |
|
"loss": 0.0181, |
|
"step": 17000 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_accuracy": 0.7597470770699117, |
|
"eval_f1": 0.5975321606720924, |
|
"eval_loss": 1.8523436784744263, |
|
"eval_precision": 0.5637849888531088, |
|
"eval_recall": 0.6355766545657637, |
|
"eval_runtime": 2.7278, |
|
"eval_samples_per_second": 407.651, |
|
"eval_steps_per_second": 25.661, |
|
"step": 17045 |
|
}, |
|
{ |
|
"epoch": 35.93, |
|
"learning_rate": 2.1016427104722795e-05, |
|
"loss": 0.0182, |
|
"step": 17500 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_accuracy": 0.7611309949892627, |
|
"eval_f1": 0.6036228023441662, |
|
"eval_loss": 1.8343547582626343, |
|
"eval_precision": 0.5770308123249299, |
|
"eval_recall": 0.6327841385087964, |
|
"eval_runtime": 2.7612, |
|
"eval_samples_per_second": 402.717, |
|
"eval_steps_per_second": 25.351, |
|
"step": 17532 |
|
}, |
|
{ |
|
"epoch": 36.96, |
|
"learning_rate": 2.0759753593429157e-05, |
|
"loss": 0.0153, |
|
"step": 18000 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_accuracy": 0.7668814125507039, |
|
"eval_f1": 0.603166156711454, |
|
"eval_loss": 1.8464767932891846, |
|
"eval_precision": 0.5759654471544715, |
|
"eval_recall": 0.6330633901144932, |
|
"eval_runtime": 2.7392, |
|
"eval_samples_per_second": 405.958, |
|
"eval_steps_per_second": 25.555, |
|
"step": 18019 |
|
}, |
|
{ |
|
"epoch": 37.99, |
|
"learning_rate": 2.0503080082135523e-05, |
|
"loss": 0.0142, |
|
"step": 18500 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_accuracy": 0.7632068718682892, |
|
"eval_f1": 0.5945442448436461, |
|
"eval_loss": 1.8911150693893433, |
|
"eval_precision": 0.5678698525673614, |
|
"eval_recall": 0.623848087126501, |
|
"eval_runtime": 2.7453, |
|
"eval_samples_per_second": 405.06, |
|
"eval_steps_per_second": 25.498, |
|
"step": 18506 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_accuracy": 0.7622763063707946, |
|
"eval_f1": 0.6007257089100927, |
|
"eval_loss": 1.8849174976348877, |
|
"eval_precision": 0.5790155440414507, |
|
"eval_recall": 0.6241273387321977, |
|
"eval_runtime": 2.7696, |
|
"eval_samples_per_second": 401.495, |
|
"eval_steps_per_second": 25.274, |
|
"step": 18993 |
|
}, |
|
{ |
|
"epoch": 39.01, |
|
"learning_rate": 2.024640657084189e-05, |
|
"loss": 0.0151, |
|
"step": 19000 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_accuracy": 0.7665235027439752, |
|
"eval_f1": 0.5976520811099254, |
|
"eval_loss": 1.8399417400360107, |
|
"eval_precision": 0.5721583652618135, |
|
"eval_recall": 0.6255235967606814, |
|
"eval_runtime": 2.8345, |
|
"eval_samples_per_second": 392.315, |
|
"eval_steps_per_second": 24.696, |
|
"step": 19480 |
|
}, |
|
{ |
|
"epoch": 40.04, |
|
"learning_rate": 1.9989733059548256e-05, |
|
"loss": 0.0148, |
|
"step": 19500 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_accuracy": 0.7649248389405869, |
|
"eval_f1": 0.596647742633144, |
|
"eval_loss": 1.843032956123352, |
|
"eval_precision": 0.5782027770500393, |
|
"eval_recall": 0.6163082937726891, |
|
"eval_runtime": 2.7539, |
|
"eval_samples_per_second": 403.796, |
|
"eval_steps_per_second": 25.419, |
|
"step": 19967 |
|
}, |
|
{ |
|
"epoch": 41.07, |
|
"learning_rate": 1.973305954825462e-05, |
|
"loss": 0.0138, |
|
"step": 20000 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_accuracy": 0.7691481746599856, |
|
"eval_f1": 0.5887899423782085, |
|
"eval_loss": 1.8764090538024902, |
|
"eval_precision": 0.5543773119605425, |
|
"eval_recall": 0.6277576096062553, |
|
"eval_runtime": 2.7704, |
|
"eval_samples_per_second": 401.388, |
|
"eval_steps_per_second": 25.267, |
|
"step": 20454 |
|
}, |
|
{ |
|
"epoch": 42.09, |
|
"learning_rate": 1.9476386036960984e-05, |
|
"loss": 0.0147, |
|
"step": 20500 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_accuracy": 0.7666428060128847, |
|
"eval_f1": 0.6014559894109861, |
|
"eval_loss": 1.9270243644714355, |
|
"eval_precision": 0.571716155007549, |
|
"eval_recall": 0.6344596481429768, |
|
"eval_runtime": 2.7281, |
|
"eval_samples_per_second": 407.612, |
|
"eval_steps_per_second": 25.659, |
|
"step": 20941 |
|
}, |
|
{ |
|
"epoch": 43.12, |
|
"learning_rate": 1.921971252566735e-05, |
|
"loss": 0.0148, |
|
"step": 21000 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_accuracy": 0.7710570269625387, |
|
"eval_f1": 0.5908850026497084, |
|
"eval_loss": 1.8888484239578247, |
|
"eval_precision": 0.5621376354928157, |
|
"eval_recall": 0.6227310807037141, |
|
"eval_runtime": 2.775, |
|
"eval_samples_per_second": 400.718, |
|
"eval_steps_per_second": 25.225, |
|
"step": 21428 |
|
}, |
|
{ |
|
"epoch": 44.15, |
|
"learning_rate": 1.896303901437372e-05, |
|
"loss": 0.0123, |
|
"step": 21500 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_accuracy": 0.7653066094010976, |
|
"eval_f1": 0.5868878357030016, |
|
"eval_loss": 1.8992524147033691, |
|
"eval_precision": 0.5551681195516812, |
|
"eval_recall": 0.6224518290980173, |
|
"eval_runtime": 2.7417, |
|
"eval_samples_per_second": 405.586, |
|
"eval_steps_per_second": 25.531, |
|
"step": 21915 |
|
}, |
|
{ |
|
"epoch": 45.17, |
|
"learning_rate": 1.8706365503080083e-05, |
|
"loss": 0.0115, |
|
"step": 22000 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_accuracy": 0.7644714865187306, |
|
"eval_f1": 0.597897503285151, |
|
"eval_loss": 1.947526216506958, |
|
"eval_precision": 0.5646562422437329, |
|
"eval_recall": 0.635297402960067, |
|
"eval_runtime": 2.7396, |
|
"eval_samples_per_second": 405.892, |
|
"eval_steps_per_second": 25.551, |
|
"step": 22402 |
|
}, |
|
{ |
|
"epoch": 46.2, |
|
"learning_rate": 1.844969199178645e-05, |
|
"loss": 0.0107, |
|
"step": 22500 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_accuracy": 0.7674302075876879, |
|
"eval_f1": 0.605424089337942, |
|
"eval_loss": 1.994935393333435, |
|
"eval_precision": 0.5777721390510023, |
|
"eval_recall": 0.6358559061714605, |
|
"eval_runtime": 2.7286, |
|
"eval_samples_per_second": 407.535, |
|
"eval_steps_per_second": 25.654, |
|
"step": 22889 |
|
}, |
|
{ |
|
"epoch": 47.23, |
|
"learning_rate": 1.8193018480492815e-05, |
|
"loss": 0.0098, |
|
"step": 23000 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_accuracy": 0.7680744452397996, |
|
"eval_f1": 0.5976063829787234, |
|
"eval_loss": 1.9606735706329346, |
|
"eval_precision": 0.5704493526275705, |
|
"eval_recall": 0.6274783580005585, |
|
"eval_runtime": 2.772, |
|
"eval_samples_per_second": 401.157, |
|
"eval_steps_per_second": 25.253, |
|
"step": 23376 |
|
}, |
|
{ |
|
"epoch": 48.25, |
|
"learning_rate": 1.793634496919918e-05, |
|
"loss": 0.012, |
|
"step": 23500 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_accuracy": 0.7675733715103794, |
|
"eval_f1": 0.6134034165571617, |
|
"eval_loss": 1.918538212776184, |
|
"eval_precision": 0.5793000744601638, |
|
"eval_recall": 0.6517732476961743, |
|
"eval_runtime": 2.7319, |
|
"eval_samples_per_second": 407.049, |
|
"eval_steps_per_second": 25.624, |
|
"step": 23863 |
|
}, |
|
{ |
|
"epoch": 49.28, |
|
"learning_rate": 1.7679671457905544e-05, |
|
"loss": 0.0117, |
|
"step": 24000 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_accuracy": 0.7698401336196612, |
|
"eval_f1": 0.6049822064056939, |
|
"eval_loss": 1.9814343452453613, |
|
"eval_precision": 0.572890664003994, |
|
"eval_recall": 0.6408824350740017, |
|
"eval_runtime": 2.761, |
|
"eval_samples_per_second": 402.752, |
|
"eval_steps_per_second": 25.353, |
|
"step": 24350 |
|
}, |
|
{ |
|
"epoch": 50.31, |
|
"learning_rate": 1.742299794661191e-05, |
|
"loss": 0.0093, |
|
"step": 24500 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_accuracy": 0.7662371748985922, |
|
"eval_f1": 0.6067415730337078, |
|
"eval_loss": 2.035374164581299, |
|
"eval_precision": 0.5760542168674698, |
|
"eval_recall": 0.6408824350740017, |
|
"eval_runtime": 2.7628, |
|
"eval_samples_per_second": 402.494, |
|
"eval_steps_per_second": 25.337, |
|
"step": 24837 |
|
}, |
|
{ |
|
"epoch": 51.33, |
|
"learning_rate": 1.7166324435318276e-05, |
|
"loss": 0.0082, |
|
"step": 25000 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_accuracy": 0.7683130517776187, |
|
"eval_f1": 0.6179188429087987, |
|
"eval_loss": 1.9876421689987183, |
|
"eval_precision": 0.5936695831188883, |
|
"eval_recall": 0.6442334543423625, |
|
"eval_runtime": 2.751, |
|
"eval_samples_per_second": 404.224, |
|
"eval_steps_per_second": 25.446, |
|
"step": 25324 |
|
}, |
|
{ |
|
"epoch": 52.36, |
|
"learning_rate": 1.6909650924024642e-05, |
|
"loss": 0.0077, |
|
"step": 25500 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_accuracy": 0.7691481746599856, |
|
"eval_f1": 0.6208498428747096, |
|
"eval_loss": 2.0615577697753906, |
|
"eval_precision": 0.6078116639914393, |
|
"eval_recall": 0.6344596481429768, |
|
"eval_runtime": 2.7544, |
|
"eval_samples_per_second": 403.721, |
|
"eval_steps_per_second": 25.414, |
|
"step": 25811 |
|
}, |
|
{ |
|
"epoch": 53.39, |
|
"learning_rate": 1.6652977412731005e-05, |
|
"loss": 0.0087, |
|
"step": 26000 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_accuracy": 0.7652588880935338, |
|
"eval_f1": 0.5977975878342947, |
|
"eval_loss": 1.9790315628051758, |
|
"eval_precision": 0.5633802816901409, |
|
"eval_recall": 0.6366936609885507, |
|
"eval_runtime": 2.7387, |
|
"eval_samples_per_second": 406.036, |
|
"eval_steps_per_second": 25.56, |
|
"step": 26298 |
|
}, |
|
{ |
|
"epoch": 54.41, |
|
"learning_rate": 1.639630390143737e-05, |
|
"loss": 0.0102, |
|
"step": 26500 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_accuracy": 0.7677642567406346, |
|
"eval_f1": 0.6056356660933986, |
|
"eval_loss": 2.068793773651123, |
|
"eval_precision": 0.5754147812971342, |
|
"eval_recall": 0.6392069254398213, |
|
"eval_runtime": 2.8605, |
|
"eval_samples_per_second": 388.746, |
|
"eval_steps_per_second": 24.471, |
|
"step": 26785 |
|
}, |
|
{ |
|
"epoch": 55.44, |
|
"learning_rate": 1.6139630390143737e-05, |
|
"loss": 0.0073, |
|
"step": 27000 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_accuracy": 0.7678596993557624, |
|
"eval_f1": 0.6073495759860008, |
|
"eval_loss": 1.960081696510315, |
|
"eval_precision": 0.5862785862785863, |
|
"eval_recall": 0.629991622451829, |
|
"eval_runtime": 2.7429, |
|
"eval_samples_per_second": 405.41, |
|
"eval_steps_per_second": 25.52, |
|
"step": 27272 |
|
}, |
|
{ |
|
"epoch": 56.47, |
|
"learning_rate": 1.5882956878850103e-05, |
|
"loss": 0.0087, |
|
"step": 27500 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_accuracy": 0.7683369124314006, |
|
"eval_f1": 0.6085343228200372, |
|
"eval_loss": 2.0414817333221436, |
|
"eval_precision": 0.5790668348045397, |
|
"eval_recall": 0.6411616866796984, |
|
"eval_runtime": 2.7325, |
|
"eval_samples_per_second": 406.95, |
|
"eval_steps_per_second": 25.617, |
|
"step": 27759 |
|
}, |
|
{ |
|
"epoch": 57.49, |
|
"learning_rate": 1.5626283367556466e-05, |
|
"loss": 0.0082, |
|
"step": 28000 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_accuracy": 0.766571224051539, |
|
"eval_f1": 0.6019978969505784, |
|
"eval_loss": 2.077375888824463, |
|
"eval_precision": 0.5686615346411721, |
|
"eval_recall": 0.639486177045518, |
|
"eval_runtime": 2.7299, |
|
"eval_samples_per_second": 407.338, |
|
"eval_steps_per_second": 25.642, |
|
"step": 28246 |
|
}, |
|
{ |
|
"epoch": 58.52, |
|
"learning_rate": 1.5369609856262832e-05, |
|
"loss": 0.0056, |
|
"step": 28500 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"eval_accuracy": 0.7637318062514913, |
|
"eval_f1": 0.6061579651941098, |
|
"eval_loss": 2.077326536178589, |
|
"eval_precision": 0.5821547955772692, |
|
"eval_recall": 0.6322256352974029, |
|
"eval_runtime": 2.7596, |
|
"eval_samples_per_second": 402.96, |
|
"eval_steps_per_second": 25.366, |
|
"step": 28733 |
|
}, |
|
{ |
|
"epoch": 59.55, |
|
"learning_rate": 1.5112936344969198e-05, |
|
"loss": 0.0076, |
|
"step": 29000 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_accuracy": 0.7695299451204963, |
|
"eval_f1": 0.6170241467691892, |
|
"eval_loss": 2.104527235031128, |
|
"eval_precision": 0.5968162839248434, |
|
"eval_recall": 0.6386484222284278, |
|
"eval_runtime": 2.73, |
|
"eval_samples_per_second": 407.333, |
|
"eval_steps_per_second": 25.641, |
|
"step": 29220 |
|
}, |
|
{ |
|
"epoch": 60.57, |
|
"learning_rate": 1.4856262833675564e-05, |
|
"loss": 0.0071, |
|
"step": 29500 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"eval_accuracy": 0.768241469816273, |
|
"eval_f1": 0.6094618408567168, |
|
"eval_loss": 2.0994060039520264, |
|
"eval_precision": 0.5922023182297155, |
|
"eval_recall": 0.6277576096062553, |
|
"eval_runtime": 2.7589, |
|
"eval_samples_per_second": 403.058, |
|
"eval_steps_per_second": 25.372, |
|
"step": 29707 |
|
}, |
|
{ |
|
"epoch": 61.6, |
|
"learning_rate": 1.459958932238193e-05, |
|
"loss": 0.0076, |
|
"step": 30000 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_accuracy": 0.7649725602481507, |
|
"eval_f1": 0.609375, |
|
"eval_loss": 2.0936837196350098, |
|
"eval_precision": 0.5794510198942332, |
|
"eval_recall": 0.6425579447081821, |
|
"eval_runtime": 2.7348, |
|
"eval_samples_per_second": 406.615, |
|
"eval_steps_per_second": 25.596, |
|
"step": 30194 |
|
}, |
|
{ |
|
"epoch": 62.63, |
|
"learning_rate": 1.4342915811088295e-05, |
|
"loss": 0.0082, |
|
"step": 30500 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"eval_accuracy": 0.7682653304700549, |
|
"eval_f1": 0.6062616078535421, |
|
"eval_loss": 2.0307247638702393, |
|
"eval_precision": 0.5774576699519838, |
|
"eval_recall": 0.6380899190170344, |
|
"eval_runtime": 2.7517, |
|
"eval_samples_per_second": 404.118, |
|
"eval_steps_per_second": 25.439, |
|
"step": 30681 |
|
}, |
|
{ |
|
"epoch": 63.66, |
|
"learning_rate": 1.4086242299794661e-05, |
|
"loss": 0.0068, |
|
"step": 31000 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_accuracy": 0.7597232164161298, |
|
"eval_f1": 0.6074766355140186, |
|
"eval_loss": 2.1657230854034424, |
|
"eval_precision": 0.581990278843694, |
|
"eval_recall": 0.635297402960067, |
|
"eval_runtime": 2.7205, |
|
"eval_samples_per_second": 408.743, |
|
"eval_steps_per_second": 25.73, |
|
"step": 31168 |
|
}, |
|
{ |
|
"epoch": 64.68, |
|
"learning_rate": 1.3829568788501027e-05, |
|
"loss": 0.0065, |
|
"step": 31500 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"eval_accuracy": 0.7691720353137675, |
|
"eval_f1": 0.6134431455897981, |
|
"eval_loss": 2.0141701698303223, |
|
"eval_precision": 0.5850012667848999, |
|
"eval_recall": 0.644791957553756, |
|
"eval_runtime": 2.7583, |
|
"eval_samples_per_second": 403.142, |
|
"eval_steps_per_second": 25.378, |
|
"step": 31655 |
|
}, |
|
{ |
|
"epoch": 65.71, |
|
"learning_rate": 1.3572895277207393e-05, |
|
"loss": 0.0062, |
|
"step": 32000 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"eval_accuracy": 0.76022429014555, |
|
"eval_f1": 0.6064225053078556, |
|
"eval_loss": 2.1378581523895264, |
|
"eval_precision": 0.5777496839443742, |
|
"eval_recall": 0.6380899190170344, |
|
"eval_runtime": 2.7502, |
|
"eval_samples_per_second": 404.334, |
|
"eval_steps_per_second": 25.453, |
|
"step": 32142 |
|
}, |
|
{ |
|
"epoch": 66.74, |
|
"learning_rate": 1.331622176591376e-05, |
|
"loss": 0.0059, |
|
"step": 32500 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"eval_accuracy": 0.7631352899069435, |
|
"eval_f1": 0.6117240462581417, |
|
"eval_loss": 2.1318540573120117, |
|
"eval_precision": 0.5837138508371386, |
|
"eval_recall": 0.6425579447081821, |
|
"eval_runtime": 2.7357, |
|
"eval_samples_per_second": 406.471, |
|
"eval_steps_per_second": 25.587, |
|
"step": 32629 |
|
}, |
|
{ |
|
"epoch": 67.76, |
|
"learning_rate": 1.3059548254620124e-05, |
|
"loss": 0.0053, |
|
"step": 33000 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"eval_accuracy": 0.768217609162491, |
|
"eval_f1": 0.6046449900464498, |
|
"eval_loss": 2.1246144771575928, |
|
"eval_precision": 0.5761254425897825, |
|
"eval_recall": 0.6361351577771572, |
|
"eval_runtime": 2.7525, |
|
"eval_samples_per_second": 404.001, |
|
"eval_steps_per_second": 25.432, |
|
"step": 33116 |
|
}, |
|
{ |
|
"epoch": 68.79, |
|
"learning_rate": 1.280287474332649e-05, |
|
"loss": 0.0049, |
|
"step": 33500 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"eval_accuracy": 0.765736101169172, |
|
"eval_f1": 0.60803618946248, |
|
"eval_loss": 2.151386022567749, |
|
"eval_precision": 0.5806861499364676, |
|
"eval_recall": 0.6380899190170344, |
|
"eval_runtime": 2.7251, |
|
"eval_samples_per_second": 408.061, |
|
"eval_steps_per_second": 25.687, |
|
"step": 33603 |
|
}, |
|
{ |
|
"epoch": 69.82, |
|
"learning_rate": 1.2546201232032854e-05, |
|
"loss": 0.0037, |
|
"step": 34000 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_accuracy": 0.7679790026246719, |
|
"eval_f1": 0.6107114308553158, |
|
"eval_loss": 2.163627862930298, |
|
"eval_precision": 0.5839490445859873, |
|
"eval_recall": 0.6400446802569115, |
|
"eval_runtime": 2.8617, |
|
"eval_samples_per_second": 388.576, |
|
"eval_steps_per_second": 24.461, |
|
"step": 34090 |
|
}, |
|
{ |
|
"epoch": 70.84, |
|
"learning_rate": 1.228952772073922e-05, |
|
"loss": 0.0053, |
|
"step": 34500 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"eval_accuracy": 0.7639465521355285, |
|
"eval_f1": 0.6052596089008766, |
|
"eval_loss": 2.1477560997009277, |
|
"eval_precision": 0.5852895148669797, |
|
"eval_recall": 0.6266406031834683, |
|
"eval_runtime": 2.752, |
|
"eval_samples_per_second": 404.075, |
|
"eval_steps_per_second": 25.436, |
|
"step": 34577 |
|
}, |
|
{ |
|
"epoch": 71.87, |
|
"learning_rate": 1.2032854209445585e-05, |
|
"loss": 0.0051, |
|
"step": 35000 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_accuracy": 0.7688141255070389, |
|
"eval_f1": 0.6074976818121606, |
|
"eval_loss": 2.1522202491760254, |
|
"eval_precision": 0.5778729838709677, |
|
"eval_recall": 0.6403239318626082, |
|
"eval_runtime": 2.7541, |
|
"eval_samples_per_second": 403.762, |
|
"eval_steps_per_second": 25.417, |
|
"step": 35064 |
|
}, |
|
{ |
|
"epoch": 72.9, |
|
"learning_rate": 1.1776180698151951e-05, |
|
"loss": 0.0047, |
|
"step": 35500 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"eval_accuracy": 0.767120019088523, |
|
"eval_f1": 0.6093333333333334, |
|
"eval_loss": 2.1609299182891846, |
|
"eval_precision": 0.5830569022709875, |
|
"eval_recall": 0.6380899190170344, |
|
"eval_runtime": 2.741, |
|
"eval_samples_per_second": 405.695, |
|
"eval_steps_per_second": 25.538, |
|
"step": 35551 |
|
}, |
|
{ |
|
"epoch": 73.92, |
|
"learning_rate": 1.1519507186858315e-05, |
|
"loss": 0.0036, |
|
"step": 36000 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"eval_accuracy": 0.7705559532331185, |
|
"eval_f1": 0.6200566878121204, |
|
"eval_loss": 2.175739288330078, |
|
"eval_precision": 0.6000522466039707, |
|
"eval_recall": 0.6414409382853952, |
|
"eval_runtime": 2.7261, |
|
"eval_samples_per_second": 407.915, |
|
"eval_steps_per_second": 25.678, |
|
"step": 36038 |
|
}, |
|
{ |
|
"epoch": 74.95, |
|
"learning_rate": 1.1262833675564683e-05, |
|
"loss": 0.004, |
|
"step": 36500 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_accuracy": 0.7661894535910284, |
|
"eval_f1": 0.6165353279016962, |
|
"eval_loss": 2.2280185222625732, |
|
"eval_precision": 0.5908858166922683, |
|
"eval_recall": 0.6445127059480592, |
|
"eval_runtime": 2.75, |
|
"eval_samples_per_second": 404.367, |
|
"eval_steps_per_second": 25.455, |
|
"step": 36525 |
|
}, |
|
{ |
|
"epoch": 75.98, |
|
"learning_rate": 1.1006160164271048e-05, |
|
"loss": 0.0036, |
|
"step": 37000 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"eval_accuracy": 0.770985445001193, |
|
"eval_f1": 0.6190347071583514, |
|
"eval_loss": 2.219874382019043, |
|
"eval_precision": 0.6015810276679842, |
|
"eval_recall": 0.6375314158056409, |
|
"eval_runtime": 2.7612, |
|
"eval_samples_per_second": 402.72, |
|
"eval_steps_per_second": 25.351, |
|
"step": 37012 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"eval_accuracy": 0.7684800763540921, |
|
"eval_f1": 0.6117552978808477, |
|
"eval_loss": 2.1809566020965576, |
|
"eval_precision": 0.5851606323304437, |
|
"eval_recall": 0.6408824350740017, |
|
"eval_runtime": 2.7598, |
|
"eval_samples_per_second": 402.922, |
|
"eval_steps_per_second": 25.364, |
|
"step": 37499 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"learning_rate": 1.0749486652977414e-05, |
|
"loss": 0.0043, |
|
"step": 37500 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"eval_accuracy": 0.7688857074683846, |
|
"eval_f1": 0.6095212623696176, |
|
"eval_loss": 2.2160749435424805, |
|
"eval_precision": 0.5848088273030536, |
|
"eval_recall": 0.636414409382854, |
|
"eval_runtime": 2.7615, |
|
"eval_samples_per_second": 402.681, |
|
"eval_steps_per_second": 25.349, |
|
"step": 37986 |
|
}, |
|
{ |
|
"epoch": 78.03, |
|
"learning_rate": 1.0492813141683778e-05, |
|
"loss": 0.0039, |
|
"step": 38000 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"eval_accuracy": 0.7693867811978048, |
|
"eval_f1": 0.6086727989487517, |
|
"eval_loss": 2.187803030014038, |
|
"eval_precision": 0.5748324646314222, |
|
"eval_recall": 0.6467467187936331, |
|
"eval_runtime": 2.7479, |
|
"eval_samples_per_second": 404.677, |
|
"eval_steps_per_second": 25.474, |
|
"step": 38473 |
|
}, |
|
{ |
|
"epoch": 79.06, |
|
"learning_rate": 1.0236139630390144e-05, |
|
"loss": 0.0052, |
|
"step": 38500 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_accuracy": 0.7653066094010976, |
|
"eval_f1": 0.6083209909788608, |
|
"eval_loss": 2.271164894104004, |
|
"eval_precision": 0.5873634945397815, |
|
"eval_recall": 0.6308293772689193, |
|
"eval_runtime": 2.7444, |
|
"eval_samples_per_second": 405.19, |
|
"eval_steps_per_second": 25.507, |
|
"step": 38960 |
|
}, |
|
{ |
|
"epoch": 80.08, |
|
"learning_rate": 9.979466119096509e-06, |
|
"loss": 0.0034, |
|
"step": 39000 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"eval_accuracy": 0.7658076831305177, |
|
"eval_f1": 0.6129723934601984, |
|
"eval_loss": 2.264491319656372, |
|
"eval_precision": 0.5892811131151765, |
|
"eval_recall": 0.6386484222284278, |
|
"eval_runtime": 2.7444, |
|
"eval_samples_per_second": 405.192, |
|
"eval_steps_per_second": 25.507, |
|
"step": 39447 |
|
}, |
|
{ |
|
"epoch": 81.11, |
|
"learning_rate": 9.722792607802875e-06, |
|
"loss": 0.0027, |
|
"step": 39500 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"eval_accuracy": 0.7651157241708423, |
|
"eval_f1": 0.6160738528373609, |
|
"eval_loss": 2.2353475093841553, |
|
"eval_precision": 0.5994715984147952, |
|
"eval_recall": 0.6336218933258866, |
|
"eval_runtime": 2.7335, |
|
"eval_samples_per_second": 406.808, |
|
"eval_steps_per_second": 25.608, |
|
"step": 39934 |
|
}, |
|
{ |
|
"epoch": 82.14, |
|
"learning_rate": 9.46611909650924e-06, |
|
"loss": 0.0026, |
|
"step": 40000 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"eval_accuracy": 0.7630398472918158, |
|
"eval_f1": 0.6092892517735242, |
|
"eval_loss": 2.3130922317504883, |
|
"eval_precision": 0.5850899742930591, |
|
"eval_recall": 0.6355766545657637, |
|
"eval_runtime": 2.7731, |
|
"eval_samples_per_second": 400.996, |
|
"eval_steps_per_second": 25.243, |
|
"step": 40421 |
|
}, |
|
{ |
|
"epoch": 83.16, |
|
"learning_rate": 9.209445585215607e-06, |
|
"loss": 0.0017, |
|
"step": 40500 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"eval_accuracy": 0.766022429014555, |
|
"eval_f1": 0.6101919258769026, |
|
"eval_loss": 2.279829978942871, |
|
"eval_precision": 0.5800201308505284, |
|
"eval_recall": 0.643674951130969, |
|
"eval_runtime": 2.8746, |
|
"eval_samples_per_second": 386.835, |
|
"eval_steps_per_second": 24.351, |
|
"step": 40908 |
|
}, |
|
{ |
|
"epoch": 84.19, |
|
"learning_rate": 8.952772073921972e-06, |
|
"loss": 0.0022, |
|
"step": 41000 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"eval_accuracy": 0.7636840849439275, |
|
"eval_f1": 0.6126270733012306, |
|
"eval_loss": 2.3181393146514893, |
|
"eval_precision": 0.5879332477535302, |
|
"eval_recall": 0.639486177045518, |
|
"eval_runtime": 2.7182, |
|
"eval_samples_per_second": 409.097, |
|
"eval_steps_per_second": 25.752, |
|
"step": 41395 |
|
}, |
|
{ |
|
"epoch": 85.22, |
|
"learning_rate": 8.696098562628338e-06, |
|
"loss": 0.0032, |
|
"step": 41500 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"eval_accuracy": 0.769625387735624, |
|
"eval_f1": 0.6169463995668651, |
|
"eval_loss": 2.296386480331421, |
|
"eval_precision": 0.5986340950879958, |
|
"eval_recall": 0.636414409382854, |
|
"eval_runtime": 2.7321, |
|
"eval_samples_per_second": 407.016, |
|
"eval_steps_per_second": 25.622, |
|
"step": 41882 |
|
}, |
|
{ |
|
"epoch": 86.24, |
|
"learning_rate": 8.439425051334702e-06, |
|
"loss": 0.003, |
|
"step": 42000 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"eval_accuracy": 0.7664996420901933, |
|
"eval_f1": 0.6199271942834029, |
|
"eval_loss": 2.250883102416992, |
|
"eval_precision": 0.5993222106360793, |
|
"eval_recall": 0.6419994414967886, |
|
"eval_runtime": 2.7205, |
|
"eval_samples_per_second": 408.748, |
|
"eval_steps_per_second": 25.731, |
|
"step": 42369 |
|
}, |
|
{ |
|
"epoch": 87.27, |
|
"learning_rate": 8.182751540041068e-06, |
|
"loss": 0.003, |
|
"step": 42500 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_accuracy": 0.7704843712717728, |
|
"eval_f1": 0.6209611729568286, |
|
"eval_loss": 2.2512495517730713, |
|
"eval_precision": 0.604227212681638, |
|
"eval_recall": 0.6386484222284278, |
|
"eval_runtime": 2.7574, |
|
"eval_samples_per_second": 403.273, |
|
"eval_steps_per_second": 25.386, |
|
"step": 42856 |
|
}, |
|
{ |
|
"epoch": 88.3, |
|
"learning_rate": 7.926078028747433e-06, |
|
"loss": 0.0027, |
|
"step": 43000 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"eval_accuracy": 0.7695299451204963, |
|
"eval_f1": 0.612212529738303, |
|
"eval_loss": 2.2786777019500732, |
|
"eval_precision": 0.5811794228356336, |
|
"eval_recall": 0.6467467187936331, |
|
"eval_runtime": 2.7267, |
|
"eval_samples_per_second": 407.814, |
|
"eval_steps_per_second": 25.672, |
|
"step": 43343 |
|
}, |
|
{ |
|
"epoch": 89.32, |
|
"learning_rate": 7.669404517453799e-06, |
|
"loss": 0.0016, |
|
"step": 43500 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_accuracy": 0.7652588880935338, |
|
"eval_f1": 0.6130278406820301, |
|
"eval_loss": 2.2572543621063232, |
|
"eval_precision": 0.5860927152317881, |
|
"eval_recall": 0.6425579447081821, |
|
"eval_runtime": 2.7593, |
|
"eval_samples_per_second": 403.005, |
|
"eval_steps_per_second": 25.369, |
|
"step": 43830 |
|
}, |
|
{ |
|
"epoch": 90.35, |
|
"learning_rate": 7.412731006160165e-06, |
|
"loss": 0.0028, |
|
"step": 44000 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"eval_accuracy": 0.7694106418515867, |
|
"eval_f1": 0.6204956463496316, |
|
"eval_loss": 2.247675895690918, |
|
"eval_precision": 0.596292481977343, |
|
"eval_recall": 0.6467467187936331, |
|
"eval_runtime": 2.7505, |
|
"eval_samples_per_second": 404.29, |
|
"eval_steps_per_second": 25.45, |
|
"step": 44317 |
|
}, |
|
{ |
|
"epoch": 91.38, |
|
"learning_rate": 7.15605749486653e-06, |
|
"loss": 0.0022, |
|
"step": 44500 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"eval_accuracy": 0.765187306132188, |
|
"eval_f1": 0.6163021868787275, |
|
"eval_loss": 2.2445809841156006, |
|
"eval_precision": 0.5865287588294652, |
|
"eval_recall": 0.6492599832449036, |
|
"eval_runtime": 2.7626, |
|
"eval_samples_per_second": 402.524, |
|
"eval_steps_per_second": 25.339, |
|
"step": 44804 |
|
}, |
|
{ |
|
"epoch": 92.4, |
|
"learning_rate": 6.899383983572895e-06, |
|
"loss": 0.0017, |
|
"step": 45000 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"eval_accuracy": 0.7661417322834646, |
|
"eval_f1": 0.6177255739455418, |
|
"eval_loss": 2.25286602973938, |
|
"eval_precision": 0.591664535924316, |
|
"eval_recall": 0.6461882155822396, |
|
"eval_runtime": 2.7411, |
|
"eval_samples_per_second": 405.68, |
|
"eval_steps_per_second": 25.537, |
|
"step": 45291 |
|
}, |
|
{ |
|
"epoch": 93.43, |
|
"learning_rate": 6.642710472279261e-06, |
|
"loss": 0.0017, |
|
"step": 45500 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"eval_accuracy": 0.7649725602481507, |
|
"eval_f1": 0.6157979580870501, |
|
"eval_loss": 2.2623953819274902, |
|
"eval_precision": 0.5933212529122444, |
|
"eval_recall": 0.6400446802569115, |
|
"eval_runtime": 2.7635, |
|
"eval_samples_per_second": 402.391, |
|
"eval_steps_per_second": 25.33, |
|
"step": 45778 |
|
}, |
|
{ |
|
"epoch": 94.46, |
|
"learning_rate": 6.386036960985627e-06, |
|
"loss": 0.0015, |
|
"step": 46000 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"eval_accuracy": 0.7649964209019328, |
|
"eval_f1": 0.6160291931342073, |
|
"eval_loss": 2.2783970832824707, |
|
"eval_precision": 0.5969093766369827, |
|
"eval_recall": 0.636414409382854, |
|
"eval_runtime": 2.7635, |
|
"eval_samples_per_second": 402.387, |
|
"eval_steps_per_second": 25.33, |
|
"step": 46265 |
|
}, |
|
{ |
|
"epoch": 95.48, |
|
"learning_rate": 6.129363449691992e-06, |
|
"loss": 0.0012, |
|
"step": 46500 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_accuracy": 0.7629444046766881, |
|
"eval_f1": 0.6143217749435366, |
|
"eval_loss": 2.303816318511963, |
|
"eval_precision": 0.58590978205778, |
|
"eval_recall": 0.6456297123708461, |
|
"eval_runtime": 2.7486, |
|
"eval_samples_per_second": 404.571, |
|
"eval_steps_per_second": 25.468, |
|
"step": 46752 |
|
}, |
|
{ |
|
"epoch": 96.51, |
|
"learning_rate": 5.872689938398357e-06, |
|
"loss": 0.0019, |
|
"step": 47000 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"eval_accuracy": 0.764900978286805, |
|
"eval_f1": 0.6164437971666887, |
|
"eval_loss": 2.3128607273101807, |
|
"eval_precision": 0.5861027190332326, |
|
"eval_recall": 0.6500977380619939, |
|
"eval_runtime": 2.7259, |
|
"eval_samples_per_second": 407.943, |
|
"eval_steps_per_second": 25.68, |
|
"step": 47239 |
|
}, |
|
{ |
|
"epoch": 97.54, |
|
"learning_rate": 5.6160164271047226e-06, |
|
"loss": 0.001, |
|
"step": 47500 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"eval_accuracy": 0.7681698878549272, |
|
"eval_f1": 0.615528781793842, |
|
"eval_loss": 2.3077099323272705, |
|
"eval_precision": 0.5911545384417588, |
|
"eval_recall": 0.6419994414967886, |
|
"eval_runtime": 2.7427, |
|
"eval_samples_per_second": 405.435, |
|
"eval_steps_per_second": 25.522, |
|
"step": 47726 |
|
}, |
|
{ |
|
"epoch": 98.56, |
|
"learning_rate": 5.359342915811089e-06, |
|
"loss": 0.0009, |
|
"step": 48000 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"eval_accuracy": 0.7633023144834169, |
|
"eval_f1": 0.6161656646626587, |
|
"eval_loss": 2.3493497371673584, |
|
"eval_precision": 0.5906762295081968, |
|
"eval_recall": 0.6439542027366657, |
|
"eval_runtime": 2.7482, |
|
"eval_samples_per_second": 404.633, |
|
"eval_steps_per_second": 25.471, |
|
"step": 48213 |
|
}, |
|
{ |
|
"epoch": 99.59, |
|
"learning_rate": 5.102669404517454e-06, |
|
"loss": 0.0015, |
|
"step": 48500 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_accuracy": 0.7701264614650442, |
|
"eval_f1": 0.62121007950411, |
|
"eval_loss": 2.319547414779663, |
|
"eval_precision": 0.6002604166666666, |
|
"eval_recall": 0.643674951130969, |
|
"eval_runtime": 2.8329, |
|
"eval_samples_per_second": 392.534, |
|
"eval_steps_per_second": 24.71, |
|
"step": 48700 |
|
}, |
|
{ |
|
"epoch": 100.62, |
|
"learning_rate": 4.845995893223819e-06, |
|
"loss": 0.001, |
|
"step": 49000 |
|
}, |
|
{ |
|
"epoch": 101.0, |
|
"eval_accuracy": 0.7711286089238845, |
|
"eval_f1": 0.6214266631044617, |
|
"eval_loss": 2.3443996906280518, |
|
"eval_precision": 0.5956466069142126, |
|
"eval_recall": 0.6495392348506004, |
|
"eval_runtime": 2.7763, |
|
"eval_samples_per_second": 400.528, |
|
"eval_steps_per_second": 25.213, |
|
"step": 49187 |
|
}, |
|
{ |
|
"epoch": 101.64, |
|
"learning_rate": 4.5893223819301845e-06, |
|
"loss": 0.0008, |
|
"step": 49500 |
|
}, |
|
{ |
|
"epoch": 102.0, |
|
"eval_accuracy": 0.7638749701741828, |
|
"eval_f1": 0.6155906777390839, |
|
"eval_loss": 2.404651403427124, |
|
"eval_precision": 0.5915057915057915, |
|
"eval_recall": 0.6417201898910919, |
|
"eval_runtime": 2.7517, |
|
"eval_samples_per_second": 404.111, |
|
"eval_steps_per_second": 25.439, |
|
"step": 49674 |
|
}, |
|
{ |
|
"epoch": 102.67, |
|
"learning_rate": 4.332648870636551e-06, |
|
"loss": 0.0011, |
|
"step": 50000 |
|
}, |
|
{ |
|
"epoch": 103.0, |
|
"eval_accuracy": 0.7672393223574326, |
|
"eval_f1": 0.6098464796188459, |
|
"eval_loss": 2.344151258468628, |
|
"eval_precision": 0.579622641509434, |
|
"eval_recall": 0.6433956995252723, |
|
"eval_runtime": 2.7536, |
|
"eval_samples_per_second": 403.83, |
|
"eval_steps_per_second": 25.421, |
|
"step": 50161 |
|
}, |
|
{ |
|
"epoch": 103.7, |
|
"learning_rate": 4.075975359342916e-06, |
|
"loss": 0.0009, |
|
"step": 50500 |
|
}, |
|
{ |
|
"epoch": 104.0, |
|
"eval_accuracy": 0.768217609162491, |
|
"eval_f1": 0.6160439266104192, |
|
"eval_loss": 2.3377583026885986, |
|
"eval_precision": 0.5918682449819866, |
|
"eval_recall": 0.6422786931024853, |
|
"eval_runtime": 2.718, |
|
"eval_samples_per_second": 409.123, |
|
"eval_steps_per_second": 25.754, |
|
"step": 50648 |
|
}, |
|
{ |
|
"epoch": 104.72, |
|
"learning_rate": 3.819301848049281e-06, |
|
"loss": 0.0011, |
|
"step": 51000 |
|
}, |
|
{ |
|
"epoch": 105.0, |
|
"eval_accuracy": 0.7702934860415175, |
|
"eval_f1": 0.6217602591792657, |
|
"eval_loss": 2.319119691848755, |
|
"eval_precision": 0.6017768487065587, |
|
"eval_recall": 0.6431164479195756, |
|
"eval_runtime": 2.7509, |
|
"eval_samples_per_second": 404.228, |
|
"eval_steps_per_second": 25.446, |
|
"step": 51135 |
|
}, |
|
{ |
|
"epoch": 105.75, |
|
"learning_rate": 3.5626283367556473e-06, |
|
"loss": 0.0007, |
|
"step": 51500 |
|
}, |
|
{ |
|
"epoch": 106.0, |
|
"eval_accuracy": 0.7682891911238368, |
|
"eval_f1": 0.6160821442859047, |
|
"eval_loss": 2.376638412475586, |
|
"eval_precision": 0.5895865237366003, |
|
"eval_recall": 0.6450712091594527, |
|
"eval_runtime": 2.7518, |
|
"eval_samples_per_second": 404.103, |
|
"eval_steps_per_second": 25.438, |
|
"step": 51622 |
|
}, |
|
{ |
|
"epoch": 106.78, |
|
"learning_rate": 3.3059548254620125e-06, |
|
"loss": 0.0004, |
|
"step": 52000 |
|
}, |
|
{ |
|
"epoch": 107.0, |
|
"eval_accuracy": 0.77568599379623, |
|
"eval_f1": 0.624123043712898, |
|
"eval_loss": 2.3492467403411865, |
|
"eval_precision": 0.6037588097102584, |
|
"eval_recall": 0.6459089639765428, |
|
"eval_runtime": 2.7841, |
|
"eval_samples_per_second": 399.413, |
|
"eval_steps_per_second": 25.143, |
|
"step": 52109 |
|
}, |
|
{ |
|
"epoch": 107.8, |
|
"learning_rate": 3.049281314168378e-06, |
|
"loss": 0.0008, |
|
"step": 52500 |
|
}, |
|
{ |
|
"epoch": 108.0, |
|
"eval_accuracy": 0.7681221665473634, |
|
"eval_f1": 0.620874698148645, |
|
"eval_loss": 2.3653135299682617, |
|
"eval_precision": 0.5974696617609089, |
|
"eval_recall": 0.6461882155822396, |
|
"eval_runtime": 2.742, |
|
"eval_samples_per_second": 405.547, |
|
"eval_steps_per_second": 25.529, |
|
"step": 52596 |
|
}, |
|
{ |
|
"epoch": 108.83, |
|
"learning_rate": 2.7926078028747435e-06, |
|
"loss": 0.0005, |
|
"step": 53000 |
|
}, |
|
{ |
|
"epoch": 109.0, |
|
"eval_accuracy": 0.7691720353137675, |
|
"eval_f1": 0.6206246634356489, |
|
"eval_loss": 2.3852195739746094, |
|
"eval_precision": 0.5991681829997401, |
|
"eval_recall": 0.643674951130969, |
|
"eval_runtime": 2.756, |
|
"eval_samples_per_second": 403.488, |
|
"eval_steps_per_second": 25.399, |
|
"step": 53083 |
|
}, |
|
{ |
|
"epoch": 109.86, |
|
"learning_rate": 2.5359342915811088e-06, |
|
"loss": 0.0005, |
|
"step": 53500 |
|
}, |
|
{ |
|
"epoch": 110.0, |
|
"eval_accuracy": 0.7685277976616559, |
|
"eval_f1": 0.6224392891059558, |
|
"eval_loss": 2.406304359436035, |
|
"eval_precision": 0.6052770448548813, |
|
"eval_recall": 0.6406031834683049, |
|
"eval_runtime": 2.7427, |
|
"eval_samples_per_second": 405.436, |
|
"eval_steps_per_second": 25.522, |
|
"step": 53570 |
|
}, |
|
{ |
|
"epoch": 110.88, |
|
"learning_rate": 2.2792607802874745e-06, |
|
"loss": 0.0008, |
|
"step": 54000 |
|
}, |
|
{ |
|
"epoch": 111.0, |
|
"eval_accuracy": 0.7683369124314006, |
|
"eval_f1": 0.6195049371026647, |
|
"eval_loss": 2.4256536960601807, |
|
"eval_precision": 0.6007345225603358, |
|
"eval_recall": 0.639486177045518, |
|
"eval_runtime": 2.7562, |
|
"eval_samples_per_second": 403.45, |
|
"eval_steps_per_second": 25.397, |
|
"step": 54057 |
|
}, |
|
{ |
|
"epoch": 111.91, |
|
"learning_rate": 2.0225872689938397e-06, |
|
"loss": 0.0009, |
|
"step": 54500 |
|
}, |
|
{ |
|
"epoch": 112.0, |
|
"eval_accuracy": 0.7700071581961345, |
|
"eval_f1": 0.6207082267402719, |
|
"eval_loss": 2.40315842628479, |
|
"eval_precision": 0.5993239729589184, |
|
"eval_recall": 0.643674951130969, |
|
"eval_runtime": 2.7393, |
|
"eval_samples_per_second": 405.937, |
|
"eval_steps_per_second": 25.554, |
|
"step": 54544 |
|
}, |
|
{ |
|
"epoch": 112.94, |
|
"learning_rate": 1.7659137577002054e-06, |
|
"loss": 0.0006, |
|
"step": 55000 |
|
}, |
|
{ |
|
"epoch": 113.0, |
|
"eval_accuracy": 0.770722977809592, |
|
"eval_f1": 0.6195783536994763, |
|
"eval_loss": 2.3877792358398438, |
|
"eval_precision": 0.5967408173823073, |
|
"eval_recall": 0.6442334543423625, |
|
"eval_runtime": 2.7437, |
|
"eval_samples_per_second": 405.288, |
|
"eval_steps_per_second": 25.513, |
|
"step": 55031 |
|
}, |
|
{ |
|
"epoch": 113.96, |
|
"learning_rate": 1.509240246406571e-06, |
|
"loss": 0.0003, |
|
"step": 55500 |
|
}, |
|
{ |
|
"epoch": 114.0, |
|
"eval_accuracy": 0.771271772846576, |
|
"eval_f1": 0.6211180124223602, |
|
"eval_loss": 2.3938703536987305, |
|
"eval_precision": 0.6013071895424836, |
|
"eval_recall": 0.6422786931024853, |
|
"eval_runtime": 2.7378, |
|
"eval_samples_per_second": 406.165, |
|
"eval_steps_per_second": 25.568, |
|
"step": 55518 |
|
}, |
|
{ |
|
"epoch": 114.99, |
|
"learning_rate": 1.2525667351129362e-06, |
|
"loss": 0.0003, |
|
"step": 56000 |
|
}, |
|
{ |
|
"epoch": 115.0, |
|
"eval_accuracy": 0.7702934860415175, |
|
"eval_f1": 0.618289722147289, |
|
"eval_loss": 2.412465810775757, |
|
"eval_precision": 0.597965040438299, |
|
"eval_recall": 0.6400446802569115, |
|
"eval_runtime": 2.8471, |
|
"eval_samples_per_second": 390.575, |
|
"eval_steps_per_second": 24.587, |
|
"step": 56005 |
|
}, |
|
{ |
|
"epoch": 116.0, |
|
"eval_accuracy": 0.7705798138869006, |
|
"eval_f1": 0.6196730099169123, |
|
"eval_loss": 2.420255661010742, |
|
"eval_precision": 0.5957227518680752, |
|
"eval_recall": 0.6456297123708461, |
|
"eval_runtime": 2.7618, |
|
"eval_samples_per_second": 402.642, |
|
"eval_steps_per_second": 25.346, |
|
"step": 56492 |
|
}, |
|
{ |
|
"epoch": 116.02, |
|
"learning_rate": 9.958932238193019e-07, |
|
"loss": 0.0003, |
|
"step": 56500 |
|
}, |
|
{ |
|
"epoch": 117.0, |
|
"eval_accuracy": 0.770722977809592, |
|
"eval_f1": 0.6205501618122977, |
|
"eval_loss": 2.410393476486206, |
|
"eval_precision": 0.6, |
|
"eval_recall": 0.6425579447081821, |
|
"eval_runtime": 2.7288, |
|
"eval_samples_per_second": 407.51, |
|
"eval_steps_per_second": 25.653, |
|
"step": 56979 |
|
}, |
|
{ |
|
"epoch": 117.04, |
|
"learning_rate": 7.392197125256674e-07, |
|
"loss": 0.0004, |
|
"step": 57000 |
|
}, |
|
{ |
|
"epoch": 118.0, |
|
"eval_accuracy": 0.7695538057742782, |
|
"eval_f1": 0.6216835016835018, |
|
"eval_loss": 2.4210033416748047, |
|
"eval_precision": 0.6004162330905307, |
|
"eval_recall": 0.6445127059480592, |
|
"eval_runtime": 2.7601, |
|
"eval_samples_per_second": 402.887, |
|
"eval_steps_per_second": 25.362, |
|
"step": 57466 |
|
}, |
|
{ |
|
"epoch": 118.07, |
|
"learning_rate": 4.82546201232033e-07, |
|
"loss": 0.0004, |
|
"step": 57500 |
|
}, |
|
{ |
|
"epoch": 119.0, |
|
"eval_accuracy": 0.7691720353137675, |
|
"eval_f1": 0.6201508620689655, |
|
"eval_loss": 2.4213058948516846, |
|
"eval_precision": 0.5990111891751236, |
|
"eval_recall": 0.6428371963138788, |
|
"eval_runtime": 2.776, |
|
"eval_samples_per_second": 400.579, |
|
"eval_steps_per_second": 25.216, |
|
"step": 57953 |
|
}, |
|
{ |
|
"epoch": 119.1, |
|
"learning_rate": 2.2587268993839835e-07, |
|
"loss": 0.0004, |
|
"step": 58000 |
|
}, |
|
{ |
|
"epoch": 120.0, |
|
"eval_accuracy": 0.7694106418515867, |
|
"eval_f1": 0.6200296535921282, |
|
"eval_loss": 2.4216408729553223, |
|
"eval_precision": 0.5992704533611256, |
|
"eval_recall": 0.6422786931024853, |
|
"eval_runtime": 2.7416, |
|
"eval_samples_per_second": 405.598, |
|
"eval_steps_per_second": 25.532, |
|
"step": 58440 |
|
}, |
|
{ |
|
"epoch": 120.0, |
|
"step": 58440, |
|
"total_flos": 1.220726808511488e+17, |
|
"train_loss": 0.04618847079620959, |
|
"train_runtime": 7270.5358, |
|
"train_samples_per_second": 128.491, |
|
"train_steps_per_second": 8.038 |
|
} |
|
], |
|
"max_steps": 58440, |
|
"num_train_epochs": 120, |
|
"total_flos": 1.220726808511488e+17, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|