rankers / ranker_6 /checkpoint-200 /trainer_state.json
minimario's picture
add rankers
1ef15eb
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 0.23873470605789315,
"global_step": 200,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.01,
"learning_rate": 9.994026284348866e-05,
"loss": 0.7347,
"step": 5
},
{
"epoch": 0.01,
"learning_rate": 9.98805256869773e-05,
"loss": 0.6862,
"step": 10
},
{
"epoch": 0.02,
"learning_rate": 9.982078853046596e-05,
"loss": 0.6505,
"step": 15
},
{
"epoch": 0.02,
"learning_rate": 9.97610513739546e-05,
"loss": 0.6177,
"step": 20
},
{
"epoch": 0.03,
"learning_rate": 9.970131421744326e-05,
"loss": 0.5992,
"step": 25
},
{
"epoch": 0.04,
"learning_rate": 9.96415770609319e-05,
"loss": 0.5671,
"step": 30
},
{
"epoch": 0.04,
"learning_rate": 9.958183990442056e-05,
"loss": 0.5407,
"step": 35
},
{
"epoch": 0.05,
"learning_rate": 9.952210274790921e-05,
"loss": 0.5186,
"step": 40
},
{
"epoch": 0.05,
"learning_rate": 9.946236559139786e-05,
"loss": 0.5068,
"step": 45
},
{
"epoch": 0.06,
"learning_rate": 9.940262843488651e-05,
"loss": 0.5162,
"step": 50
},
{
"epoch": 0.07,
"learning_rate": 9.934289127837514e-05,
"loss": 0.527,
"step": 55
},
{
"epoch": 0.07,
"learning_rate": 9.928315412186381e-05,
"loss": 0.4849,
"step": 60
},
{
"epoch": 0.08,
"learning_rate": 9.922341696535246e-05,
"loss": 0.477,
"step": 65
},
{
"epoch": 0.08,
"learning_rate": 9.916367980884111e-05,
"loss": 0.4702,
"step": 70
},
{
"epoch": 0.09,
"learning_rate": 9.910394265232975e-05,
"loss": 0.4504,
"step": 75
},
{
"epoch": 0.1,
"learning_rate": 9.90442054958184e-05,
"loss": 0.4422,
"step": 80
},
{
"epoch": 0.1,
"learning_rate": 9.898446833930706e-05,
"loss": 0.4383,
"step": 85
},
{
"epoch": 0.11,
"learning_rate": 9.892473118279571e-05,
"loss": 0.4356,
"step": 90
},
{
"epoch": 0.11,
"learning_rate": 9.886499402628435e-05,
"loss": 0.4446,
"step": 95
},
{
"epoch": 0.12,
"learning_rate": 9.8805256869773e-05,
"loss": 0.4251,
"step": 100
},
{
"epoch": 0.13,
"learning_rate": 9.874551971326166e-05,
"loss": 0.4201,
"step": 105
},
{
"epoch": 0.13,
"learning_rate": 9.868578255675031e-05,
"loss": 0.4389,
"step": 110
},
{
"epoch": 0.14,
"learning_rate": 9.862604540023895e-05,
"loss": 0.4319,
"step": 115
},
{
"epoch": 0.14,
"learning_rate": 9.85663082437276e-05,
"loss": 0.455,
"step": 120
},
{
"epoch": 0.15,
"learning_rate": 9.850657108721625e-05,
"loss": 0.4297,
"step": 125
},
{
"epoch": 0.16,
"learning_rate": 9.844683393070491e-05,
"loss": 0.4383,
"step": 130
},
{
"epoch": 0.16,
"learning_rate": 9.838709677419355e-05,
"loss": 0.4658,
"step": 135
},
{
"epoch": 0.17,
"learning_rate": 9.83273596176822e-05,
"loss": 0.4499,
"step": 140
},
{
"epoch": 0.17,
"learning_rate": 9.826762246117085e-05,
"loss": 0.41,
"step": 145
},
{
"epoch": 0.18,
"learning_rate": 9.820788530465951e-05,
"loss": 0.3866,
"step": 150
},
{
"epoch": 0.19,
"learning_rate": 9.814814814814815e-05,
"loss": 0.3897,
"step": 155
},
{
"epoch": 0.19,
"learning_rate": 9.80884109916368e-05,
"loss": 0.4053,
"step": 160
},
{
"epoch": 0.2,
"learning_rate": 9.802867383512545e-05,
"loss": 0.4022,
"step": 165
},
{
"epoch": 0.2,
"learning_rate": 9.79689366786141e-05,
"loss": 0.4074,
"step": 170
},
{
"epoch": 0.21,
"learning_rate": 9.790919952210275e-05,
"loss": 0.4,
"step": 175
},
{
"epoch": 0.21,
"learning_rate": 9.78494623655914e-05,
"loss": 0.4282,
"step": 180
},
{
"epoch": 0.22,
"learning_rate": 9.778972520908005e-05,
"loss": 0.4028,
"step": 185
},
{
"epoch": 0.23,
"learning_rate": 9.77299880525687e-05,
"loss": 0.3937,
"step": 190
},
{
"epoch": 0.23,
"learning_rate": 9.767025089605735e-05,
"loss": 0.3665,
"step": 195
},
{
"epoch": 0.24,
"learning_rate": 9.7610513739546e-05,
"loss": 0.3743,
"step": 200
},
{
"epoch": 0.24,
"eval_accuracy": 0.7354377926759424,
"eval_accuracy_sklearn": 0.7354377926759424,
"eval_f1": 0.7483577402505849,
"eval_loss": 0.5406955480575562,
"eval_precision": 0.8060886373049841,
"eval_recall": 0.6983434005143233,
"eval_runtime": 162.5908,
"eval_samples_per_second": 182.563,
"eval_steps_per_second": 11.415,
"step": 200
}
],
"max_steps": 8370,
"num_train_epochs": 10,
"total_flos": 2.6942572068864e+16,
"trial_name": null,
"trial_params": null
}