|
{ |
|
"best_metric": 0.13593988120555878, |
|
"best_model_checkpoint": "/home/sdonoso/data/all_results/ner-c/distillbert/epochs_4_bs_64_lr_5e-5/checkpoint-500", |
|
"epoch": 4.0, |
|
"global_step": 524, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.76, |
|
"eval_accuracy": 0.9476202751909258, |
|
"eval_f1": 0.7172177028136428, |
|
"eval_loss": 0.1729145497083664, |
|
"eval_precision": 0.7087020648967551, |
|
"eval_recall": 0.7259404743919021, |
|
"eval_runtime": 1.7788, |
|
"eval_samples_per_second": 1077.132, |
|
"eval_steps_per_second": 16.865, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 1.53, |
|
"eval_accuracy": 0.9522766087713079, |
|
"eval_f1": 0.7523824162311713, |
|
"eval_loss": 0.1584220975637436, |
|
"eval_precision": 0.765681213827624, |
|
"eval_recall": 0.7395376945157879, |
|
"eval_runtime": 1.776, |
|
"eval_samples_per_second": 1078.832, |
|
"eval_steps_per_second": 16.892, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 2.29, |
|
"eval_accuracy": 0.9581574453001643, |
|
"eval_f1": 0.7900313386061781, |
|
"eval_loss": 0.13973243534564972, |
|
"eval_precision": 0.7804806132979507, |
|
"eval_recall": 0.7998187037316815, |
|
"eval_runtime": 1.7908, |
|
"eval_samples_per_second": 1069.888, |
|
"eval_steps_per_second": 16.752, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 3.05, |
|
"eval_accuracy": 0.9592047175587278, |
|
"eval_f1": 0.7948698717467937, |
|
"eval_loss": 0.1360633671283722, |
|
"eval_precision": 0.7892463509085493, |
|
"eval_recall": 0.8005741048496752, |
|
"eval_runtime": 1.7307, |
|
"eval_samples_per_second": 1107.051, |
|
"eval_steps_per_second": 17.334, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 3.82, |
|
"learning_rate": 2.5763358778625957e-06, |
|
"loss": 0.1581, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 3.82, |
|
"eval_accuracy": 0.9594786195340445, |
|
"eval_f1": 0.7985358930305521, |
|
"eval_loss": 0.13593988120555878, |
|
"eval_precision": 0.7897458628841607, |
|
"eval_recall": 0.8075237951352168, |
|
"eval_runtime": 1.769, |
|
"eval_samples_per_second": 1083.1, |
|
"eval_steps_per_second": 16.959, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"step": 524, |
|
"total_flos": 997670842354368.0, |
|
"train_loss": 0.15398232195213551, |
|
"train_runtime": 729.0203, |
|
"train_samples_per_second": 45.672, |
|
"train_steps_per_second": 0.719 |
|
} |
|
], |
|
"max_steps": 524, |
|
"num_train_epochs": 4, |
|
"total_flos": 997670842354368.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|