|
{ |
|
"best_metric": 0.2930234372615814, |
|
"best_model_checkpoint": "hf-ner-sample_004-gbert-large.model/checkpoint-115", |
|
"epoch": 5.0, |
|
"eval_steps": 500, |
|
"global_step": 115, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_f1": 0.3486529318541997, |
|
"eval_loss": 0.8595609068870544, |
|
"eval_precision": 0.32934131736526945, |
|
"eval_recall": 0.37037037037037035, |
|
"eval_runtime": 1.0185, |
|
"eval_samples_per_second": 57.93, |
|
"eval_steps_per_second": 2.946, |
|
"step": 23 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_f1": 0.6369230769230769, |
|
"eval_loss": 0.47271719574928284, |
|
"eval_precision": 0.5864022662889519, |
|
"eval_recall": 0.696969696969697, |
|
"eval_runtime": 0.9355, |
|
"eval_samples_per_second": 63.071, |
|
"eval_steps_per_second": 3.207, |
|
"step": 46 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_f1": 0.7248764415156508, |
|
"eval_loss": 0.33701092004776, |
|
"eval_precision": 0.7096774193548387, |
|
"eval_recall": 0.7407407407407407, |
|
"eval_runtime": 0.9711, |
|
"eval_samples_per_second": 60.758, |
|
"eval_steps_per_second": 3.089, |
|
"step": 69 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_f1": 0.765472312703583, |
|
"eval_loss": 0.296609491109848, |
|
"eval_precision": 0.7413249211356467, |
|
"eval_recall": 0.7912457912457912, |
|
"eval_runtime": 0.9576, |
|
"eval_samples_per_second": 61.61, |
|
"eval_steps_per_second": 3.133, |
|
"step": 92 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_f1": 0.7568438003220611, |
|
"eval_loss": 0.2930234372615814, |
|
"eval_precision": 0.7253086419753086, |
|
"eval_recall": 0.7912457912457912, |
|
"eval_runtime": 0.9995, |
|
"eval_samples_per_second": 59.03, |
|
"eval_steps_per_second": 3.002, |
|
"step": 115 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 230, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 10, |
|
"save_steps": 500, |
|
"stateful_callbacks": { |
|
"TrainerControl": { |
|
"args": { |
|
"should_epoch_stop": false, |
|
"should_evaluate": false, |
|
"should_log": false, |
|
"should_save": true, |
|
"should_training_stop": false |
|
}, |
|
"attributes": {} |
|
} |
|
}, |
|
"total_flos": 555656517635304.0, |
|
"train_batch_size": 24, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|