Rodrigo1771's picture
Training in progress, epoch 1
6bb1803 verified
raw
history blame
5.35 kB
{
"best_metric": 0.6946045049764275,
"best_model_checkpoint": "/content/dissertation/scripts/ner/output/checkpoint-1088",
"epoch": 9.967845659163988,
"eval_steps": 500,
"global_step": 1550,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.9967845659163987,
"eval_accuracy": 0.9435978055118868,
"eval_f1": 0.593056643174106,
"eval_loss": 0.14849668741226196,
"eval_precision": 0.5668662674650699,
"eval_recall": 0.6217843459222769,
"eval_runtime": 5.8633,
"eval_samples_per_second": 429.618,
"eval_steps_per_second": 53.724,
"step": 155
},
{
"epoch": 2.0,
"eval_accuracy": 0.9408546953704001,
"eval_f1": 0.6299060919817,
"eval_loss": 0.16094118356704712,
"eval_precision": 0.5623387790197765,
"eval_recall": 0.715927750410509,
"eval_runtime": 5.9155,
"eval_samples_per_second": 425.831,
"eval_steps_per_second": 53.25,
"step": 311
},
{
"epoch": 2.996784565916399,
"eval_accuracy": 0.9486669447207161,
"eval_f1": 0.6676790685902303,
"eval_loss": 0.1634686440229416,
"eval_precision": 0.6209981167608286,
"eval_recall": 0.7219485495347564,
"eval_runtime": 5.9009,
"eval_samples_per_second": 426.884,
"eval_steps_per_second": 53.382,
"step": 466
},
{
"epoch": 3.215434083601286,
"grad_norm": 0.9288749098777771,
"learning_rate": 3.387096774193548e-05,
"loss": 0.1246,
"step": 500
},
{
"epoch": 4.0,
"eval_accuracy": 0.9492604831723828,
"eval_f1": 0.6711919630735812,
"eval_loss": 0.20466655492782593,
"eval_precision": 0.665948275862069,
"eval_recall": 0.6765188834154351,
"eval_runtime": 5.9155,
"eval_samples_per_second": 425.831,
"eval_steps_per_second": 53.25,
"step": 622
},
{
"epoch": 4.996784565916399,
"eval_accuracy": 0.9479771567904007,
"eval_f1": 0.6827731092436975,
"eval_loss": 0.2133806049823761,
"eval_precision": 0.6562342251388188,
"eval_recall": 0.7115489874110563,
"eval_runtime": 5.8759,
"eval_samples_per_second": 428.701,
"eval_steps_per_second": 53.609,
"step": 777
},
{
"epoch": 6.0,
"eval_accuracy": 0.949388815810581,
"eval_f1": 0.6795913020696882,
"eval_loss": 0.2258971482515335,
"eval_precision": 0.6517587939698493,
"eval_recall": 0.7099069512862616,
"eval_runtime": 5.9106,
"eval_samples_per_second": 426.187,
"eval_steps_per_second": 53.294,
"step": 933
},
{
"epoch": 6.430868167202572,
"grad_norm": 0.18494442105293274,
"learning_rate": 1.774193548387097e-05,
"loss": 0.0242,
"step": 1000
},
{
"epoch": 6.996784565916399,
"eval_accuracy": 0.9496615226667522,
"eval_f1": 0.6946045049764275,
"eval_loss": 0.24502409994602203,
"eval_precision": 0.6659969864389754,
"eval_recall": 0.7257799671592775,
"eval_runtime": 5.8918,
"eval_samples_per_second": 427.542,
"eval_steps_per_second": 53.464,
"step": 1088
},
{
"epoch": 8.0,
"eval_accuracy": 0.9490679842150855,
"eval_f1": 0.6841015018125324,
"eval_loss": 0.26501980423927307,
"eval_precision": 0.6491400491400492,
"eval_recall": 0.7230432402846196,
"eval_runtime": 5.9184,
"eval_samples_per_second": 425.624,
"eval_steps_per_second": 53.224,
"step": 1244
},
{
"epoch": 8.996784565916398,
"eval_accuracy": 0.9497577721454009,
"eval_f1": 0.687797147385103,
"eval_loss": 0.27453720569610596,
"eval_precision": 0.664624808575804,
"eval_recall": 0.7126436781609196,
"eval_runtime": 5.9283,
"eval_samples_per_second": 424.913,
"eval_steps_per_second": 53.135,
"step": 1399
},
{
"epoch": 9.646302250803858,
"grad_norm": 0.35425594449043274,
"learning_rate": 1.6129032258064516e-06,
"loss": 0.0083,
"step": 1500
},
{
"epoch": 9.967845659163988,
"eval_accuracy": 0.950255061118419,
"eval_f1": 0.6896008403361344,
"eval_loss": 0.27744925022125244,
"eval_precision": 0.662796567390207,
"eval_recall": 0.7186644772851669,
"eval_runtime": 6.1493,
"eval_samples_per_second": 409.643,
"eval_steps_per_second": 51.226,
"step": 1550
},
{
"epoch": 9.967845659163988,
"step": 1550,
"total_flos": 4644619911314910.0,
"train_loss": 0.050868147861573,
"train_runtime": 855.1929,
"train_samples_per_second": 116.102,
"train_steps_per_second": 1.812
}
],
"logging_steps": 500,
"max_steps": 1550,
"num_input_tokens_seen": 0,
"num_train_epochs": 10,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 4644619911314910.0,
"train_batch_size": 32,
"trial_name": null,
"trial_params": null
}