File size: 1,683 Bytes
b557d4a 0486018 b557d4a 0486018 b557d4a 0486018 b557d4a 0486018 b557d4a 0486018 b557d4a 0486018 b557d4a 0486018 b557d4a 0486018 b557d4a 0486018 b557d4a 0486018 b557d4a 0486018 b557d4a 0486018 b557d4a 0486018 b557d4a 0486018 b557d4a |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 |
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 0.03031705623698218,
"global_step": 262,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.0,
"learning_rate": 1.9997685720897943e-05,
"loss": 2.316,
"step": 1
},
{
"epoch": 0.0,
"learning_rate": 1.993982874334645e-05,
"loss": 3.0145,
"step": 26
},
{
"epoch": 0.01,
"learning_rate": 1.9881971765794957e-05,
"loss": 2.9775,
"step": 52
},
{
"epoch": 0.01,
"learning_rate": 1.9821800509141405e-05,
"loss": 2.9141,
"step": 78
},
{
"epoch": 0.01,
"learning_rate": 1.976162925248785e-05,
"loss": 2.8213,
"step": 104
},
{
"epoch": 0.02,
"learning_rate": 1.9701457995834298e-05,
"loss": 2.8003,
"step": 130
},
{
"epoch": 0.02,
"learning_rate": 1.9641286739180746e-05,
"loss": 2.8823,
"step": 156
},
{
"epoch": 0.02,
"learning_rate": 1.9581115482527195e-05,
"loss": 2.8253,
"step": 182
},
{
"epoch": 0.02,
"learning_rate": 1.9520944225873643e-05,
"loss": 2.7823,
"step": 208
},
{
"epoch": 0.03,
"learning_rate": 1.946077296922009e-05,
"loss": 2.7374,
"step": 234
},
{
"epoch": 0.03,
"learning_rate": 1.9402915991668595e-05,
"loss": 2.8325,
"step": 260
}
],
"max_steps": 8642,
"num_train_epochs": 1,
"total_flos": 487908402266112.0,
"trial_name": null,
"trial_params": null
}
|