Update checkpoint to step 10100
Browse files- trainer_state.json +1 -1
- training_log.json +64 -0
trainer_state.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"global_step":
|
|
|
1 |
+
{"global_step": 10100}
|
training_log.json
CHANGED
@@ -6398,5 +6398,69 @@
|
|
6398 |
{
|
6399 |
"step": 10000,
|
6400 |
"val_loss": 7.314393242200215
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
6401 |
}
|
6402 |
]
|
|
|
6398 |
{
|
6399 |
"step": 10000,
|
6400 |
"val_loss": 7.314393242200215
|
6401 |
+
},
|
6402 |
+
{
|
6403 |
+
"step": 10010,
|
6404 |
+
"train_loss": 7.3590466439723965,
|
6405 |
+
"lr": 4.974824120603016e-05,
|
6406 |
+
"epoch": 1
|
6407 |
+
},
|
6408 |
+
{
|
6409 |
+
"step": 10020,
|
6410 |
+
"train_loss": 7.403801316022873,
|
6411 |
+
"lr": 4.974773869346734e-05,
|
6412 |
+
"epoch": 1
|
6413 |
+
},
|
6414 |
+
{
|
6415 |
+
"step": 10030,
|
6416 |
+
"train_loss": 7.375410264730453,
|
6417 |
+
"lr": 4.974723618090453e-05,
|
6418 |
+
"epoch": 1
|
6419 |
+
},
|
6420 |
+
{
|
6421 |
+
"step": 10040,
|
6422 |
+
"train_loss": 7.343051743507385,
|
6423 |
+
"lr": 4.974673366834171e-05,
|
6424 |
+
"epoch": 1
|
6425 |
+
},
|
6426 |
+
{
|
6427 |
+
"step": 10050,
|
6428 |
+
"train_loss": 7.365369713306427,
|
6429 |
+
"lr": 4.97462311557789e-05,
|
6430 |
+
"epoch": 1
|
6431 |
+
},
|
6432 |
+
{
|
6433 |
+
"step": 10060,
|
6434 |
+
"train_loss": 7.386003789305687,
|
6435 |
+
"lr": 4.974572864321608e-05,
|
6436 |
+
"epoch": 1
|
6437 |
+
},
|
6438 |
+
{
|
6439 |
+
"step": 10070,
|
6440 |
+
"train_loss": 7.346861115097999,
|
6441 |
+
"lr": 4.9745226130653264e-05,
|
6442 |
+
"epoch": 1
|
6443 |
+
},
|
6444 |
+
{
|
6445 |
+
"step": 10080,
|
6446 |
+
"train_loss": 7.371396270394325,
|
6447 |
+
"lr": 4.974472361809045e-05,
|
6448 |
+
"epoch": 1
|
6449 |
+
},
|
6450 |
+
{
|
6451 |
+
"step": 10090,
|
6452 |
+
"train_loss": 7.349104163050652,
|
6453 |
+
"lr": 4.974422110552764e-05,
|
6454 |
+
"epoch": 1
|
6455 |
+
},
|
6456 |
+
{
|
6457 |
+
"step": 10100,
|
6458 |
+
"train_loss": 7.353458693623542,
|
6459 |
+
"lr": 4.974371859296483e-05,
|
6460 |
+
"epoch": 1
|
6461 |
+
},
|
6462 |
+
{
|
6463 |
+
"step": 10100,
|
6464 |
+
"val_loss": 7.300538818041484
|
6465 |
}
|
6466 |
]
|