Update checkpoint to step 10000
Browse files- trainer_state.json +1 -1
- training_log.json +64 -0
trainer_state.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"global_step":
|
|
|
1 |
+
{"global_step": 10000}
|
training_log.json
CHANGED
@@ -6334,5 +6334,69 @@
|
|
6334 |
{
|
6335 |
"step": 9900,
|
6336 |
"val_loss": 7.325656294822693
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
6337 |
}
|
6338 |
]
|
|
|
6334 |
{
|
6335 |
"step": 9900,
|
6336 |
"val_loss": 7.325656294822693
|
6337 |
+
},
|
6338 |
+
{
|
6339 |
+
"step": 9910,
|
6340 |
+
"train_loss": 7.333984071016312,
|
6341 |
+
"lr": 4.9753266331658295e-05,
|
6342 |
+
"epoch": 1
|
6343 |
+
},
|
6344 |
+
{
|
6345 |
+
"step": 9920,
|
6346 |
+
"train_loss": 7.407251310348511,
|
6347 |
+
"lr": 4.975276381909548e-05,
|
6348 |
+
"epoch": 1
|
6349 |
+
},
|
6350 |
+
{
|
6351 |
+
"step": 9930,
|
6352 |
+
"train_loss": 7.3805774509906765,
|
6353 |
+
"lr": 4.9752261306532667e-05,
|
6354 |
+
"epoch": 1
|
6355 |
+
},
|
6356 |
+
{
|
6357 |
+
"step": 9940,
|
6358 |
+
"train_loss": 7.349178448319435,
|
6359 |
+
"lr": 4.975175879396985e-05,
|
6360 |
+
"epoch": 1
|
6361 |
+
},
|
6362 |
+
{
|
6363 |
+
"step": 9950,
|
6364 |
+
"train_loss": 7.3482857018709185,
|
6365 |
+
"lr": 4.975125628140704e-05,
|
6366 |
+
"epoch": 1
|
6367 |
+
},
|
6368 |
+
{
|
6369 |
+
"step": 9960,
|
6370 |
+
"train_loss": 7.382177627086639,
|
6371 |
+
"lr": 4.975075376884422e-05,
|
6372 |
+
"epoch": 1
|
6373 |
+
},
|
6374 |
+
{
|
6375 |
+
"step": 9970,
|
6376 |
+
"train_loss": 7.363121953606606,
|
6377 |
+
"lr": 4.975025125628141e-05,
|
6378 |
+
"epoch": 1
|
6379 |
+
},
|
6380 |
+
{
|
6381 |
+
"step": 9980,
|
6382 |
+
"train_loss": 7.388920494914055,
|
6383 |
+
"lr": 4.974974874371859e-05,
|
6384 |
+
"epoch": 1
|
6385 |
+
},
|
6386 |
+
{
|
6387 |
+
"step": 9990,
|
6388 |
+
"train_loss": 7.371771231293678,
|
6389 |
+
"lr": 4.974924623115578e-05,
|
6390 |
+
"epoch": 1
|
6391 |
+
},
|
6392 |
+
{
|
6393 |
+
"step": 10000,
|
6394 |
+
"train_loss": 7.354285871982574,
|
6395 |
+
"lr": 4.974874371859297e-05,
|
6396 |
+
"epoch": 1
|
6397 |
+
},
|
6398 |
+
{
|
6399 |
+
"step": 10000,
|
6400 |
+
"val_loss": 7.314393242200215
|
6401 |
}
|
6402 |
]
|