Training in progress, step 55400, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1261,6 +1261,10 @@ You can finetune this model on your own dataset.
|
|
| 1261 |
| 0.9737 | 55100 | 0.2965 |
|
| 1262 |
| 0.9745 | 55150 | 0.2382 |
|
| 1263 |
| 0.9754 | 55200 | 0.3863 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1264 |
|
| 1265 |
|
| 1266 |
### Framework Versions
|
|
|
|
| 1261 |
| 0.9737 | 55100 | 0.2965 |
|
| 1262 |
| 0.9745 | 55150 | 0.2382 |
|
| 1263 |
| 0.9754 | 55200 | 0.3863 |
|
| 1264 |
+
| 0.9763 | 55250 | 0.2909 |
|
| 1265 |
+
| 0.9772 | 55300 | 0.3787 |
|
| 1266 |
+
| 0.9781 | 55350 | 0.3196 |
|
| 1267 |
+
| 0.9790 | 55400 | 0.3738 |
|
| 1268 |
|
| 1269 |
|
| 1270 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e7e0a1455740180aedb80f8bb0aec516cb7153da241701244132cb399617a794
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f3a83cdaa07d04d231b900b829ca00bf94bbd812391baa3af8be0f339dc5c09a
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7c32e0fe828ffd94931d917ede7d98af8f116069bcef2571793c504c5a05f607
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:380ffdc8abce86595967f2c6febf85c303c1ae3d84e66897af982ed22c990884
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:67d3a94240ec5e377beed092b82635ec739c5c48243fbb51753d92a8d8f55ac7
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -7736,6 +7736,34 @@
|
|
| 7736 |
"learning_rate": 1.388152598613811e-06,
|
| 7737 |
"loss": 0.3863,
|
| 7738 |
"step": 55200
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 7739 |
}
|
| 7740 |
],
|
| 7741 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.9789542506759026,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 55400,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 7736 |
"learning_rate": 1.388152598613811e-06,
|
| 7737 |
"loss": 0.3863,
|
| 7738 |
"step": 55200
|
| 7739 |
+
},
|
| 7740 |
+
{
|
| 7741 |
+
"epoch": 0.976303652524253,
|
| 7742 |
+
"grad_norm": 1.0731230974197388,
|
| 7743 |
+
"learning_rate": 1.3390665802752744e-06,
|
| 7744 |
+
"loss": 0.2909,
|
| 7745 |
+
"step": 55250
|
| 7746 |
+
},
|
| 7747 |
+
{
|
| 7748 |
+
"epoch": 0.9771871852414695,
|
| 7749 |
+
"grad_norm": 1.6253186464309692,
|
| 7750 |
+
"learning_rate": 1.289980561936738e-06,
|
| 7751 |
+
"loss": 0.3787,
|
| 7752 |
+
"step": 55300
|
| 7753 |
+
},
|
| 7754 |
+
{
|
| 7755 |
+
"epoch": 0.978070717958686,
|
| 7756 |
+
"grad_norm": 1.9667285680770874,
|
| 7757 |
+
"learning_rate": 1.2408945435982016e-06,
|
| 7758 |
+
"loss": 0.3196,
|
| 7759 |
+
"step": 55350
|
| 7760 |
+
},
|
| 7761 |
+
{
|
| 7762 |
+
"epoch": 0.9789542506759026,
|
| 7763 |
+
"grad_norm": 1.1798194646835327,
|
| 7764 |
+
"learning_rate": 1.191808525259665e-06,
|
| 7765 |
+
"loss": 0.3738,
|
| 7766 |
+
"step": 55400
|
| 7767 |
}
|
| 7768 |
],
|
| 7769 |
"logging_steps": 50,
|