Training in progress, step 51800, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
@@ -1189,10 +1189,10 @@ You can finetune this model on your own dataset.
|
|
1189 |
### Training Logs
|
1190 |
| Epoch | Step | Training Loss |
|
1191 |
|:------:|:-----:|:-------------:|
|
1192 |
-
| 0.
|
1193 |
-
| 0.
|
1194 |
-
| 0.
|
1195 |
-
| 0.
|
1196 |
|
1197 |
|
1198 |
### Framework Versions
|
|
|
1189 |
### Training Logs
|
1190 |
| Epoch | Step | Training Loss |
|
1191 |
|:------:|:-----:|:-------------:|
|
1192 |
+
| 0.9127 | 51650 | 0.2493 |
|
1193 |
+
| 0.9136 | 51700 | 0.3088 |
|
1194 |
+
| 0.9145 | 51750 | 0.2287 |
|
1195 |
+
| 0.9153 | 51800 | 0.2067 |
|
1196 |
|
1197 |
|
1198 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 90864192
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8adbf03525b39d3cbba1bbdde2da90cb7be2d698601f862e040d6383edf785e8
|
3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 180609210
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ddba7d83c634a4905db07a12f6761ec90e0847d3c3a75cb805e5a2c45f6f055e
|
3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14244
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed3acf2d762800b6693f2eadfe02d38f79ee54f3a4fcf7d7f00a5e20954d4a73
|
3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 988
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e37c94dad9c27aa070c66f020f85050e7628adbe8df381c470c2f01ed333d243
|
3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad4fc38cbd3a40df512cafd836390b147d408874f4ecc602c76931ee4bd316f8
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -2,9 +2,9 @@
|
|
2 |
"best_global_step": null,
|
3 |
"best_metric": null,
|
4 |
"best_model_checkpoint": null,
|
5 |
-
"epoch": 0.
|
6 |
"eval_steps": 500,
|
7 |
-
"global_step":
|
8 |
"is_hyper_param_search": false,
|
9 |
"is_local_process_zero": true,
|
10 |
"is_world_process_zero": true,
|
@@ -7232,6 +7232,34 @@
|
|
7232 |
"learning_rate": 4.920382478254894e-06,
|
7233 |
"loss": 0.3295,
|
7234 |
"step": 51600
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
7235 |
}
|
7236 |
],
|
7237 |
"logging_steps": 50,
|
|
|
2 |
"best_global_step": null,
|
3 |
"best_metric": null,
|
4 |
"best_model_checkpoint": null,
|
5 |
+
"epoch": 0.9153398950363132,
|
6 |
"eval_steps": 500,
|
7 |
+
"global_step": 51800,
|
8 |
"is_hyper_param_search": false,
|
9 |
"is_local_process_zero": true,
|
10 |
"is_world_process_zero": true,
|
|
|
7232 |
"learning_rate": 4.920382478254894e-06,
|
7233 |
"loss": 0.3295,
|
7234 |
"step": 51600
|
7235 |
+
},
|
7236 |
+
{
|
7237 |
+
"epoch": 0.9126892968846636,
|
7238 |
+
"grad_norm": 1.4896866083145142,
|
7239 |
+
"learning_rate": 4.871296459916358e-06,
|
7240 |
+
"loss": 0.2493,
|
7241 |
+
"step": 51650
|
7242 |
+
},
|
7243 |
+
{
|
7244 |
+
"epoch": 0.9135728296018801,
|
7245 |
+
"grad_norm": 4.590723037719727,
|
7246 |
+
"learning_rate": 4.8222104415778216e-06,
|
7247 |
+
"loss": 0.3088,
|
7248 |
+
"step": 51700
|
7249 |
+
},
|
7250 |
+
{
|
7251 |
+
"epoch": 0.9144563623190967,
|
7252 |
+
"grad_norm": 1.653506875038147,
|
7253 |
+
"learning_rate": 4.7731244232392845e-06,
|
7254 |
+
"loss": 0.2287,
|
7255 |
+
"step": 51750
|
7256 |
+
},
|
7257 |
+
{
|
7258 |
+
"epoch": 0.9153398950363132,
|
7259 |
+
"grad_norm": 1.7086869478225708,
|
7260 |
+
"learning_rate": 4.724038404900748e-06,
|
7261 |
+
"loss": 0.2067,
|
7262 |
+
"step": 51800
|
7263 |
}
|
7264 |
],
|
7265 |
"logging_steps": 50,
|
last-checkpoint/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5560
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c6646a21e44808e01dce45e09fa7fbd1fffd2b29b00d00306ba050ea82ef5a2
|
3 |
size 5560
|