Training in progress, epoch 24
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c423e46d21dd651e93994a77cb57436a04e15c2ea704fa90d9f8cc4e23cf18fc
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c27e7a00ae5152328e38d6891a5a934b389633a33a4da7ad1e9235a97da36c1
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90d4fcc4e9b32dc44372d851e07ea94edb013d04d1ee81849b536b2a6e63fbe7
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:498dbc192a60766292f27930335619a72f681cf62eabdc2982cefbe3093ffee8
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -420,3 +420,18 @@
|
|
420 |
{"current_steps": 3970, "total_steps": 4125, "loss": 0.018, "lr": 5e-06, "epoch": 23.9336850037679, "percentage": 96.24, "elapsed_time": "1 day, 13:20:10", "remaining_time": "1:27:27"}
|
421 |
{"current_steps": 3980, "total_steps": 4125, "loss": 0.0186, "lr": 5e-06, "epoch": 23.9939713639789, "percentage": 96.48, "elapsed_time": "1 day, 13:25:32", "remaining_time": "1:21:48"}
|
422 |
{"current_steps": 3981, "total_steps": 4125, "eval_loss": 2.3888232707977295, "epoch": 24.0, "percentage": 96.51, "elapsed_time": "1 day, 13:27:59", "remaining_time": "1:21:18"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
420 |
{"current_steps": 3970, "total_steps": 4125, "loss": 0.018, "lr": 5e-06, "epoch": 23.9336850037679, "percentage": 96.24, "elapsed_time": "1 day, 13:20:10", "remaining_time": "1:27:27"}
|
421 |
{"current_steps": 3980, "total_steps": 4125, "loss": 0.0186, "lr": 5e-06, "epoch": 23.9939713639789, "percentage": 96.48, "elapsed_time": "1 day, 13:25:32", "remaining_time": "1:21:48"}
|
422 |
{"current_steps": 3981, "total_steps": 4125, "eval_loss": 2.3888232707977295, "epoch": 24.0, "percentage": 96.51, "elapsed_time": "1 day, 13:27:59", "remaining_time": "1:21:18"}
|
423 |
+
{"current_steps": 3990, "total_steps": 4125, "loss": 0.0141, "lr": 5e-06, "epoch": 24.054257724189902, "percentage": 96.73, "elapsed_time": "1 day, 13:34:34", "remaining_time": "1:16:16"}
|
424 |
+
{"current_steps": 4000, "total_steps": 4125, "loss": 0.0141, "lr": 5e-06, "epoch": 24.114544084400904, "percentage": 96.97, "elapsed_time": "1 day, 13:39:57", "remaining_time": "1:10:37"}
|
425 |
+
{"current_steps": 4010, "total_steps": 4125, "loss": 0.0144, "lr": 5e-06, "epoch": 24.174830444611906, "percentage": 97.21, "elapsed_time": "1 day, 13:45:20", "remaining_time": "1:04:57"}
|
426 |
+
{"current_steps": 4020, "total_steps": 4125, "loss": 0.0148, "lr": 5e-06, "epoch": 24.23511680482291, "percentage": 97.45, "elapsed_time": "1 day, 13:50:45", "remaining_time": "0:59:18"}
|
427 |
+
{"current_steps": 4030, "total_steps": 4125, "loss": 0.0151, "lr": 5e-06, "epoch": 24.29540316503391, "percentage": 97.7, "elapsed_time": "1 day, 13:56:08", "remaining_time": "0:53:39"}
|
428 |
+
{"current_steps": 4040, "total_steps": 4125, "loss": 0.0156, "lr": 5e-06, "epoch": 24.355689525244912, "percentage": 97.94, "elapsed_time": "1 day, 14:01:30", "remaining_time": "0:48:00"}
|
429 |
+
{"current_steps": 4050, "total_steps": 4125, "loss": 0.0154, "lr": 5e-06, "epoch": 24.415975885455914, "percentage": 98.18, "elapsed_time": "1 day, 14:06:53", "remaining_time": "0:42:20"}
|
430 |
+
{"current_steps": 4060, "total_steps": 4125, "loss": 0.0159, "lr": 5e-06, "epoch": 24.476262245666916, "percentage": 98.42, "elapsed_time": "1 day, 14:12:17", "remaining_time": "0:36:41"}
|
431 |
+
{"current_steps": 4070, "total_steps": 4125, "loss": 0.0157, "lr": 5e-06, "epoch": 24.53654860587792, "percentage": 98.67, "elapsed_time": "1 day, 14:17:39", "remaining_time": "0:31:02"}
|
432 |
+
{"current_steps": 4080, "total_steps": 4125, "loss": 0.0158, "lr": 5e-06, "epoch": 24.596834966088924, "percentage": 98.91, "elapsed_time": "1 day, 14:23:03", "remaining_time": "0:25:24"}
|
433 |
+
{"current_steps": 4090, "total_steps": 4125, "loss": 0.0163, "lr": 5e-06, "epoch": 24.657121326299926, "percentage": 99.15, "elapsed_time": "1 day, 14:28:26", "remaining_time": "0:19:45"}
|
434 |
+
{"current_steps": 4100, "total_steps": 4125, "loss": 0.0164, "lr": 5e-06, "epoch": 24.717407686510928, "percentage": 99.39, "elapsed_time": "1 day, 14:33:50", "remaining_time": "0:14:06"}
|
435 |
+
{"current_steps": 4110, "total_steps": 4125, "loss": 0.0166, "lr": 5e-06, "epoch": 24.77769404672193, "percentage": 99.64, "elapsed_time": "1 day, 14:39:14", "remaining_time": "0:08:27"}
|
436 |
+
{"current_steps": 4120, "total_steps": 4125, "loss": 0.0169, "lr": 5e-06, "epoch": 24.83798040693293, "percentage": 99.88, "elapsed_time": "1 day, 14:44:34", "remaining_time": "0:02:49"}
|
437 |
+
{"current_steps": 4125, "total_steps": 4125, "eval_loss": 2.4057514667510986, "epoch": 24.868123587038433, "percentage": 100.0, "elapsed_time": "1 day, 14:50:50", "remaining_time": "0:00:00"}
|