Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:177bf8229926a926ab64731991d342ceffd59dd0c05d2121d961dc4c30aa6f59
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b592e1f5b4a39683a31df53ee615b3ef83bb183e97f078e5bc0c8cba9e7c05b8
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d5bc3c5735476f56c8f354673a624b8d8d361a5bc9e86efcec89ad6efe70722a
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:25264608b27a5a4cb984833d7afe5a84b9dcb83576fe322ad7c5cdddc41ae5a5
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -63,3 +63,33 @@
|
|
63 |
{"current_steps": 612, "total_steps": 918, "eval_loss": 0.6249033808708191, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "1:03:15", "remaining_time": "0:31:37"}
|
64 |
{"current_steps": 620, "total_steps": 918, "loss": 0.5586, "learning_rate": 5e-06, "epoch": 2.026143790849673, "percentage": 67.54, "elapsed_time": "1:05:23", "remaining_time": "0:31:25"}
|
65 |
{"current_steps": 630, "total_steps": 918, "loss": 0.5407, "learning_rate": 5e-06, "epoch": 2.0588235294117645, "percentage": 68.63, "elapsed_time": "1:06:23", "remaining_time": "0:30:21"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
63 |
{"current_steps": 612, "total_steps": 918, "eval_loss": 0.6249033808708191, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "1:03:15", "remaining_time": "0:31:37"}
|
64 |
{"current_steps": 620, "total_steps": 918, "loss": 0.5586, "learning_rate": 5e-06, "epoch": 2.026143790849673, "percentage": 67.54, "elapsed_time": "1:05:23", "remaining_time": "0:31:25"}
|
65 |
{"current_steps": 630, "total_steps": 918, "loss": 0.5407, "learning_rate": 5e-06, "epoch": 2.0588235294117645, "percentage": 68.63, "elapsed_time": "1:06:23", "remaining_time": "0:30:21"}
|
66 |
+
{"current_steps": 640, "total_steps": 918, "loss": 0.5442, "learning_rate": 5e-06, "epoch": 2.0915032679738563, "percentage": 69.72, "elapsed_time": "1:07:23", "remaining_time": "0:29:16"}
|
67 |
+
{"current_steps": 650, "total_steps": 918, "loss": 0.5411, "learning_rate": 5e-06, "epoch": 2.1241830065359477, "percentage": 70.81, "elapsed_time": "1:08:23", "remaining_time": "0:28:11"}
|
68 |
+
{"current_steps": 660, "total_steps": 918, "loss": 0.5495, "learning_rate": 5e-06, "epoch": 2.156862745098039, "percentage": 71.9, "elapsed_time": "1:09:23", "remaining_time": "0:27:07"}
|
69 |
+
{"current_steps": 670, "total_steps": 918, "loss": 0.5477, "learning_rate": 5e-06, "epoch": 2.189542483660131, "percentage": 72.98, "elapsed_time": "1:10:23", "remaining_time": "0:26:03"}
|
70 |
+
{"current_steps": 680, "total_steps": 918, "loss": 0.5453, "learning_rate": 5e-06, "epoch": 2.2222222222222223, "percentage": 74.07, "elapsed_time": "1:11:24", "remaining_time": "0:24:59"}
|
71 |
+
{"current_steps": 690, "total_steps": 918, "loss": 0.5491, "learning_rate": 5e-06, "epoch": 2.2549019607843137, "percentage": 75.16, "elapsed_time": "1:12:24", "remaining_time": "0:23:55"}
|
72 |
+
{"current_steps": 700, "total_steps": 918, "loss": 0.5411, "learning_rate": 5e-06, "epoch": 2.287581699346405, "percentage": 76.25, "elapsed_time": "1:13:25", "remaining_time": "0:22:51"}
|
73 |
+
{"current_steps": 710, "total_steps": 918, "loss": 0.539, "learning_rate": 5e-06, "epoch": 2.3202614379084965, "percentage": 77.34, "elapsed_time": "1:14:25", "remaining_time": "0:21:48"}
|
74 |
+
{"current_steps": 720, "total_steps": 918, "loss": 0.546, "learning_rate": 5e-06, "epoch": 2.3529411764705883, "percentage": 78.43, "elapsed_time": "1:15:25", "remaining_time": "0:20:44"}
|
75 |
+
{"current_steps": 730, "total_steps": 918, "loss": 0.5424, "learning_rate": 5e-06, "epoch": 2.3856209150326797, "percentage": 79.52, "elapsed_time": "1:16:25", "remaining_time": "0:19:40"}
|
76 |
+
{"current_steps": 740, "total_steps": 918, "loss": 0.5467, "learning_rate": 5e-06, "epoch": 2.418300653594771, "percentage": 80.61, "elapsed_time": "1:17:25", "remaining_time": "0:18:37"}
|
77 |
+
{"current_steps": 750, "total_steps": 918, "loss": 0.551, "learning_rate": 5e-06, "epoch": 2.450980392156863, "percentage": 81.7, "elapsed_time": "1:18:24", "remaining_time": "0:17:33"}
|
78 |
+
{"current_steps": 760, "total_steps": 918, "loss": 0.5454, "learning_rate": 5e-06, "epoch": 2.4836601307189543, "percentage": 82.79, "elapsed_time": "1:19:24", "remaining_time": "0:16:30"}
|
79 |
+
{"current_steps": 770, "total_steps": 918, "loss": 0.546, "learning_rate": 5e-06, "epoch": 2.5163398692810457, "percentage": 83.88, "elapsed_time": "1:20:25", "remaining_time": "0:15:27"}
|
80 |
+
{"current_steps": 780, "total_steps": 918, "loss": 0.5434, "learning_rate": 5e-06, "epoch": 2.549019607843137, "percentage": 84.97, "elapsed_time": "1:21:25", "remaining_time": "0:14:24"}
|
81 |
+
{"current_steps": 790, "total_steps": 918, "loss": 0.5515, "learning_rate": 5e-06, "epoch": 2.581699346405229, "percentage": 86.06, "elapsed_time": "1:22:26", "remaining_time": "0:13:21"}
|
82 |
+
{"current_steps": 800, "total_steps": 918, "loss": 0.5513, "learning_rate": 5e-06, "epoch": 2.6143790849673203, "percentage": 87.15, "elapsed_time": "1:23:26", "remaining_time": "0:12:18"}
|
83 |
+
{"current_steps": 810, "total_steps": 918, "loss": 0.5472, "learning_rate": 5e-06, "epoch": 2.6470588235294117, "percentage": 88.24, "elapsed_time": "1:24:26", "remaining_time": "0:11:15"}
|
84 |
+
{"current_steps": 820, "total_steps": 918, "loss": 0.5496, "learning_rate": 5e-06, "epoch": 2.6797385620915035, "percentage": 89.32, "elapsed_time": "1:25:25", "remaining_time": "0:10:12"}
|
85 |
+
{"current_steps": 830, "total_steps": 918, "loss": 0.5444, "learning_rate": 5e-06, "epoch": 2.712418300653595, "percentage": 90.41, "elapsed_time": "1:26:26", "remaining_time": "0:09:09"}
|
86 |
+
{"current_steps": 840, "total_steps": 918, "loss": 0.5501, "learning_rate": 5e-06, "epoch": 2.7450980392156863, "percentage": 91.5, "elapsed_time": "1:27:27", "remaining_time": "0:08:07"}
|
87 |
+
{"current_steps": 850, "total_steps": 918, "loss": 0.5477, "learning_rate": 5e-06, "epoch": 2.7777777777777777, "percentage": 92.59, "elapsed_time": "1:28:26", "remaining_time": "0:07:04"}
|
88 |
+
{"current_steps": 860, "total_steps": 918, "loss": 0.5472, "learning_rate": 5e-06, "epoch": 2.810457516339869, "percentage": 93.68, "elapsed_time": "1:29:26", "remaining_time": "0:06:01"}
|
89 |
+
{"current_steps": 870, "total_steps": 918, "loss": 0.5512, "learning_rate": 5e-06, "epoch": 2.843137254901961, "percentage": 94.77, "elapsed_time": "1:30:26", "remaining_time": "0:04:59"}
|
90 |
+
{"current_steps": 880, "total_steps": 918, "loss": 0.5521, "learning_rate": 5e-06, "epoch": 2.8758169934640523, "percentage": 95.86, "elapsed_time": "1:31:26", "remaining_time": "0:03:56"}
|
91 |
+
{"current_steps": 890, "total_steps": 918, "loss": 0.5449, "learning_rate": 5e-06, "epoch": 2.9084967320261437, "percentage": 96.95, "elapsed_time": "1:32:26", "remaining_time": "0:02:54"}
|
92 |
+
{"current_steps": 900, "total_steps": 918, "loss": 0.5498, "learning_rate": 5e-06, "epoch": 2.9411764705882355, "percentage": 98.04, "elapsed_time": "1:33:26", "remaining_time": "0:01:52"}
|
93 |
+
{"current_steps": 910, "total_steps": 918, "loss": 0.5495, "learning_rate": 5e-06, "epoch": 2.973856209150327, "percentage": 99.13, "elapsed_time": "1:34:25", "remaining_time": "0:00:49"}
|
94 |
+
{"current_steps": 918, "total_steps": 918, "eval_loss": 0.628399670124054, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:36:59", "remaining_time": "0:00:00"}
|
95 |
+
{"current_steps": 918, "total_steps": 918, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:38:17", "remaining_time": "0:00:00"}
|