Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:130847ad394e11751930b2386f550e7d17dd502aa7454f1a07b1ca1f284f4c01
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9c25bd1e5e4cc0fd1f90dfbd404ea2a6fcf90f9d74d8ef9a373720bea0c4d92
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3bc6f8ee075e5c8b6f690be633949b85e54640df9ee0c8f95a131d856b5c0f6b
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f8e2a37bfa82e64d9ed6e1d6ec287b0c2dd0340bad0698e1ed849e20bfc011f
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -12,3 +12,11 @@
|
|
12 |
{"current_steps": 12, "total_steps": 24, "loss": 0.7131, "lr": 6.112604669781572e-06, "epoch": 1.4230769230769231, "percentage": 50.0, "elapsed_time": "0:05:06", "remaining_time": "0:05:06"}
|
13 |
{"current_steps": 13, "total_steps": 24, "loss": 0.6444, "lr": 5.373650467932122e-06, "epoch": 1.5384615384615383, "percentage": 54.17, "elapsed_time": "0:05:24", "remaining_time": "0:04:34"}
|
14 |
{"current_steps": 14, "total_steps": 24, "loss": 0.7125, "lr": 4.626349532067879e-06, "epoch": 1.6538461538461537, "percentage": 58.33, "elapsed_time": "0:05:42", "remaining_time": "0:04:04"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
12 |
{"current_steps": 12, "total_steps": 24, "loss": 0.7131, "lr": 6.112604669781572e-06, "epoch": 1.4230769230769231, "percentage": 50.0, "elapsed_time": "0:05:06", "remaining_time": "0:05:06"}
|
13 |
{"current_steps": 13, "total_steps": 24, "loss": 0.6444, "lr": 5.373650467932122e-06, "epoch": 1.5384615384615383, "percentage": 54.17, "elapsed_time": "0:05:24", "remaining_time": "0:04:34"}
|
14 |
{"current_steps": 14, "total_steps": 24, "loss": 0.7125, "lr": 4.626349532067879e-06, "epoch": 1.6538461538461537, "percentage": 58.33, "elapsed_time": "0:05:42", "remaining_time": "0:04:04"}
|
15 |
+
{"current_steps": 15, "total_steps": 24, "loss": 0.6467, "lr": 3.887395330218429e-06, "epoch": 1.7692307692307692, "percentage": 62.5, "elapsed_time": "0:06:03", "remaining_time": "0:03:38"}
|
16 |
+
{"current_steps": 16, "total_steps": 24, "loss": 0.6705, "lr": 3.173294878168025e-06, "epoch": 1.8846153846153846, "percentage": 66.67, "elapsed_time": "0:06:24", "remaining_time": "0:03:12"}
|
17 |
+
{"current_steps": 17, "total_steps": 24, "loss": 1.0619, "lr": 2.5000000000000015e-06, "epoch": 2.0384615384615383, "percentage": 70.83, "elapsed_time": "0:07:35", "remaining_time": "0:03:07"}
|
18 |
+
{"current_steps": 18, "total_steps": 24, "loss": 0.6591, "lr": 1.8825509907063328e-06, "epoch": 2.1538461538461537, "percentage": 75.0, "elapsed_time": "0:07:57", "remaining_time": "0:02:39"}
|
19 |
+
{"current_steps": 19, "total_steps": 24, "loss": 0.5755, "lr": 1.3347406408508695e-06, "epoch": 2.269230769230769, "percentage": 79.17, "elapsed_time": "0:08:18", "remaining_time": "0:02:11"}
|
20 |
+
{"current_steps": 20, "total_steps": 24, "loss": 0.6509, "lr": 8.688061284200266e-07, "epoch": 2.3846153846153846, "percentage": 83.33, "elapsed_time": "0:08:35", "remaining_time": "0:01:43"}
|
21 |
+
{"current_steps": 21, "total_steps": 24, "loss": 0.6663, "lr": 4.951556604879049e-07, "epoch": 2.5, "percentage": 87.5, "elapsed_time": "0:08:58", "remaining_time": "0:01:16"}
|
22 |
+
{"current_steps": 22, "total_steps": 24, "loss": 0.6374, "lr": 2.2213597106929608e-07, "epoch": 2.6153846153846154, "percentage": 91.67, "elapsed_time": "0:09:18", "remaining_time": "0:00:50"}
|