Commit
·
d03fe13
1
Parent(s):
a5f3b3b
Training in progress, step 3406
Browse files- adapter_model.bin +1 -1
- last-checkpoint/adapter_model.bin +1 -1
- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/rng_state.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +15 -3
- runs/Jul30_21-59-54_04d48b04b124/events.out.tfevents.1690754399.04d48b04b124.17705.0 +2 -2
adapter_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3163457
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc71cd7108d9ba72e4b1bbcd605200598e28504fe244d83b8a107877ce1e0a08
|
3 |
size 3163457
|
last-checkpoint/adapter_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3163457
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc71cd7108d9ba72e4b1bbcd605200598e28504fe244d83b8a107877ce1e0a08
|
3 |
size 3163457
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6319689
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e460fb4f88d3862e29c85824beb220c3a440e38e495d2d21bb431256d976f53
|
3 |
size 6319689
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14639
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:81334a5dfd85c0801a30a1eea8b9cd541f8e62f06aaad2e0abae818e3755642d
|
3 |
size 14639
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:314792ac9e515ae832ad8130bd6e039000a1e8e45a9c056a7c485a1d5b51a39f
|
3 |
size 627
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 0.
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -156,11 +156,23 @@
|
|
156 |
"learning_rate": 1.2730849340430457e-05,
|
157 |
"loss": 2.3715,
|
158 |
"step": 3144
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
159 |
}
|
160 |
],
|
161 |
"max_steps": 8642,
|
162 |
"num_train_epochs": 1,
|
163 |
-
"total_flos":
|
164 |
"trial_name": null,
|
165 |
"trial_params": null
|
166 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 0.39412173108076837,
|
5 |
+
"global_step": 3406,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
156 |
"learning_rate": 1.2730849340430457e-05,
|
157 |
"loss": 2.3715,
|
158 |
"step": 3144
|
159 |
+
},
|
160 |
+
{
|
161 |
+
"epoch": 0.38,
|
162 |
+
"learning_rate": 1.2429993057162695e-05,
|
163 |
+
"loss": 2.3903,
|
164 |
+
"step": 3275
|
165 |
+
},
|
166 |
+
{
|
167 |
+
"epoch": 0.39,
|
168 |
+
"learning_rate": 1.2126822494792874e-05,
|
169 |
+
"loss": 2.3352,
|
170 |
+
"step": 3406
|
171 |
}
|
172 |
],
|
173 |
"max_steps": 8642,
|
174 |
"num_train_epochs": 1,
|
175 |
+
"total_flos": 6342809229459456.0,
|
176 |
"trial_name": null,
|
177 |
"trial_params": null
|
178 |
}
|
runs/Jul30_21-59-54_04d48b04b124/events.out.tfevents.1690754399.04d48b04b124.17705.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:679137deebfe550bc6154188469577d30001363465caa1e926dc5cffb384d93d
|
3 |
+
size 8440
|