Training in progress, step 15, checkpoint
Browse files- last-checkpoint/adapter_model.safetensors +1 -1
- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +11 -4
last-checkpoint/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 83115256
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a715b0ec25dead1ad4763fe70873842017cbbe11a65d5528aee0bf11ef6355eb
|
3 |
size 83115256
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 42608388
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2fc4a7085cba1d75eed52201ca0a67243fd78485fd83d5a7c543c3346a9a3242
|
3 |
size 42608388
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a83ecd52c7dc407f6f72e509d7f4de78b565f9b992b7b9c3481784fbf20b246f
|
3 |
size 15024
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:919f21951de9fd197bb9e559b3421a6af8da448a30b0c5b1a2b6c9a110007bbc
|
3 |
size 15024
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e4ae6bbde22084d121c985af2d0bf879a744e6e7966c28357e4469e532205868
|
3 |
size 15024
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:877bc2813569967981b03024ab5a1ebc2127ea6afc46bb56f38cd06cf5722b8e
|
3 |
size 15024
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:008d83c4f5ee0c3b0aa2ca88e92cb7f21d43acfd48a8bc37442b67fb3134fa7c
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 3.
|
5 |
"eval_steps": 2,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -99,6 +99,13 @@
|
|
99 |
"eval_samples_per_second": 221.351,
|
100 |
"eval_steps_per_second": 6.917,
|
101 |
"step": 14
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
102 |
}
|
103 |
],
|
104 |
"logging_steps": 3,
|
@@ -113,12 +120,12 @@
|
|
113 |
"should_evaluate": false,
|
114 |
"should_log": false,
|
115 |
"should_save": true,
|
116 |
-
"should_training_stop":
|
117 |
},
|
118 |
"attributes": {}
|
119 |
}
|
120 |
},
|
121 |
-
"total_flos": 2.
|
122 |
"train_batch_size": 8,
|
123 |
"trial_name": null,
|
124 |
"trial_params": null
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 3.3157894736842106,
|
5 |
"eval_steps": 2,
|
6 |
+
"global_step": 15,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
99 |
"eval_samples_per_second": 221.351,
|
100 |
"eval_steps_per_second": 6.917,
|
101 |
"step": 14
|
102 |
+
},
|
103 |
+
{
|
104 |
+
"epoch": 3.3157894736842106,
|
105 |
+
"grad_norm": 1.4032217264175415,
|
106 |
+
"learning_rate": 0.0,
|
107 |
+
"loss": 1.4173,
|
108 |
+
"step": 15
|
109 |
}
|
110 |
],
|
111 |
"logging_steps": 3,
|
|
|
120 |
"should_evaluate": false,
|
121 |
"should_log": false,
|
122 |
"should_save": true,
|
123 |
+
"should_training_stop": true
|
124 |
},
|
125 |
"attributes": {}
|
126 |
}
|
127 |
},
|
128 |
+
"total_flos": 2.41271599792128e+16,
|
129 |
"train_batch_size": 8,
|
130 |
"trial_name": null,
|
131 |
"trial_params": null
|