TracyTank commited on
Commit
367f3f7
·
verified ·
1 Parent(s): 1dcc12a

Training in progress, step 63, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0ba64bad8552e0c9fa8e5c0cba4dfd84da312a799b94eaa654a185791a7c2c91
3
  size 83115256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72c4365c90e4673e37a4a2c158f4b3127797f0351d6eea9b8490f9b553c5b266
3
  size 83115256
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:48dac4f7c5175a62c2d1a3914987c0bea4dd1bd3b234a472f2e9b22aa244d978
3
  size 42608388
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:290fb60611823f559a1778dd2e7fd99444caee266092dc9891526caca2f08df6
3
  size 42608388
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d06609511f040c8c42a7e00cea1ec053a60567af34ba4410b1ad054b2eb6247
3
  size 14960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42dd685047e6d843f81d8c7a97b9fe8e3a8a836d0baa0ca1458618da98aab18c
3
  size 14960
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c980deaa36d5045c0af89e3e197d07224f4a228b702151413212eb3c9e980524
3
  size 14960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c303d82f711309bdf0967f8f4652d2e044e68225e894969369a6e258f673387
3
  size 14960
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4cb270cabc01be9731b23f750c54fb072017bd017706d55fcca97da50f8b0ff8
3
  size 14960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb886efaa016e515326abe05c4e04003a68e6a0c5f0758d9cac3926ffc093da1
3
  size 14960
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a686836c4cfc5a5fdcd6156f1963e12b5f5985ce7c1ab1c8500c5b965b0e85c0
3
  size 14960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89bbd9e9f39698108fc006d2cafcf2df8819db67c29ee6862b47f75b545174af
3
  size 14960
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2011b1e019073e4bafc29de9703ff0a6e7c1252c3a53d804807bd1c99d390d1c
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e53b95eff99f2334cbf7ed4c962db83cb42e931305982518e928382563b5670d
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.3456,
5
  "eval_steps": 9,
6
- "global_step": 54,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -189,6 +189,35 @@
189
  "eval_samples_per_second": 228.948,
190
  "eval_steps_per_second": 7.182,
191
  "step": 54
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
192
  }
193
  ],
194
  "logging_steps": 3,
@@ -208,7 +237,7 @@
208
  "attributes": {}
209
  }
210
  },
211
- "total_flos": 8.70588303236137e+16,
212
  "train_batch_size": 8,
213
  "trial_name": null,
214
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.4032,
5
  "eval_steps": 9,
6
+ "global_step": 63,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
189
  "eval_samples_per_second": 228.948,
190
  "eval_steps_per_second": 7.182,
191
  "step": 54
192
+ },
193
+ {
194
+ "epoch": 0.3648,
195
+ "grad_norm": 0.898175060749054,
196
+ "learning_rate": 4.6512176312793736e-05,
197
+ "loss": 2.0437,
198
+ "step": 57
199
+ },
200
+ {
201
+ "epoch": 0.384,
202
+ "grad_norm": 0.8860452175140381,
203
+ "learning_rate": 4.131759111665349e-05,
204
+ "loss": 2.0314,
205
+ "step": 60
206
+ },
207
+ {
208
+ "epoch": 0.4032,
209
+ "grad_norm": 0.7955260872840881,
210
+ "learning_rate": 3.6218132209150045e-05,
211
+ "loss": 2.0663,
212
+ "step": 63
213
+ },
214
+ {
215
+ "epoch": 0.4032,
216
+ "eval_loss": 2.0011115074157715,
217
+ "eval_runtime": 4.6261,
218
+ "eval_samples_per_second": 227.405,
219
+ "eval_steps_per_second": 7.133,
220
+ "step": 63
221
  }
222
  ],
223
  "logging_steps": 3,
 
237
  "attributes": {}
238
  }
239
  },
240
+ "total_flos": 1.0163565512097792e+17,
241
  "train_batch_size": 8,
242
  "trial_name": null,
243
  "trial_params": null