brixeus committed on
Commit
dfb1f24
·
verified ·
1 Parent(s): 140cea1

Training in progress, step 32, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:83dac7f2ae5c4e98c98e1d48d308347bb0ab2e862904b6eb87abeffc410f10d1
3
  size 78480072
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8eebf8a72782d8a6d10ac9868dd817b1f02574eca60388a6aa12c3df0b64bf29
3
  size 78480072
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:018d9f9cfe3499003a0f3ba3a53b396ea2aff34ccbb3d694cd4004c7cd1a9bb1
3
  size 40131268
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b993b463cbd60d0a0d34713757e389882b393a688c8872ad39ca58ad24ed942b
3
  size 40131268
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cf011371356bc8a3dc38bd5025d4f28c386b7543e52e6476f1c1e80305359c88
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6aef71fd23d8a2bd13f4b2bd6e1a29fa4b8c3c44066fb0395694fc49aaa81d21
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ffdfbb96ef899b42f33247163db9f040cf148861f99ef1ab5ca02e35847effc0
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a387b210316633d05904a757c86d6d5b1f723a9084c82125f530fbd1f5f4ae32
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.9047619047619047,
5
  "eval_steps": 3,
6
- "global_step": 30,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -179,12 +179,12 @@
179
  "should_evaluate": false,
180
  "should_log": false,
181
  "should_save": true,
182
- "should_training_stop": false
183
  },
184
  "attributes": {}
185
  }
186
  },
187
- "total_flos": 1.180530414452736e+16,
188
  "train_batch_size": 8,
189
  "trial_name": null,
190
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 3.119047619047619,
5
  "eval_steps": 3,
6
+ "global_step": 32,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
179
  "should_evaluate": false,
180
  "should_log": false,
181
  "should_save": true,
182
+ "should_training_stop": true
183
  },
184
  "attributes": {}
185
  }
186
  },
187
+ "total_flos": 1.2592324420829184e+16,
188
  "train_batch_size": 8,
189
  "trial_name": null,
190
  "trial_params": null