jssky committed on
Commit
3acae49
·
verified ·
1 Parent(s): a2669f9

Training in progress, step 10, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ff1f1c7995d36156a8be4e4e3781a3de815fedc7dbabc2f3f2000eb44db968ea
3
  size 63592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5b4036814ea6ebc519e179ce115e74545f14dea03bf107a6ea7783ed3c38d73
3
  size 63592
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:628e9f3b165ddd57f211900f0fad27047990e84538320468266f0237d48e8ad7
3
  size 132798
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30bc2356e85a31be8d163215c0a521c22e99f537fb18024404488d9941a7f960
3
  size 132798
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:130a4817f279520af77199dd42cfe37117aa5a80f4f47a83e4ce4ffd703225e8
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:086575062c0bed8e9eadc952915db35487fe304153021669369e21328c5f92ff
3
  size 15984
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5ce832b0bc79ceb292a621d3a04b07c47bedaaa273036406343d169de473543a
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b78cfce40ca3f29bad0b5f3ea86fb09ea2acbbacad6432113460ae3f9ae3ee4c
3
  size 15984
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7eb4792b082408543f1f81b7312692c86c5c6fa9529cb1cb2974620aef9db475
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7acd2fd374e01ab4207567e1742a9577201a18b80961feee02a234d73c070f6
3
  size 15984
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:081b82e0dcfc94fe383b962c8243795f817dd269c3e9a8642c2270f1b678e5d3
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3a1e5312e9969bc361d61d2254ce7b23bc52ac85d7f4c03475138be7f4a99d5
3
  size 15984
last-checkpoint/rng_state_4.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e6fceeedbf4260961cb70678e67afb103efe4228c70593decfaea3fc69afbdcb
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf2402608d6a6916eda64fd344e8fdea20eb6ecaae8fa4ff30e83f7f0a795bef
3
  size 15984
last-checkpoint/rng_state_5.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:806fdff23908b2cb3eaf085ea29ccebb1c2764e61ea98e5f46b30864a683a45c
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60527139a25b2f34c4c6d3c321ed6aae5cab4244ded979b1f8c95209ab1db36c
3
  size 15984
last-checkpoint/rng_state_6.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2eb4ac8e97914a207a71ff5f3ba208f868ef5f748830c0fc4f7cfca000796510
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ed50c5751ef23cb4304daf8ac04bfdf1a8e75bd5e154825461adb8aa7afb20f
3
  size 15984
last-checkpoint/rng_state_7.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7710803b72c4a46e34d6599dca7b70dd6d7b92a90af6e926e9a1a9da54b9ece3
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:428a610145c46220e34b200ee2b80ccaa5f3f6e3dd392be99a81a4397861a0e2
3
  size 15984
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0099cb7287625b29b67c4fcf42ff20fae623b429bfb10f5ac695bc54f2be54fd
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bdda546a1390be3b85a90dd4ef31050dfb7b691765ffc12ed691b6786ed6e3d
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.004424778761061947,
5
  "eval_steps": 3,
6
- "global_step": 9,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -102,6 +102,13 @@
102
  "eval_samples_per_second": 683.801,
103
  "eval_steps_per_second": 85.625,
104
  "step": 9
 
 
 
 
 
 
 
105
  }
106
  ],
107
  "logging_steps": 1,
@@ -116,12 +123,12 @@
116
  "should_evaluate": false,
117
  "should_log": false,
118
  "should_save": true,
119
- "should_training_stop": false
120
  },
121
  "attributes": {}
122
  }
123
  },
124
- "total_flos": 269525975040.0,
125
  "train_batch_size": 1,
126
  "trial_name": null,
127
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.004916420845624385,
5
  "eval_steps": 3,
6
+ "global_step": 10,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
102
  "eval_samples_per_second": 683.801,
103
  "eval_steps_per_second": 85.625,
104
  "step": 9
105
+ },
106
+ {
107
+ "epoch": 0.004916420845624385,
108
+ "grad_norm": 10.2720947265625,
109
+ "learning_rate": 0.00014,
110
+ "loss": 44.2197,
111
+ "step": 10
112
  }
113
  ],
114
  "logging_steps": 1,
 
123
  "should_evaluate": false,
124
  "should_log": false,
125
  "should_save": true,
126
+ "should_training_stop": true
127
  },
128
  "attributes": {}
129
  }
130
  },
131
+ "total_flos": 299473305600.0,
132
  "train_batch_size": 1,
133
  "trial_name": null,
134
  "trial_params": null