Training in progress, step 10, checkpoint

Files changed (12) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ff1f1c7995d36156a8be4e4e3781a3de815fedc7dbabc2f3f2000eb44db968ea
 size 63592

 version https://git-lfs.github.com/spec/v1
+oid sha256:a5b4036814ea6ebc519e179ce115e74545f14dea03bf107a6ea7783ed3c38d73
 size 63592

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:628e9f3b165ddd57f211900f0fad27047990e84538320468266f0237d48e8ad7
 size 132798

 version https://git-lfs.github.com/spec/v1
+oid sha256:30bc2356e85a31be8d163215c0a521c22e99f537fb18024404488d9941a7f960
 size 132798

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:130a4817f279520af77199dd42cfe37117aa5a80f4f47a83e4ce4ffd703225e8
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:086575062c0bed8e9eadc952915db35487fe304153021669369e21328c5f92ff
 size 15984

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5ce832b0bc79ceb292a621d3a04b07c47bedaaa273036406343d169de473543a
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:b78cfce40ca3f29bad0b5f3ea86fb09ea2acbbacad6432113460ae3f9ae3ee4c
 size 15984

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7eb4792b082408543f1f81b7312692c86c5c6fa9529cb1cb2974620aef9db475
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:d7acd2fd374e01ab4207567e1742a9577201a18b80961feee02a234d73c070f6
 size 15984

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:081b82e0dcfc94fe383b962c8243795f817dd269c3e9a8642c2270f1b678e5d3
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:e3a1e5312e9969bc361d61d2254ce7b23bc52ac85d7f4c03475138be7f4a99d5
 size 15984

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e6fceeedbf4260961cb70678e67afb103efe4228c70593decfaea3fc69afbdcb
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:bf2402608d6a6916eda64fd344e8fdea20eb6ecaae8fa4ff30e83f7f0a795bef
 size 15984

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:806fdff23908b2cb3eaf085ea29ccebb1c2764e61ea98e5f46b30864a683a45c
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:60527139a25b2f34c4c6d3c321ed6aae5cab4244ded979b1f8c95209ab1db36c
 size 15984

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2eb4ac8e97914a207a71ff5f3ba208f868ef5f748830c0fc4f7cfca000796510
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:9ed50c5751ef23cb4304daf8ac04bfdf1a8e75bd5e154825461adb8aa7afb20f
 size 15984

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7710803b72c4a46e34d6599dca7b70dd6d7b92a90af6e926e9a1a9da54b9ece3
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:428a610145c46220e34b200ee2b80ccaa5f3f6e3dd392be99a81a4397861a0e2
 size 15984

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0099cb7287625b29b67c4fcf42ff20fae623b429bfb10f5ac695bc54f2be54fd
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:8bdda546a1390be3b85a90dd4ef31050dfb7b691765ffc12ed691b6786ed6e3d
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.004424778761061947,
   "eval_steps": 3,
-  "global_step": 9,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -102,6 +102,13 @@
       "eval_samples_per_second": 683.801,
       "eval_steps_per_second": 85.625,
       "step": 9
     }
   ],
   "logging_steps": 1,
@@ -116,12 +123,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 269525975040.0,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.004916420845624385,
   "eval_steps": 3,
+  "global_step": 10,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 683.801,
       "eval_steps_per_second": 85.625,
       "step": 9
+    },
+    {
+      "epoch": 0.004916420845624385,
+      "grad_norm": 10.2720947265625,
+      "learning_rate": 0.00014,
+      "loss": 44.2197,
+      "step": 10
     }
   ],
   "logging_steps": 1,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 299473305600.0,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null