Training in progress, step 245, checkpoint

Files changed (4) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2d7f289734593a3f7ee939562d24196078125028a858356847a6bb957f59a600
 size 73911112

 version https://git-lfs.github.com/spec/v1
+oid sha256:f46b71e95a580f108269251cfe3defd72132358de06c0d928b83f8aefd50304d
 size 73911112

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6942bdb9d086b28b0925199c7fe1fdaa7b25eebd757be776937103f7a5f230b8
 size 37430836

 version https://git-lfs.github.com/spec/v1
+oid sha256:99106769548268574aadd158585d14f464e53c8ad6243c5158dc3c182ccfe6a5
 size 37430836

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:db79331c8992e3a7af2306518ac9df31b4a39a542a11b37b6cba8afaa66b1eba
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:e1164145c3cb1723f88e8b2678949166f87c794da442d33d7cc2eddf22f1da61
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.663923182441701,
   "eval_steps": 500,
-  "global_step": 242,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -1701,6 +1701,27 @@
       "learning_rate": 9.242424242424242e-05,
       "loss": 1.2732,
       "step": 242
     }
   ],
   "logging_steps": 1,
@@ -1720,7 +1741,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 2.995266789026488e+17,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.6721536351165981,
   "eval_steps": 500,
+  "global_step": 245,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 9.242424242424242e-05,
       "loss": 1.2732,
       "step": 242
+    },
+    {
+      "epoch": 0.6666666666666666,
+      "grad_norm": 0.16092891991138458,
+      "learning_rate": 9.166666666666667e-05,
+      "loss": 1.1607,
+      "step": 243
+    },
+    {
+      "epoch": 0.6694101508916324,
+      "grad_norm": 0.1687157154083252,
+      "learning_rate": 9.090909090909092e-05,
+      "loss": 1.1149,
+      "step": 244
+    },
+    {
+      "epoch": 0.6721536351165981,
+      "grad_norm": 0.18511663377285004,
+      "learning_rate": 9.015151515151515e-05,
+      "loss": 1.1934,
+      "step": 245
     }
   ],
   "logging_steps": 1,
       "attributes": {}
     }
   },
+  "total_flos": 3.031087305198797e+17,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null