Training in progress, step 357, checkpoint

Files changed (4) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a375c24028700bd557f667d40973690c740ce729b6073aa79b5a7971a2f2cc78
 size 73911112

 version https://git-lfs.github.com/spec/v1
+oid sha256:cc2624a8ffcf1841a9421ca1f17277f4c8d9b072e238a8603e30cdfdae2cb8ca
 size 73911112

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:22f7b1a71febb4b763b6acf5823fda57ab9eca3184ec8cbb2a84cd959eb1b39b
 size 37431220

 version https://git-lfs.github.com/spec/v1
+oid sha256:210d9ceabe7e26d81c6de62edaa8bf5373afa8e36c75a23d9b951a596eda2c05
 size 37431220

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:77b94402f5dd54b877f7ef15b329b04f5ba33d08b944e588160c2e2559f18f1f
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:56085f5a51542351a94b27a3e2abb809af51b595632f72dc4fabbe92e8070a60
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.9711934156378601,
   "eval_steps": 500,
-  "global_step": 354,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -2485,6 +2485,27 @@
       "learning_rate": 7.5757575757575764e-06,
       "loss": 1.175,
       "step": 354
     }
   ],
   "logging_steps": 1,
@@ -2504,7 +2525,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 4.38308805541675e+17,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.9794238683127572,
   "eval_steps": 500,
+  "global_step": 357,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 7.5757575757575764e-06,
       "loss": 1.175,
       "step": 354
+    },
+    {
+      "epoch": 0.9739368998628258,
+      "grad_norm": 0.16342799365520477,
+      "learning_rate": 6.818181818181818e-06,
+      "loss": 1.2179,
+      "step": 355
+    },
+    {
+      "epoch": 0.9766803840877915,
+      "grad_norm": 0.1597851812839508,
+      "learning_rate": 6.060606060606061e-06,
+      "loss": 1.1208,
+      "step": 356
+    },
+    {
+      "epoch": 0.9794238683127572,
+      "grad_norm": 0.16428720951080322,
+      "learning_rate": 5.303030303030304e-06,
+      "loss": 1.1197,
+      "step": 357
     }
   ],
   "logging_steps": 1,
       "attributes": {}
     }
   },
+  "total_flos": 4.4192512511902925e+17,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null