Training in progress, step 115, checkpoint

Files changed (4) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c529a85454a3d96a5940fa5d781d9577b35d06f3dc016844d7b8b300f297013a
 size 73911112

 version https://git-lfs.github.com/spec/v1
+oid sha256:7bdbb740496dc2a7f3c0f6f02d269d15e42820dee4870aed7c52aa1bfd807fd2
 size 73911112

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ebe248069e09f4931f12d918e0d5b47cbf7e6f6c3a440eed76b31cd6eacbb695
 size 37430836

 version https://git-lfs.github.com/spec/v1
+oid sha256:19aea021c17d22587f9f50dc0bd30b3284a28d1ab85db70a8c705c5ef04b8d19
 size 37430836

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:74a8f3454c415665d0358e152faea0ef684bc7b623fa35ef64763c0af976fed2
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:f9741594e204ffb908586b8ab5263be1fd7e41110b9026fc1281a70d1b1b6557
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.3100137174211248,
   "eval_steps": 500,
-  "global_step": 113,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -798,6 +798,20 @@
       "learning_rate": 0.00019015151515151517,
       "loss": 1.2836,
       "step": 113
     }
   ],
   "logging_steps": 1,
@@ -817,7 +831,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 1.4010395508772454e+17,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.31550068587105623,
   "eval_steps": 500,
+  "global_step": 115,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 0.00019015151515151517,
       "loss": 1.2836,
       "step": 113
+    },
+    {
+      "epoch": 0.31275720164609055,
+      "grad_norm": 0.1297687143087387,
+      "learning_rate": 0.00018939393939393942,
+      "loss": 1.2813,
+      "step": 114
+    },
+    {
+      "epoch": 0.31550068587105623,
+      "grad_norm": 0.13718412816524506,
+      "learning_rate": 0.00018863636363636364,
+      "loss": 1.3138,
+      "step": 115
     }
   ],
   "logging_steps": 1,
       "attributes": {}
     }
   },
+  "total_flos": 1.4257615970761114e+17,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null