Training in progress, epoch 1

Files changed (8) hide show

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b5b3ada415323df4681659f8a3c19121e9379a2b0c7922cade957c3cc9526017
 size 409103316

 version https://git-lfs.github.com/spec/v1
+oid sha256:01943b36fe2d099072ef77b2811221d172183457a8423ec8462545bbe2d496e3
 size 409103316

run-3/checkpoint-267/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:135197ad3195b359042613773b71696c5cf012cf3d066a9a2511d3838c3c35a9
 size 409103316

 version https://git-lfs.github.com/spec/v1
+oid sha256:01943b36fe2d099072ef77b2811221d172183457a8423ec8462545bbe2d496e3
 size 409103316

run-3/checkpoint-267/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:255a584a26fcc2be699bafc46e1aae1a8b151ee8fc9ea40b342553f5d2d467f7
 size 818327802

 version https://git-lfs.github.com/spec/v1
+oid sha256:65e47361cac1e35bd4bb3eca381d3691bf21be971b356c5736ccb58b481861fe
 size 818327802

run-3/checkpoint-267/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e8ff2c2e29acd16c1aadf33df0772847990f6dfc28d9f7049fdc9ef8259a339b
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:ef3be8be9037b2d6a9348611f95c19fb1d17ca7cb1da92486df22b7e0a3c655a
 size 1064

run-3/checkpoint-267/trainer_state.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "best_metric": 0.603171169757843,
   "best_model_checkpoint": "BERT-WMM/run-3/checkpoint-267",
   "epoch": 1.0,
   "eval_steps": 500,
@@ -10,23 +10,23 @@
   "log_history": [
     {
       "epoch": 1.0,
-      "eval_accuracy": 0.7549295774647887,
-      "eval_loss": 0.603171169757843,
-      "eval_runtime": 2.3997,
-      "eval_samples_per_second": 887.602,
-      "eval_steps_per_second": 55.84,
       "step": 267
     }
   ],
   "logging_steps": 500,
-  "max_steps": 1068,
   "num_input_tokens_seen": 0,
-  "num_train_epochs": 4,
   "save_steps": 500,
   "total_flos": 0,
   "train_batch_size": 32,
   "trial_name": null,
   "trial_params": {
-    "num_train_epochs": 4
   }
 }

 {
+  "best_metric": 0.6065873503684998,
   "best_model_checkpoint": "BERT-WMM/run-3/checkpoint-267",
   "epoch": 1.0,
   "eval_steps": 500,
   "log_history": [
     {
       "epoch": 1.0,
+      "eval_accuracy": 0.7530516431924883,
+      "eval_loss": 0.6065873503684998,
+      "eval_runtime": 2.5921,
+      "eval_samples_per_second": 821.724,
+      "eval_steps_per_second": 51.695,
       "step": 267
     }
   ],
   "logging_steps": 500,
+  "max_steps": 534,
   "num_input_tokens_seen": 0,
+  "num_train_epochs": 2,
   "save_steps": 500,
   "total_flos": 0,
   "train_batch_size": 32,
   "trial_name": null,
   "trial_params": {
+    "weight_decay": 0.021167311357718124
   }
 }

run-3/checkpoint-267/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a8c637656beacaec83a46c1d786535828a5c615851f4d21b0069fcadd723fa83
 size 4856

 version https://git-lfs.github.com/spec/v1
+oid sha256:1238f3e9130ff13042dcb9e0ded88b87b25d59c0eb7bc889417ea846582c3c9b
 size 4856

runs/Apr19_10-19-01_dcdaa3e6ec43/events.out.tfevents.1713522305.dcdaa3e6ec43.789.3 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:5908acf12b09c9364f37fdcc1828450a70123a37e71027bfb4acc38d127db0d0
+size 5233

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0110ce032162455ab9f249ecc09efcf6160c1647641e207a11aab2a661b9c4f1
 size 4856

 version https://git-lfs.github.com/spec/v1
+oid sha256:1238f3e9130ff13042dcb9e0ded88b87b25d59c0eb7bc889417ea846582c3c9b
 size 4856