Training in progress, step 38600, checkpoint

Browse files

Files changed (7) hide show

last-checkpoint/adapter_config.json +4 -4
last-checkpoint/adapter_model.safetensors +1 -1
last-checkpoint/optimizer.pt +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +73 -3
last-checkpoint/training_args.bin +1 -1

last-checkpoint/adapter_config.json CHANGED Viewed

@@ -21,12 +21,12 @@
   "revision": null,
   "target_modules": [
     "o_proj",
-    "gate_proj",
-    "v_proj",
-    "down_proj",
     "up_proj",
     "q_proj",
-    "k_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

   "revision": null,
   "target_modules": [
     "o_proj",
     "up_proj",
+    "v_proj",
+    "gate_proj",
     "q_proj",
+    "k_proj",
+    "down_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3a9c4e19223b95fb5758c3ee2527d0abc53c761261cd302c9e6121979523da93
 size 778096664

 version https://git-lfs.github.com/spec/v1
+oid sha256:be0e066e83eb70c8a860b58a923a975fe6a2d64aee934a2b357e59d232707fa1
 size 778096664

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9dc6513a85bf522d3571cc919b7acbd2c16e6d887df27f7af012d7ddd099d4c3
 size 396581506

 version https://git-lfs.github.com/spec/v1
+oid sha256:a106a17c115a2e9fff16d6446794d7d6fbe741348c1aa6c74b42543757baaa4a
 size 396581506

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:adde30e974d4a4ac089075ed12c4f52f5d65760a545bb6c18cbe5820c191fefe
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:8afd281dafdd97beb15aaaf8b2ec92cb9800a347ae9bb7063ac2a5052be62319
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9c088826c17789740316b8318f190a406722ca97fa4cf22bb36e1b18efcb243c
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:599df61887dcd53cea391cff665b823e3f91f12b6512b5072d914d3c9170f985
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.052300236742029084,
   "eval_steps": 500,
-  "global_step": 37600,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -2639,6 +2639,76 @@
       "learning_rate": 1.9865354891677735e-05,
       "loss": 1.8286,
       "step": 37600
     }
   ],
   "logging_steps": 100,
@@ -2658,7 +2728,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 2.5848762127644672e+17,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.05369120048516816,
   "eval_steps": 500,
+  "global_step": 38600,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.9865354891677735e-05,
       "loss": 1.8286,
       "step": 37600
+    },
+    {
+      "epoch": 0.05243933311634299,
+      "grad_norm": 1.9087238311767578,
+      "learning_rate": 1.98646392688979e-05,
+      "loss": 1.8904,
+      "step": 37700
+    },
+    {
+      "epoch": 0.0525784294906569,
+      "grad_norm": 2.815120220184326,
+      "learning_rate": 1.9863921762388266e-05,
+      "loss": 1.9064,
+      "step": 37800
+    },
+    {
+      "epoch": 0.052717525864970805,
+      "grad_norm": 2.9733479022979736,
+      "learning_rate": 1.986320237228585e-05,
+      "loss": 1.9261,
+      "step": 37900
+    },
+    {
+      "epoch": 0.05285662223928471,
+      "grad_norm": 2.9672937393188477,
+      "learning_rate": 1.9862481098728022e-05,
+      "loss": 1.8735,
+      "step": 38000
+    },
+    {
+      "epoch": 0.05299571861359862,
+      "grad_norm": 2.93483567237854,
+      "learning_rate": 1.9861757941852518e-05,
+      "loss": 1.8418,
+      "step": 38100
+    },
+    {
+      "epoch": 0.053134814987912525,
+      "grad_norm": 4.23644495010376,
+      "learning_rate": 1.9861032901797425e-05,
+      "loss": 1.8763,
+      "step": 38200
+    },
+    {
+      "epoch": 0.05327391136222643,
+      "grad_norm": 3.7690341472625732,
+      "learning_rate": 1.98603059787012e-05,
+      "loss": 1.9315,
+      "step": 38300
+    },
+    {
+      "epoch": 0.05341300773654034,
+      "grad_norm": 2.4336416721343994,
+      "learning_rate": 1.9859577172702658e-05,
+      "loss": 1.9413,
+      "step": 38400
+    },
+    {
+      "epoch": 0.053552104110854246,
+      "grad_norm": 3.6931252479553223,
+      "learning_rate": 1.9858846483940964e-05,
+      "loss": 1.8801,
+      "step": 38500
+    },
+    {
+      "epoch": 0.05369120048516816,
+      "grad_norm": 3.142920970916748,
+      "learning_rate": 1.9858113912555646e-05,
+      "loss": 1.8627,
+      "step": 38600
     }
   ],
   "logging_steps": 100,
       "attributes": {}
     }
   },
+  "total_flos": 2.7191656821399552e+17,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9a8a868f3f2f56114ee6bc2428526d9923f9b81003f8674ec8d9fc77334d371a
 size 5688

 version https://git-lfs.github.com/spec/v1
+oid sha256:b747b6f384138ada304508b811385d92b8a2e349ed40953edea15e5db18a6e2b
 size 5688