ncbateman commited on
Commit
3c1f335
·
verified ·
1 Parent(s): 039f165

Training in progress, step 1533, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f223caf7929ca318636f3ba59853e80da2c3442e58790b9aa9620469f077dcdd
3
  size 97307544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd4d1e46df8ec68b6c9e6ef9bc5ecf5f0ad16089ded3c1805891caf30fbe6f72
3
  size 97307544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:98b4fcee642581b59a7244a4e37836a0670b2039f4714e7c1ed25e132985dbe4
3
  size 49846644
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:893f018393ecbc033a95361d425c0b3602b2ffb2547981cb44eaeddaacbecdb4
3
  size 49846644
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:84b646cf536e8227b66dc69f9a778486c8a7ac0b176b0a4c53112763ef66fe62
3
  size 14960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:896ad7dae661b5fa712333e29820e33b88ac3783953f98a388981dde046510a4
3
  size 14960
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0b3cae7afbbeecf2d5eebabe029b4fc894e107994ebf862a1691926e2168a23e
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e62d7598f5c49e3b437a4b23d93990537e226573e28bd010a4ea6395b0e2122
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f6b60196473d01acca54f1bfaab7782b1e9e71ebfb49f472a000c757182eb4c1
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0de816f9b02b9ee5a2b349ad6f5a137bba325ea03a2d153fce825bff92786e7
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f306602a5392b7b4f66c9140309f102c7fa749834c21b02d757113b9665853a7
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88c46b6808dd9d7ce1226ecee5a6e06c39c94514246c005c8173fb95caf7000e
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9d7adbf4e044c8cb7edc3f270cc5c3a63ee883daa8cd11b2707b6bd0b9847b17
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c582b8eeaf5293cff12aebb879053ac0a11aad5efa379d7618133c7165704367
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.9975550122249389,
5
  "eval_steps": 767,
6
- "global_step": 1530,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -10733,6 +10733,27 @@
10733
  "learning_rate": 9.830211892492003e-10,
10734
  "loss": 1.1091,
10735
  "step": 1530
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
10736
  }
10737
  ],
10738
  "logging_steps": 1,
@@ -10747,12 +10768,12 @@
10747
  "should_evaluate": false,
10748
  "should_log": false,
10749
  "should_save": true,
10750
- "should_training_stop": false
10751
  },
10752
  "attributes": {}
10753
  }
10754
  },
10755
- "total_flos": 3.420887745382318e+18,
10756
  "train_batch_size": 2,
10757
  "trial_name": null,
10758
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.9995110024449878,
5
  "eval_steps": 767,
6
+ "global_step": 1533,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
10733
  "learning_rate": 9.830211892492003e-10,
10734
  "loss": 1.1091,
10735
  "step": 1530
10736
+ },
10737
+ {
10738
+ "epoch": 0.9982070089649552,
10739
+ "grad_norm": 0.3718799948692322,
10740
+ "learning_rate": 4.368991016689972e-10,
10741
+ "loss": 1.0742,
10742
+ "step": 1531
10743
+ },
10744
+ {
10745
+ "epoch": 0.9988590057049714,
10746
+ "grad_norm": 0.47078269720077515,
10747
+ "learning_rate": 1.0922489471765219e-10,
10748
+ "loss": 1.0806,
10749
+ "step": 1532
10750
+ },
10751
+ {
10752
+ "epoch": 0.9995110024449878,
10753
+ "grad_norm": 0.4701193571090698,
10754
+ "learning_rate": 0.0,
10755
+ "loss": 0.8084,
10756
+ "step": 1533
10757
  }
10758
  ],
10759
  "logging_steps": 1,
 
10768
  "should_evaluate": false,
10769
  "should_log": false,
10770
  "should_save": true,
10771
+ "should_training_stop": true
10772
  },
10773
  "attributes": {}
10774
  }
10775
  },
10776
+ "total_flos": 3.4275953684124795e+18,
10777
  "train_batch_size": 2,
10778
  "trial_name": null,
10779
  "trial_params": null