ncbateman commited on
Commit
a720948
·
verified ·
1 Parent(s): c566897

Training in progress, step 443, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae1251f05ef70724f2a5bd541621a60fbc4213fb961de0bb1cb6893899908ba9
3
  size 167832240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75170cfd79552ed415d553b0a5759b6cbddd9e4dfb48b029476ed1655814bafa
3
  size 167832240
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8802ed5407d8a8f2dac66a8b4608afa77de6a43e7ff92e2511b5faa6783d07c1
3
  size 85723732
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd60c066e2bc5df04a60721bdeaa422c17efd4ca67433fd36c89a9f75c911c26
3
  size 85723732
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2cca9f96c96b922acaa204e7459a265396d5e1c98f1f296f230d8e331885b8ac
3
  size 14960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b862da9e51cd65ba194067266b41a728636828ad2cd2b4cec3ac38adb1ae7d2
3
  size 14960
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:62fb05d1751019ac24743a26e17e60ff4857e4af1f72362a4b410a6c8410a65b
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0a6fa1f8ea24e79ddc54d54c9b1eebadb52949e41e7f120fa0737819f774d79
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:54547a23ea029fe03b5f58871d4527a748e7ac8f837926dd1a6e08b721fbdc33
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e724795976531e687125fbb945603a96f2112de8f393fc6fa4a9b74f9ac8e79e
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bef39a40db1a483262af7570836839950da73fbe882edbfe93922ade4768db34
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1edd3582e68db638a33154dba95f3473466b2e81ca61ce580cb51b83a6e90aee
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8323834fccc4192732a390e4554f47c9681faaee6040082de0c2920fe02fd450
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f430f59a9990175ce86df7bc8287717036151aba66a7f1f929e5118bcddc0e6
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.9937888198757764,
5
  "eval_steps": 222,
6
- "global_step": 440,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -3103,6 +3103,27 @@
3103
  "learning_rate": 1.3018570910466877e-08,
3104
  "loss": 1.1963,
3105
  "step": 440
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3106
  }
3107
  ],
3108
  "logging_steps": 1,
@@ -3117,12 +3138,12 @@
3117
  "should_evaluate": false,
3118
  "should_log": false,
3119
  "should_save": true,
3120
- "should_training_stop": false
3121
  },
3122
  "attributes": {}
3123
  }
3124
  },
3125
- "total_flos": 2.6129270118945915e+18,
3126
  "train_batch_size": 2,
3127
  "trial_name": null,
3128
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.0005646527385659,
5
  "eval_steps": 222,
6
+ "global_step": 443,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
3103
  "learning_rate": 1.3018570910466877e-08,
3104
  "loss": 1.1963,
3105
  "step": 440
3106
+ },
3107
+ {
3108
+ "epoch": 0.9960474308300395,
3109
+ "grad_norm": 0.48917847871780396,
3110
+ "learning_rate": 5.786171016708419e-09,
3111
+ "loss": 1.5957,
3112
+ "step": 441
3113
+ },
3114
+ {
3115
+ "epoch": 0.9983060417843026,
3116
+ "grad_norm": 0.6857689023017883,
3117
+ "learning_rate": 1.446563679641244e-09,
3118
+ "loss": 1.4271,
3119
+ "step": 442
3120
+ },
3121
+ {
3122
+ "epoch": 1.0005646527385659,
3123
+ "grad_norm": 0.6406208872795105,
3124
+ "learning_rate": 0.0,
3125
+ "loss": 1.5675,
3126
+ "step": 443
3127
  }
3128
  ],
3129
  "logging_steps": 1,
 
3138
  "should_evaluate": false,
3139
  "should_log": false,
3140
  "should_save": true,
3141
+ "should_training_stop": true
3142
  },
3143
  "attributes": {}
3144
  }
3145
  },
3146
+ "total_flos": 2.630732306700042e+18,
3147
  "train_batch_size": 2,
3148
  "trial_name": null,
3149
  "trial_params": null