lesso15 commited on
Commit
a50bf04
·
verified ·
1 Parent(s): c9ef032

Training in progress, step 150, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b87151ff71f3075240e1a34c1d0098091d99e65fb5ee1ad5622760cbbad1bf5
3
  size 161533192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7de312a8e99302e407350ebbec58756a087c45b23dc22ecd5cbaf2bf255638aa
3
  size 161533192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b6dcb58778735d168c93ef2df11cdd738a05ccdad1b675c9e835aa54a45d436
3
  size 82460660
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76c4e7dd175d1171233199ac5270115297bfa975d16ffbc4bbc1e069e1c71096
3
  size 82460660
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c118a7edf324ff6a1a38ff16f32a35eca90bf09908928dcd2cc8e742873a1ea2
3
  size 14308
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41665902630196f54d3bb1edfb2e49940aea6b83aae2e61e59c5648fef9e424c
3
  size 14308
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dcdcbf7cad190cbb1eebcf5d3a7c6ead1c2f7214ab2b43c16f7e1860aaee06af
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f2e88614aff46cd1ada70fbc3b2ec41b24cceb0ef1b4801de4a83c39b9b26bc
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 1.4174914360046387,
3
  "best_model_checkpoint": "miner_id_24/checkpoint-50",
4
- "epoch": 0.05762028233938346,
5
  "eval_steps": 50,
6
- "global_step": 100,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -101,6 +101,49 @@
101
  "eval_samples_per_second": 16.252,
102
  "eval_steps_per_second": 4.068,
103
  "step": 100
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
104
  }
105
  ],
106
  "logging_steps": 10,
@@ -115,7 +158,7 @@
115
  "early_stopping_threshold": 0.0
116
  },
117
  "attributes": {
118
- "early_stopping_patience_counter": 1
119
  }
120
  },
121
  "TrainerControl": {
@@ -129,7 +172,7 @@
129
  "attributes": {}
130
  }
131
  },
132
- "total_flos": 1.808762618983219e+16,
133
  "train_batch_size": 4,
134
  "trial_name": null,
135
  "trial_params": null
 
1
  {
2
  "best_metric": 1.4174914360046387,
3
  "best_model_checkpoint": "miner_id_24/checkpoint-50",
4
+ "epoch": 0.08643042350907519,
5
  "eval_steps": 50,
6
+ "global_step": 150,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
101
  "eval_samples_per_second": 16.252,
102
  "eval_steps_per_second": 4.068,
103
  "step": 100
104
+ },
105
+ {
106
+ "epoch": 0.0633823105733218,
107
+ "grad_norm": 0.610034704208374,
108
+ "learning_rate": 0.00020570613669657956,
109
+ "loss": 1.7989,
110
+ "step": 110
111
+ },
112
+ {
113
+ "epoch": 0.06914433880726016,
114
+ "grad_norm": 0.7986786365509033,
115
+ "learning_rate": 0.00020241686623233464,
116
+ "loss": 1.5293,
117
+ "step": 120
118
+ },
119
+ {
120
+ "epoch": 0.0749063670411985,
121
+ "grad_norm": 0.9212441444396973,
122
+ "learning_rate": 0.00019866517033681577,
123
+ "loss": 1.2778,
124
+ "step": 130
125
+ },
126
+ {
127
+ "epoch": 0.08066839527513685,
128
+ "grad_norm": 0.9731055498123169,
129
+ "learning_rate": 0.00019446932689530684,
130
+ "loss": 1.0822,
131
+ "step": 140
132
+ },
133
+ {
134
+ "epoch": 0.08643042350907519,
135
+ "grad_norm": 1.488525390625,
136
+ "learning_rate": 0.0001898497776352901,
137
+ "loss": 0.8345,
138
+ "step": 150
139
+ },
140
+ {
141
+ "epoch": 0.08643042350907519,
142
+ "eval_loss": 1.5110596418380737,
143
+ "eval_runtime": 45.1761,
144
+ "eval_samples_per_second": 16.181,
145
+ "eval_steps_per_second": 4.051,
146
+ "step": 150
147
  }
148
  ],
149
  "logging_steps": 10,
 
158
  "early_stopping_threshold": 0.0
159
  },
160
  "attributes": {
161
+ "early_stopping_patience_counter": 2
162
  }
163
  },
164
  "TrainerControl": {
 
172
  "attributes": {}
173
  }
174
  },
175
+ "total_flos": 2.708774936641536e+16,
176
  "train_batch_size": 4,
177
  "trial_name": null,
178
  "trial_params": null