DuongTrongChi commited on
Commit
319dccc
·
verified ·
1 Parent(s): 23b5d8c

Training in progress, step 174, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:44626cc94e4ae4ef2189f492ec6a02f6a9cf34d81e54c3c0d3c5d06f2b5db83b
3
  size 73911112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56a2e73c9f0ba15318c013faf0d516ee65831595556a20e8cc91038732cbb63f
3
  size 73911112
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:20b50b88935790b9e8a1ab3ebd399aafd75c99d1e6cae3998824e30f7299dfba
3
  size 37430836
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79a0e23d7291a4e9f915b30d705155a393e8800f2f6f4e596397adff82be650e
3
  size 37430836
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd41ad516c648e6a91e8eb789b6ec82ae8142cda642d8cd2955159250148cb8d
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77a17188e5eae813466d478a1f96ede6eeeb68c0c6586491c70042c476c86443
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.4663923182441701,
5
  "eval_steps": 500,
6
- "global_step": 170,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -1197,6 +1197,34 @@
1197
  "learning_rate": 0.00014696969696969698,
1198
  "loss": 1.3067,
1199
  "step": 170
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1200
  }
1201
  ],
1202
  "logging_steps": 1,
@@ -1216,7 +1244,7 @@
1216
  "attributes": {}
1217
  }
1218
  },
1219
- "total_flos": 2.109386405851054e+17,
1220
  "train_batch_size": 4,
1221
  "trial_name": null,
1222
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.4773662551440329,
5
  "eval_steps": 500,
6
+ "global_step": 174,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
1197
  "learning_rate": 0.00014696969696969698,
1198
  "loss": 1.3067,
1199
  "step": 170
1200
+ },
1201
+ {
1202
+ "epoch": 0.4691358024691358,
1203
+ "grad_norm": 0.14815697073936462,
1204
+ "learning_rate": 0.00014621212121212123,
1205
+ "loss": 1.2492,
1206
+ "step": 171
1207
+ },
1208
+ {
1209
+ "epoch": 0.4718792866941015,
1210
+ "grad_norm": 0.13748030364513397,
1211
+ "learning_rate": 0.00014545454545454546,
1212
+ "loss": 1.2281,
1213
+ "step": 172
1214
+ },
1215
+ {
1216
+ "epoch": 0.47462277091906724,
1217
+ "grad_norm": 0.14712287485599518,
1218
+ "learning_rate": 0.0001446969696969697,
1219
+ "loss": 1.1438,
1220
+ "step": 173
1221
+ },
1222
+ {
1223
+ "epoch": 0.4773662551440329,
1224
+ "grad_norm": 0.13734129071235657,
1225
+ "learning_rate": 0.00014393939393939396,
1226
+ "loss": 1.2528,
1227
+ "step": 174
1228
  }
1229
  ],
1230
  "logging_steps": 1,
 
1244
  "attributes": {}
1245
  }
1246
  },
1247
+ "total_flos": 2.1599650151780352e+17,
1248
  "train_batch_size": 4,
1249
  "trial_name": null,
1250
  "trial_params": null