DuongTrongChi commited on
Commit
0f1a91b
·
verified ·
1 Parent(s): 4948755

Training in progress, step 59, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:18e1fa113e6149ce9c6ce95ed8a7aeeab5f87e234d1b33709c3dbb7f598be74c
3
  size 73911112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3aff3636ab3523c875e895edf1c22ffba31c1bd38d1a6e2f1984f4373d0f60d
3
  size 73911112
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:01036a507461b9269482d82d9e8e9d29fc4ea4955d2c69274168112f597313e8
3
  size 37430836
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0796cbd549515f8a66cd097c13d51c18287da5b3a0bfc23819777bcfeb7ae594
3
  size 37430836
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:060fb8d01e61c5a9e60483fa6352a837a9ab184977ffc490aaafd24dbde173a4
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea916cbeea5eaa52a1f1be13dd70aec5eda379a7398c920ae7786ff902929743
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.15089163237311384,
5
  "eval_steps": 500,
6
- "global_step": 55,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -392,6 +392,34 @@
392
  "learning_rate": 0.00011000000000000002,
393
  "loss": 1.3694,
394
  "step": 55
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
395
  }
396
  ],
397
  "logging_steps": 1,
@@ -411,7 +439,7 @@
411
  "attributes": {}
412
  }
413
  },
414
- "total_flos": 6.802733722810368e+16,
415
  "train_batch_size": 4,
416
  "trial_name": null,
417
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.16186556927297668,
5
  "eval_steps": 500,
6
+ "global_step": 59,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
392
  "learning_rate": 0.00011000000000000002,
393
  "loss": 1.3694,
394
  "step": 55
395
+ },
396
+ {
397
+ "epoch": 0.15363511659807957,
398
+ "grad_norm": 0.15829141438007355,
399
+ "learning_rate": 0.00011200000000000001,
400
+ "loss": 1.3351,
401
+ "step": 56
402
+ },
403
+ {
404
+ "epoch": 0.15637860082304528,
405
+ "grad_norm": 0.16939309239387512,
406
+ "learning_rate": 0.00011399999999999999,
407
+ "loss": 1.3487,
408
+ "step": 57
409
+ },
410
+ {
411
+ "epoch": 0.15912208504801098,
412
+ "grad_norm": 0.19683969020843506,
413
+ "learning_rate": 0.000116,
414
+ "loss": 1.2837,
415
+ "step": 58
416
+ },
417
+ {
418
+ "epoch": 0.16186556927297668,
419
+ "grad_norm": 0.17148783802986145,
420
+ "learning_rate": 0.000118,
421
+ "loss": 1.3372,
422
+ "step": 59
423
  }
424
  ],
425
  "logging_steps": 1,
 
439
  "attributes": {}
440
  }
441
  },
442
+ "total_flos": 7.302877225272115e+16,
443
  "train_batch_size": 4,
444
  "trial_name": null,
445
  "trial_params": null