tmnam20 commited on
Commit
abfe966
·
1 Parent(s): e76f4b9

Training in progress, step 100, checkpoint

Browse files
checkpoint-100/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:96df8dd678de7c9d23cf5f8dda9133a83dd98dfb460ea95a4fb2dc22d8752365
3
  size 1474893317
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:656ed54fe0a8b84aa66db81f903d3ddbb3aca7edcab5c1769c3d44f87fe90939
3
  size 1474893317
checkpoint-100/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4141ef29c5d1a3d0269840b8d7cb6b4cbd2f3c34a45521eb10df3e8f3d1ce399
3
  size 737457141
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:057eda2c682bf9d9c903eb92f7c38cd743ca463e0c19fef70ca36d331551a8b1
3
  size 737457141
checkpoint-100/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5ee42ba47149d52ce0f1b0e713f48f980d6f585d6f1d401fc0f38d3db1416b62
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e9624411eb0f1fd660261f3e4d9bcc1fe5110e59f1a1401372c693dafb1d75e
3
  size 14575
checkpoint-100/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6722ec8c45928bf7d3dc083d89fb6e8c1e5f98313ddbf4c3c80ba8ab0cf5d2ef
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20769b67f2ef261d19043e9e784bd3f0a87b8b69b311de1d28c2468463bc32ba
3
  size 627
checkpoint-100/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.6272028088569641,
3
  "best_model_checkpoint": "/kaggle/output/checkpoint-100",
4
  "epoch": 0.2066115702479339,
5
  "eval_steps": 50,
@@ -10,34 +10,46 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.0,
13
- "learning_rate": 1.6666666666666667e-06,
14
- "loss": 0.6979,
15
  "step": 1
16
  },
 
 
 
 
 
 
17
  {
18
  "epoch": 0.1,
19
  "eval_accuracy": 0.75,
20
- "eval_loss": 0.6723740696907043,
21
- "eval_runtime": 28.903,
22
- "eval_samples_per_second": 40.965,
23
- "eval_steps_per_second": 20.482,
24
  "step": 50
25
  },
 
 
 
 
 
 
26
  {
27
  "epoch": 0.21,
28
  "eval_accuracy": 0.75,
29
- "eval_loss": 0.6272028088569641,
30
- "eval_runtime": 28.756,
31
- "eval_samples_per_second": 41.174,
32
- "eval_steps_per_second": 20.587,
33
  "step": 100
34
  }
35
  ],
36
- "logging_steps": 1000,
37
  "max_steps": 1000,
38
  "num_train_epochs": 3,
39
  "save_steps": 100,
40
- "total_flos": 322260294311640.0,
41
  "trial_name": null,
42
  "trial_params": null
43
  }
 
1
  {
2
+ "best_metric": 0.5696164965629578,
3
  "best_model_checkpoint": "/kaggle/output/checkpoint-100",
4
  "epoch": 0.2066115702479339,
5
  "eval_steps": 50,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.0,
13
+ "learning_rate": 0.0,
14
+ "loss": 0.7246,
15
  "step": 1
16
  },
17
+ {
18
+ "epoch": 0.1,
19
+ "learning_rate": 7.333333333333332e-05,
20
+ "loss": 0.5982,
21
+ "step": 50
22
+ },
23
  {
24
  "epoch": 0.1,
25
  "eval_accuracy": 0.75,
26
+ "eval_loss": 0.6296697854995728,
27
+ "eval_runtime": 30.5612,
28
+ "eval_samples_per_second": 38.742,
29
+ "eval_steps_per_second": 19.371,
30
  "step": 50
31
  },
32
+ {
33
+ "epoch": 0.21,
34
+ "learning_rate": 0.00015,
35
+ "loss": 0.5505,
36
+ "step": 100
37
+ },
38
  {
39
  "epoch": 0.21,
40
  "eval_accuracy": 0.75,
41
+ "eval_loss": 0.5696164965629578,
42
+ "eval_runtime": 30.5816,
43
+ "eval_samples_per_second": 38.716,
44
+ "eval_steps_per_second": 19.358,
45
  "step": 100
46
  }
47
  ],
48
+ "logging_steps": 50,
49
  "max_steps": 1000,
50
  "num_train_epochs": 3,
51
  "save_steps": 100,
52
+ "total_flos": 348571871706840.0,
53
  "trial_name": null,
54
  "trial_params": null
55
  }
checkpoint-100/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fbe5e88ca49040823bdb83dc035b8a4470c58ae105b0482f624b7d48f5e08cbe
3
  size 4027
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd0372335b8d69875fb40a5865f6914bab9ff539640d01b439e8f707b1e5a43d
3
  size 4027