xuancoblab2023 commited on
Commit
97ee9f5
·
verified ·
1 Parent(s): aaff26e

Training in progress, epoch 1

Browse files
logs/events.out.tfevents.1709699344.a2333cf40ebd.21010.9 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7d11f8656f960a8d66413d3f027d70c316fa595c20289fc0899ff6623b4aff68
3
- size 5315
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a915fc24599d0118bd0ce3f4c2df13cb9694a0c6ec2e9ab10020c882d0aefc18
3
+ size 5998
logs/events.out.tfevents.1709699573.a2333cf40ebd.21010.10 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74a80c0d3ab62a0fa626e8b75d0139975fbfc23c421938b426ea598551984455
3
+ size 5314
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d8d6934d852376a5bc13fbfb17016d4c3adcd7b7bdd42a9aab8b9b5d9f62a1b
3
  size 17549312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e79087651dbe07597bcc519c0603106d4238d761309189dc1d8c49bbe9fbdd0
3
  size 17549312
run-10/checkpoint-96/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3735ea28e3d6cd1886c3e5c7b2785a2ab71ac55d4b90d7f42c9458c9b695f9ba
3
  size 17549312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e79087651dbe07597bcc519c0603106d4238d761309189dc1d8c49bbe9fbdd0
3
  size 17549312
run-10/checkpoint-96/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3bce6830ac8b5a9392d5fdf74c2ac9c0069f48622b95ea10f88257a2f7bea411
3
  size 35122746
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3771f7ce5a1e746e27d5b4f30b62b81054ea67cf657063408de78b4fac6385f5
3
  size 35122746
run-10/checkpoint-96/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:36e71e872b9193820685ba7498cf93679ddf638b478b2d60f14aa587fd2c9678
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35ad384a49732bbba66f365d68a02bf664cf1489238a42c775ec81b19b0b82fa
3
  size 1064
run-10/checkpoint-96/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.799412915851272,
3
  "best_model_checkpoint": "tiny-bert-sst2-distilled/run-10/checkpoint-96",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
@@ -10,36 +10,36 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "grad_norm": 1.9170680046081543,
14
- "learning_rate": 0.0005212663608648181,
15
- "loss": 0.5641,
16
  "step": 96
17
  },
18
  {
19
  "epoch": 1.0,
20
- "eval_accuracy": 0.799412915851272,
21
- "eval_f1": 0.8197009674582234,
22
- "eval_loss": 0.47259676456451416,
23
- "eval_precision": 0.744408945686901,
24
- "eval_recall": 0.9119373776908023,
25
- "eval_runtime": 30.8424,
26
- "eval_samples_per_second": 33.136,
27
- "eval_steps_per_second": 1.038,
28
  "step": 96
29
  }
30
  ],
31
  "logging_steps": 500,
32
- "max_steps": 288,
33
  "num_input_tokens_seen": 0,
34
- "num_train_epochs": 3,
35
  "save_steps": 500,
36
  "total_flos": 235695197280.0,
37
  "train_batch_size": 32,
38
  "trial_name": null,
39
  "trial_params": {
40
- "alpha": 0.9610512963031814,
41
- "learning_rate": 0.0007818995412972273,
42
- "num_train_epochs": 3,
43
- "temperature": 24
44
  }
45
  }
 
1
  {
2
+ "best_metric": 0.7524461839530333,
3
  "best_model_checkpoint": "tiny-bert-sst2-distilled/run-10/checkpoint-96",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "grad_norm": 2.535670757293701,
14
+ "learning_rate": 0.00048723007690763744,
15
+ "loss": 0.5767,
16
  "step": 96
17
  },
18
  {
19
  "epoch": 1.0,
20
+ "eval_accuracy": 0.7524461839530333,
21
+ "eval_f1": 0.7924528301886793,
22
+ "eval_loss": 0.4912106394767761,
23
+ "eval_precision": 0.6822033898305084,
24
+ "eval_recall": 0.9452054794520548,
25
+ "eval_runtime": 30.3562,
26
+ "eval_samples_per_second": 33.667,
27
+ "eval_steps_per_second": 1.054,
28
  "step": 96
29
  }
30
  ],
31
  "logging_steps": 500,
32
+ "max_steps": 192,
33
  "num_input_tokens_seen": 0,
34
+ "num_train_epochs": 2,
35
  "save_steps": 500,
36
  "total_flos": 235695197280.0,
37
  "train_batch_size": 32,
38
  "trial_name": null,
39
  "trial_params": {
40
+ "alpha": 0.964566953098255,
41
+ "learning_rate": 0.0009744601538152749,
42
+ "num_train_epochs": 2,
43
+ "temperature": 30
44
  }
45
  }
run-10/checkpoint-96/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c48cb920a64a7322ad1d6d741321a643be4ed10af970a24a154150a0def2990
3
  size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b603cc11f59a882aaaffb8f9536f958187e41d9698ff3658445388c161757421
3
  size 4920
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4c88ab003cb8d443d320a7d2a50b7663500e4bdf0605d3f2691a06db8acbcf72
3
  size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b603cc11f59a882aaaffb8f9536f958187e41d9698ff3658445388c161757421
3
  size 4920