xuancoblab2023 committed on
Commit
d85e1c4
·
verified ·
1 Parent(s): 4152099

Training in progress, epoch 2

Browse files
logs/events.out.tfevents.1709716821.adc675a344d5.67573.3 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4cfec70353e1792393f9035254bbeb24c0f5630ab9c360b83e0ba97f5cb09f47
3
- size 5314
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3abafa2afbf81d92c37577fddf8088e64f889d1326f127e309cb795a84261afc
3
+ size 5997
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:12de485927495a54a42aa2b293b0adf412d00170117941f81fbe4835dce02946
3
  size 17549312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c2bbc0e16334675397da6eae3f9cec97a7ba066c14dfe9bfaeecbe8ce680b43
3
  size 17549312
run-2/checkpoint-192/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:444ec7032343c5e48a0bebcbc727c0d6dcc53de822b7281218d78d3d52fc74a5
3
  size 17549312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c2bbc0e16334675397da6eae3f9cec97a7ba066c14dfe9bfaeecbe8ce680b43
3
  size 17549312
run-2/checkpoint-192/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a7d65e468a5ea6ece563e4a260f8a916b8919ff2c935298cbc0e77b353da1ae9
3
  size 35122746
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f360aeb57e55cec8e68847ef51bb3de32b78e5a1d86bbea3082e69c5a0126e5b
3
  size 35122746
run-2/checkpoint-192/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:76b1ca96b43548704a5f4d11597321c5afbd7e065f2cc83810db95ee4c1c77f7
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bff0ab8e040a10e09a99435f8ce9d9312e47d8d81f03c526f96c8267c11c97d
3
  size 1064
run-2/checkpoint-192/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.8140900195694716,
3
  "best_model_checkpoint": "tiny-bert-sst2-distilled/run-2/checkpoint-192",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
@@ -10,55 +10,55 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "grad_norm": 3.4323604106903076,
14
- "learning_rate": 0.0004667999543114754,
15
- "loss": 0.533,
16
  "step": 96
17
  },
18
  {
19
  "epoch": 1.0,
20
- "eval_accuracy": 0.7984344422700587,
21
- "eval_f1": 0.8049242424242424,
22
- "eval_loss": 0.4442267119884491,
23
- "eval_precision": 0.7798165137614679,
24
- "eval_recall": 0.8317025440313112,
25
- "eval_runtime": 28.6457,
26
- "eval_samples_per_second": 35.677,
27
- "eval_steps_per_second": 1.117,
28
  "step": 96
29
  },
30
  {
31
  "epoch": 2.0,
32
- "grad_norm": 2.4163033962249756,
33
- "learning_rate": 0.0,
34
- "loss": 0.4374,
35
  "step": 192
36
  },
37
  {
38
  "epoch": 2.0,
39
- "eval_accuracy": 0.8140900195694716,
40
- "eval_f1": 0.8243992606284659,
41
- "eval_loss": 0.4299594759941101,
42
- "eval_precision": 0.7810858143607706,
43
- "eval_recall": 0.87279843444227,
44
- "eval_runtime": 28.93,
45
- "eval_samples_per_second": 35.327,
46
- "eval_steps_per_second": 1.106,
47
  "step": 192
48
  }
49
  ],
50
  "logging_steps": 500,
51
- "max_steps": 192,
52
  "num_input_tokens_seen": 0,
53
- "num_train_epochs": 2,
54
  "save_steps": 500,
55
  "total_flos": 471390394560.0,
56
  "train_batch_size": 32,
57
  "trial_name": null,
58
  "trial_params": {
59
- "alpha": 0.88253398201078,
60
- "learning_rate": 0.0009335999086229508,
61
- "num_train_epochs": 2,
62
- "temperature": 19
63
  }
64
  }
 
1
  {
2
+ "best_metric": 0.5675146771037182,
3
  "best_model_checkpoint": "tiny-bert-sst2-distilled/run-2/checkpoint-192",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "grad_norm": 0.663398027420044,
14
+ "learning_rate": 0.00027867701883546326,
15
+ "loss": 0.2787,
16
  "step": 96
17
  },
18
  {
19
  "epoch": 1.0,
20
+ "eval_accuracy": 0.5499021526418787,
21
+ "eval_f1": 0.24092409240924093,
22
+ "eval_loss": 0.25340619683265686,
23
+ "eval_precision": 0.7684210526315789,
24
+ "eval_recall": 0.14285714285714285,
25
+ "eval_runtime": 28.5207,
26
+ "eval_samples_per_second": 35.834,
27
+ "eval_steps_per_second": 1.122,
28
  "step": 96
29
  },
30
  {
31
  "epoch": 2.0,
32
+ "grad_norm": 0.7603411078453064,
33
+ "learning_rate": 0.00024384239148103037,
34
+ "loss": 0.2582,
35
  "step": 192
36
  },
37
  {
38
  "epoch": 2.0,
39
+ "eval_accuracy": 0.5675146771037182,
40
+ "eval_f1": 0.300632911392405,
41
+ "eval_loss": 0.2482573688030243,
42
+ "eval_precision": 0.7851239669421488,
43
+ "eval_recall": 0.18590998043052837,
44
+ "eval_runtime": 28.5782,
45
+ "eval_samples_per_second": 35.762,
46
+ "eval_steps_per_second": 1.12,
47
  "step": 192
48
  }
49
  ],
50
  "logging_steps": 500,
51
+ "max_steps": 864,
52
  "num_input_tokens_seen": 0,
53
+ "num_train_epochs": 9,
54
  "save_steps": 500,
55
  "total_flos": 471390394560.0,
56
  "train_batch_size": 32,
57
  "trial_name": null,
58
  "trial_params": {
59
+ "alpha": 0.3483609408663828,
60
+ "learning_rate": 0.0003135116461898962,
61
+ "num_train_epochs": 9,
62
+ "temperature": 7
63
  }
64
  }
run-2/checkpoint-192/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2659042d49fa36ce1404b1f7057dd4643dc22f653d1fc44d521700862149e4b7
3
  size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7adcc08e8d37cad0335688bbf483a90600b348a62bf08e2b72452e95967f2a4
3
  size 4920