xuancoblab2023 commited on
Commit
85b9aa8
·
verified ·
1 Parent(s): 112c097

Training in progress, epoch 1

Browse files
logs/events.out.tfevents.1711265559.73e3a81c01ef.413.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c360d659b9598e9424aca54f91f2d5cf27de071ff70f1c0cc9c41e4d90ba052
3
+ size 4184
logs/events.out.tfevents.1711265653.73e3a81c01ef.4225.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29328cc7547f41743a4985f8d99faf99f508f44dea209ce91b456a7d804ef40f
3
+ size 5407
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:29082dbaea3f8e47cfcc31c6e16d3679b1f3daafed858d8b69e14033805c58b9
3
  size 17549312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70b7f7f1a78e0b340b57dfae4e8a71ef78a3dbee8319a311f6096e6cf4233908
3
  size 17549312
run-0/checkpoint-192/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9ad0bd06080c9950cf0b32ccbbbcf6703c55e10377efa299383ee3e5fbe872af
3
  size 17549312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70b7f7f1a78e0b340b57dfae4e8a71ef78a3dbee8319a311f6096e6cf4233908
3
  size 17549312
run-0/checkpoint-192/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:010a84581763e78e630b72ef20feb9007b160dc66fe58d5b5e40e5c8dce9d715
3
  size 35122746
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:356dee3ad756ad1b2b75bf326a1853ce70012cbc769d26f68477c7f9a8c9d542
3
  size 35122746
run-0/checkpoint-192/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5c58c0607d97c986e9d4c30b0aa74b33350e0c7e86978aaaaadda4ebb78f21ad
3
  size 14054
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee09ea0d216727b799a80771850b95d7d61b646360702c64b2ec889cdc725399
3
  size 14054
run-0/checkpoint-192/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae35fc790746b06c7bed32afc0cf4fb21caaf6a541d31f420d923a2b79458e53
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5203618527782331a9cff178ca211eed05dd20856984abcc56b6a5b95a15783
3
  size 1064
run-0/checkpoint-192/trainer_state.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "best_metric": 0.5,
3
  "best_model_checkpoint": "tiny-bert-sst2-distilled/run-0/checkpoint-192",
4
- "epoch": 2.0,
5
  "eval_steps": 500,
6
  "global_step": 192,
7
  "is_hyper_param_search": true,
@@ -10,55 +10,38 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "grad_norm": 0.8380242586135864,
14
- "learning_rate": 8.6265645867868e-06,
15
- "loss": 0.6538,
16
- "step": 96
17
- },
18
- {
19
- "epoch": 1.0,
20
- "eval_accuracy": 0.4980430528375734,
21
- "eval_f1": 0.06215722120658134,
22
- "eval_loss": 0.6460775136947632,
23
- "eval_precision": 0.4722222222222222,
24
- "eval_recall": 0.033268101761252444,
25
- "eval_runtime": 32.7473,
26
- "eval_samples_per_second": 31.209,
27
- "eval_steps_per_second": 0.977,
28
- "step": 96
29
- },
30
- {
31
- "epoch": 2.0,
32
- "grad_norm": 1.982408046722412,
33
- "learning_rate": 6.901251669429439e-06,
34
- "loss": 0.6453,
35
  "step": 192
36
  },
37
  {
38
- "epoch": 2.0,
39
- "eval_accuracy": 0.5,
40
- "eval_f1": 0.019193857965451058,
41
- "eval_loss": 0.6427881717681885,
42
- "eval_precision": 0.5,
43
- "eval_recall": 0.009784735812133072,
44
- "eval_runtime": 30.8528,
45
- "eval_samples_per_second": 33.125,
46
- "eval_steps_per_second": 1.037,
 
47
  "step": 192
48
  }
49
  ],
50
  "logging_steps": 500,
51
- "max_steps": 576,
52
  "num_input_tokens_seen": 0,
53
- "num_train_epochs": 6,
54
  "save_steps": 500,
55
- "total_flos": 471390394560.0,
56
- "train_batch_size": 32,
57
  "trial_name": null,
58
  "trial_params": {
59
- "alpha": 0.9136100763812092,
60
- "learning_rate": 1.035187750414416e-05,
61
- "num_train_epochs": 6,
62
- "temperature": 5
 
63
  }
64
  }
 
1
  {
2
+ "best_metric": 0.6976516634050881,
3
  "best_model_checkpoint": "tiny-bert-sst2-distilled/run-0/checkpoint-192",
4
+ "epoch": 1.0,
5
  "eval_steps": 500,
6
  "global_step": 192,
7
  "is_hyper_param_search": true,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "grad_norm": 1.7846055030822754,
14
+ "learning_rate": 4.610177667546352e-05,
15
+ "loss": 0.4587,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
16
  "step": 192
17
  },
18
  {
19
+ "epoch": 1.0,
20
+ "eval_accuracy": 0.6976516634050881,
21
+ "eval_f1": 0.6419466975666281,
22
+ "eval_loss": 0.4008609354496002,
23
+ "eval_mcc": 0.41595144404027,
24
+ "eval_precision": 0.7869318181818182,
25
+ "eval_recall": 0.5420743639921722,
26
+ "eval_runtime": 66.5688,
27
+ "eval_samples_per_second": 15.353,
28
+ "eval_steps_per_second": 0.481,
29
  "step": 192
30
  }
31
  ],
32
  "logging_steps": 500,
33
+ "max_steps": 1920,
34
  "num_input_tokens_seen": 0,
35
+ "num_train_epochs": 10,
36
  "save_steps": 500,
37
+ "total_flos": 235695197280.0,
38
+ "train_batch_size": 16,
39
  "trial_name": null,
40
  "trial_params": {
41
+ "alpha": 0.6226480553446316,
42
+ "learning_rate": 5.122419630607058e-05,
43
+ "num_train_epochs": 10,
44
+ "per_device_train_batch_size": 16,
45
+ "temperature": 20
46
  }
47
  }
run-0/checkpoint-192/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ebe7dd3c3e257754c6583ea668a830f19b3dc80cb7982abc3ddecb0dac8e92b5
3
- size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbca9cde0b156ba25d74ee6bc6ea4c2fa160afa3570e75ccc73231ac4a159c49
3
+ size 4984
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2c0967cc1aebc72646b1634b2a505d0131b61790f8449416683fb0b8bf534fc0
3
- size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbca9cde0b156ba25d74ee6bc6ea4c2fa160afa3570e75ccc73231ac4a159c49
3
+ size 4984