xuancoblab2023 commited on
Commit
385e44f
·
verified ·
1 Parent(s): cea2cdf

Training in progress, epoch 1

Browse files
logs/events.out.tfevents.1709737131.1dcff7455174.4515.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d91e9148ba06f491d0300049693c2341f409577e770e2d96ea5a140e22454fc6
3
+ size 4184
logs/events.out.tfevents.1709737211.1dcff7455174.7719.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c9e523b45bc117c2c3cbadd311f9ddb670d13903eeffafd785984849a8ace2c
3
+ size 5315
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7792eeef88f2b040b67cfb87d16e308ac052158fc8773d47734046de06043a16
3
  size 17549312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c92adc7dcf01e1fbb05511c4493199b42d344e3981283ab521c477e538f9aceb
3
  size 17549312
run-0/checkpoint-96/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:436c1223e40cc411f216b7a6eb698829ee74318f91d2f9ee826e701f17df37dd
3
  size 17549312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c92adc7dcf01e1fbb05511c4493199b42d344e3981283ab521c477e538f9aceb
3
  size 17549312
run-0/checkpoint-96/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:14bc0388b3bb04b006cead065a5f3631ae5c4ff9034a98aaaa7d3d7bb6d3b660
3
  size 35122746
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db3824b1c6f237bcf65a54ea4cca3aa03e4cfa3c81a3b6afc4e72e03c759249e
3
  size 35122746
run-0/checkpoint-96/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:98396641528716b08d59d05e7221ff89e68ef8805fd0936c83a7ab0df7e80e0c
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43ddd3b1c41613cd7e1e1227d929645b76a450f62d1a6ce5575c2f7873d9d0b6
3
  size 1064
run-0/checkpoint-96/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.7436399217221135,
3
  "best_model_checkpoint": "tiny-bert-sst2-distilled/run-0/checkpoint-96",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
@@ -10,36 +10,36 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "grad_norm": 1.8004393577575684,
14
- "learning_rate": 0.0007697157586205755,
15
- "loss": 0.4935,
16
  "step": 96
17
  },
18
  {
19
  "epoch": 1.0,
20
- "eval_accuracy": 0.7436399217221135,
21
- "eval_f1": 0.7689594356261024,
22
- "eval_loss": 0.448881596326828,
23
- "eval_precision": 0.6998394863563403,
24
- "eval_recall": 0.8532289628180039,
25
- "eval_runtime": 28.6476,
26
- "eval_samples_per_second": 35.675,
27
- "eval_steps_per_second": 1.117,
28
  "step": 96
29
  }
30
  ],
31
  "logging_steps": 500,
32
- "max_steps": 960,
33
  "num_input_tokens_seen": 0,
34
- "num_train_epochs": 10,
35
  "save_steps": 500,
36
  "total_flos": 235695197280.0,
37
  "train_batch_size": 32,
38
  "trial_name": null,
39
  "trial_params": {
40
- "alpha": 0.735211359802956,
41
- "learning_rate": 0.0008552397318006393,
42
- "num_train_epochs": 10,
43
- "temperature": 25
44
  }
45
  }
 
1
  {
2
+ "best_metric": 0.7514677103718199,
3
  "best_model_checkpoint": "tiny-bert-sst2-distilled/run-0/checkpoint-96",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "grad_norm": 1.6740443706512451,
14
+ "learning_rate": 0.0001218354408608861,
15
+ "loss": 0.4816,
16
  "step": 96
17
  },
18
  {
19
  "epoch": 1.0,
20
+ "eval_accuracy": 0.7514677103718199,
21
+ "eval_f1": 0.7519531250000001,
22
+ "eval_loss": 0.41538161039352417,
23
+ "eval_precision": 0.7504873294346979,
24
+ "eval_recall": 0.7534246575342466,
25
+ "eval_runtime": 26.5175,
26
+ "eval_samples_per_second": 38.541,
27
+ "eval_steps_per_second": 1.207,
28
  "step": 96
29
  }
30
  ],
31
  "logging_steps": 500,
32
+ "max_steps": 480,
33
  "num_input_tokens_seen": 0,
34
+ "num_train_epochs": 5,
35
  "save_steps": 500,
36
  "total_flos": 235695197280.0,
37
  "train_batch_size": 32,
38
  "trial_name": null,
39
  "trial_params": {
40
+ "alpha": 0.679174768290245,
41
+ "learning_rate": 0.00015229430107610762,
42
+ "num_train_epochs": 5,
43
+ "temperature": 27
44
  }
45
  }
run-0/checkpoint-96/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:23804eaaa0feed30486319d2982557f65dce708f7d788864c811c20b2e8c33b4
3
  size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1873f3a503b2d5b3f7200baa33f737ba864dd65edb3834d85c5b8e40b6b72f07
3
  size 4920
tokenizer.json CHANGED
@@ -2,7 +2,7 @@
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
- "max_length": 33,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
 
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
+ "max_length": 31,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ccea265ae9122da077ff8def664c83c587f85ed26bee202b170a564116cd542
3
  size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1873f3a503b2d5b3f7200baa33f737ba864dd65edb3834d85c5b8e40b6b72f07
3
  size 4920