xuancoblab2023 committed on
Commit
eb43b89
·
verified ·
1 Parent(s): 1082471

Training in progress, epoch 1

Browse files
logs/events.out.tfevents.1711203362.a08db75a0e93.4335.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:71fe8ea276034d50ea2662487d33044c22d787b07263563c26bc2054c6a3ae66
3
- size 17642
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fe9be7ab2d5b1bc79a7e0d52c51ede7b7d10f52b4d484c8856134da3a874770
3
+ size 18679
logs/events.out.tfevents.1711205777.a08db75a0e93.4335.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78b630a9e465aa30be443299a34b49e6b081b0ba8d18c6b2ce1ee8f872140993
3
+ size 5346
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9d5b5c121b1eac187d043c4e323d50eadad9d5980290a5238c92477d7e0cdce8
3
  size 17549312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b076bb533559423580ae70c17097e396f62387c173c74e541e335bac8e7e180
3
  size 17549312
run-0/checkpoint-96/config.json CHANGED
@@ -27,7 +27,7 @@
27
  "position_embedding_type": "absolute",
28
  "problem_type": "single_label_classification",
29
  "torch_dtype": "float32",
30
- "transformers_version": "4.38.2",
31
  "type_vocab_size": 2,
32
  "use_cache": true,
33
  "vocab_size": 30522
 
27
  "position_embedding_type": "absolute",
28
  "problem_type": "single_label_classification",
29
  "torch_dtype": "float32",
30
+ "transformers_version": "4.39.1",
31
  "type_vocab_size": 2,
32
  "use_cache": true,
33
  "vocab_size": 30522
run-0/checkpoint-96/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a9deaf7b9483814e8658af2bd540c9c428e1d9d74902b8546da37c62a418f2b8
3
  size 17549312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b076bb533559423580ae70c17097e396f62387c173c74e541e335bac8e7e180
3
  size 17549312
run-0/checkpoint-96/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5e8f5ef6ee86d49f7eb75c8214eefcb88b1a2166ac8c9a098a261f23125fce34
3
  size 35122746
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33b703a05840ff22d318422c0edd034a5683303adcf0be6a9f507ceb8211b739
3
  size 35122746
run-0/checkpoint-96/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6bc13e09b59a62b6fb29cad756bfeefcce6f512c71a9054cc39e336db0b532a5
3
  size 14054
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24aa86019b8aea1c551cc1adaf38c4db2fc01de75a22af312230f6b592e0fd81
3
  size 14054
run-0/checkpoint-96/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5bd902627d0c1d565c70987837a95a63c8ee21875132d3259ea0ce69d0e7372a
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1deff0f11257c2d691ece1057908e736422281f9c02aff1f44118d31a5fc6ba2
3
  size 1064
run-0/checkpoint-96/trainer_state.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "best_metric": 0.5,
3
- "best_model_checkpoint": "tiny-bert-sst2-distilled/run-0/checkpoint-48",
4
- "epoch": 2.0,
5
  "eval_steps": 500,
6
  "global_step": 96,
7
  "is_hyper_param_search": true,
@@ -10,55 +10,36 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "grad_norm": 1.7277214527130127,
14
- "learning_rate": 7.1080634981543736e-06,
15
- "loss": 0.4421,
16
- "step": 48
17
- },
18
- {
19
- "epoch": 1.0,
20
- "eval_accuracy": 0.5,
21
- "eval_f1": 0.0,
22
- "eval_loss": 0.4095905125141144,
23
- "eval_precision": 0.0,
24
- "eval_recall": 0.0,
25
- "eval_runtime": 28.1077,
26
- "eval_samples_per_second": 36.36,
27
- "eval_steps_per_second": 0.569,
28
- "step": 48
29
- },
30
- {
31
- "epoch": 2.0,
32
- "grad_norm": 0.3527555465698242,
33
- "learning_rate": 3.5540317490771868e-06,
34
- "loss": 0.4039,
35
  "step": 96
36
  },
37
  {
38
- "epoch": 2.0,
39
- "eval_accuracy": 0.5,
40
- "eval_f1": 0.0,
41
- "eval_loss": 0.39591261744499207,
42
- "eval_precision": 0.0,
43
- "eval_recall": 0.0,
44
- "eval_runtime": 27.762,
45
- "eval_samples_per_second": 36.813,
46
- "eval_steps_per_second": 0.576,
47
  "step": 96
48
  }
49
  ],
50
  "logging_steps": 500,
51
- "max_steps": 144,
52
  "num_input_tokens_seen": 0,
53
- "num_train_epochs": 3,
54
  "save_steps": 500,
55
- "total_flos": 471390394560.0,
56
- "train_batch_size": 64,
57
  "trial_name": null,
58
  "trial_params": {
59
- "alpha": 0.48386139243976256,
60
- "learning_rate": 1.066209524723156e-05,
61
- "num_train_epochs": 3,
62
- "temperature": 23
63
  }
64
  }
 
1
  {
2
+ "best_metric": 0.4980430528375734,
3
+ "best_model_checkpoint": "tiny-bert-sst2-distilled/run-0/checkpoint-96",
4
+ "epoch": 1.0,
5
  "eval_steps": 500,
6
  "global_step": 96,
7
  "is_hyper_param_search": true,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "grad_norm": 0.8380242586135864,
14
+ "learning_rate": 8.6265645867868e-06,
15
+ "loss": 0.6538,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
16
  "step": 96
17
  },
18
  {
19
+ "epoch": 1.0,
20
+ "eval_accuracy": 0.4980430528375734,
21
+ "eval_f1": 0.06215722120658134,
22
+ "eval_loss": 0.6460775136947632,
23
+ "eval_precision": 0.4722222222222222,
24
+ "eval_recall": 0.033268101761252444,
25
+ "eval_runtime": 32.7473,
26
+ "eval_samples_per_second": 31.209,
27
+ "eval_steps_per_second": 0.977,
28
  "step": 96
29
  }
30
  ],
31
  "logging_steps": 500,
32
+ "max_steps": 576,
33
  "num_input_tokens_seen": 0,
34
+ "num_train_epochs": 6,
35
  "save_steps": 500,
36
+ "total_flos": 235695197280.0,
37
+ "train_batch_size": 32,
38
  "trial_name": null,
39
  "trial_params": {
40
+ "alpha": 0.9136100763812092,
41
+ "learning_rate": 1.035187750414416e-05,
42
+ "num_train_epochs": 6,
43
+ "temperature": 5
44
  }
45
  }
run-0/checkpoint-96/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:103518af05e87893001984e8fe4e4fbdef270179595accd70434e2248c87999d
3
  size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebe7dd3c3e257754c6583ea668a830f19b3dc80cb7982abc3ddecb0dac8e92b5
3
  size 4920
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2c0967cc1aebc72646b1634b2a505d0131b61790f8449416683fb0b8bf534fc0
3
  size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebe7dd3c3e257754c6583ea668a830f19b3dc80cb7982abc3ddecb0dac8e92b5
3
  size 4920