xuancoblab2023 committed on Mar 6, 2024

Commit

33b4607

verified ·

1 Parent(s): f9d3f0f

Training in progress, epoch 1

Browse files

Files changed (39) hide show

logs/events.out.tfevents.1709750832.d65e8524b0f6.5185.27 +2 -2
logs/events.out.tfevents.1709751390.d65e8524b0f6.5185.28 +3 -0
logs/events.out.tfevents.1709751499.d65e8524b0f6.5185.29 +3 -0
logs/events.out.tfevents.1709751609.d65e8524b0f6.5185.30 +3 -0
model.safetensors +1 -1
run-27/checkpoint-156/config.json +34 -0
run-27/checkpoint-156/model.safetensors +3 -0
run-27/checkpoint-156/optimizer.pt +3 -0
run-27/checkpoint-156/rng_state.pth +3 -0
run-27/checkpoint-156/scheduler.pt +3 -0
run-27/checkpoint-156/special_tokens_map.json +7 -0
run-27/checkpoint-156/tokenizer.json +0 -0
run-27/checkpoint-156/tokenizer_config.json +57 -0
run-27/checkpoint-156/trainer_state.json +84 -0
run-27/checkpoint-156/training_args.bin +3 -0
run-27/checkpoint-156/vocab.txt +0 -0
run-27/checkpoint-208/config.json +34 -0
run-27/checkpoint-208/model.safetensors +3 -0
run-27/checkpoint-208/optimizer.pt +3 -0
run-27/checkpoint-208/rng_state.pth +3 -0
run-27/checkpoint-208/scheduler.pt +3 -0
run-27/checkpoint-208/special_tokens_map.json +7 -0
run-27/checkpoint-208/tokenizer.json +0 -0
run-27/checkpoint-208/tokenizer_config.json +57 -0
run-27/checkpoint-208/trainer_state.json +103 -0
run-27/checkpoint-208/training_args.bin +3 -0
run-27/checkpoint-208/vocab.txt +0 -0
run-30/checkpoint-56/config.json +34 -0
run-30/checkpoint-56/model.safetensors +3 -0
run-30/checkpoint-56/optimizer.pt +3 -0
run-30/checkpoint-56/rng_state.pth +3 -0
run-30/checkpoint-56/scheduler.pt +3 -0
run-30/checkpoint-56/special_tokens_map.json +7 -0
run-30/checkpoint-56/tokenizer.json +0 -0
run-30/checkpoint-56/tokenizer_config.json +57 -0
run-30/checkpoint-56/trainer_state.json +46 -0
run-30/checkpoint-56/training_args.bin +3 -0
run-30/checkpoint-56/vocab.txt +0 -0
training_args.bin +1 -1

logs/events.out.tfevents.1709750832.d65e8524b0f6.5185.27 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:083be76c70a17fd379b3ce494ebd39d8cf4cbb942a1375fa5c4f168d28f5c002
-size 5982
+oid sha256:b8ff4792f18318ccd15976635badc18ae9adf91ff674607257b4fa8122f488f3
+size 8031

logs/events.out.tfevents.1709751390.d65e8524b0f6.5185.28 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d948c512dcb0bd5524dfc50430f0c128b4412f47a9bcb9eafcf1895530e17a94
+size 5314

logs/events.out.tfevents.1709751499.d65e8524b0f6.5185.29 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:027fb39f30a4a59f0dc4446944d32fdfa1869302c10b4e6d3f9640c1252f1eff
+size 5315

logs/events.out.tfevents.1709751609.d65e8524b0f6.5185.30 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0cdde1c4d226c4bafe0b0d770467c5b0030d944445a11713ebfc832a77fbffa3
+size 5313

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c238afc7fd292738acca3d6e49d99d43d1ff9517fa1b5901ab675d443f382623
+oid sha256:8a5c00c89f0bb46b19d00bad6f9ed991aca6501b6a0a0e554e5e51f028f745e7
 size 17549312

run-27/checkpoint-156/config.json ADDED Viewed

	@@ -0,0 +1,34 @@

+{
+  "_name_or_path": "google/bert_uncased_L-2_H-128_A-2",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 128,
+  "id2label": {
+    "0": "negative",
+    "1": "positive"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 512,
+  "label2id": {
+    "negative": "0",
+    "positive": "1"
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 2,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

run-27/checkpoint-156/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cbaee8679ae68df8313d4988417e064084361e2903d1e8ad11f53a3e39585dc0
+size 17549312

run-27/checkpoint-156/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:99b354246d6913eba323884b4bcaa147118974bffb2b424433ce595924e03558
+size 35122746

run-27/checkpoint-156/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0f3f2bf3b854c592a6f1e0e90f14af49f8d742650373f022831e4b62d27ad7a2
+size 14054

run-27/checkpoint-156/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c3dc3c1c4292c0f67e651d61d07521cfb24eb08f79f962e161113c4869da5ddc
+size 1064

run-27/checkpoint-156/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-27/checkpoint-156/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-27/checkpoint-156/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,57 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_basic_tokenize": true,
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "never_split": null,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

run-27/checkpoint-156/trainer_state.json ADDED Viewed

	@@ -0,0 +1,84 @@

+{
+  "best_metric": 0.7778864970645792,
+  "best_model_checkpoint": "tiny-bert-sst2-distilled/run-27/checkpoint-156",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 156,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "grad_norm": 3.795090675354004,
+      "learning_rate": 0.0004299539034695828,
+      "loss": 0.5539,
+      "step": 52
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.7397260273972602,
+      "eval_f1": 0.7779632721202002,
+      "eval_loss": 0.49282991886138916,
+      "eval_precision": 0.6783114992721979,
+      "eval_recall": 0.9119373776908023,
+      "eval_runtime": 28.2474,
+      "eval_samples_per_second": 36.18,
+      "eval_steps_per_second": 1.133,
+      "step": 52
+    },
+    {
+      "epoch": 2.0,
+      "grad_norm": 2.3241050243377686,
+      "learning_rate": 0.0003582949195579857,
+      "loss": 0.4958,
+      "step": 104
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.776908023483366,
+      "eval_f1": 0.8074324324324325,
+      "eval_loss": 0.4643081724643707,
+      "eval_precision": 0.7102526002971769,
+      "eval_recall": 0.9354207436399217,
+      "eval_runtime": 28.4313,
+      "eval_samples_per_second": 35.946,
+      "eval_steps_per_second": 1.126,
+      "step": 104
+    },
+    {
+      "epoch": 3.0,
+      "grad_norm": 2.4190268516540527,
+      "learning_rate": 0.00028663593564638853,
+      "loss": 0.4714,
+      "step": 156
+    },
+    {
+      "epoch": 3.0,
+      "eval_accuracy": 0.7778864970645792,
+      "eval_f1": 0.8090832632464255,
+      "eval_loss": 0.4609759449958801,
+      "eval_precision": 0.7094395280235988,
+      "eval_recall": 0.9412915851272016,
+      "eval_runtime": 28.809,
+      "eval_samples_per_second": 35.475,
+      "eval_steps_per_second": 1.111,
+      "step": 156
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 364,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 7,
+  "save_steps": 500,
+  "total_flos": 707085591840.0,
+  "train_batch_size": 59,
+  "trial_name": null,
+  "trial_params": {
+    "alpha": 0.845201757467621,
+    "learning_rate": 0.00050161288738118,
+    "num_train_epochs": 7,
+    "per_device_train_batch_size": 59,
+    "temperature": 21
+  }
+}

run-27/checkpoint-156/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3427d367c6681566932cafa2f6b6a62ba9e8ebfdfa8d9ebafbc1230e1c415890
+size 4920

run-27/checkpoint-156/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-27/checkpoint-208/config.json ADDED Viewed

	@@ -0,0 +1,34 @@

+{
+  "_name_or_path": "google/bert_uncased_L-2_H-128_A-2",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 128,
+  "id2label": {
+    "0": "negative",
+    "1": "positive"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 512,
+  "label2id": {
+    "negative": "0",
+    "positive": "1"
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 2,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

run-27/checkpoint-208/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:102c93b829589eb1cac4ad524d714afd102e305c94b7f8dcd13e732020ab7405
+size 17549312

run-27/checkpoint-208/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:877d549bf031de1088c4cc2b02c3935790c955023333cbb7838afc0cc7f3eee4
+size 35122746

run-27/checkpoint-208/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8b6ed2075102dd75f9c18fe89ccd178319808314220b3c31c67cb30308a85909
+size 14054

run-27/checkpoint-208/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fcfad319aafebfc536f7ba6caa955cb14f7b60b3df258f75f6a9906cafa524a9
+size 1064

run-27/checkpoint-208/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-27/checkpoint-208/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-27/checkpoint-208/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,57 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_basic_tokenize": true,
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "never_split": null,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

run-27/checkpoint-208/trainer_state.json ADDED Viewed

	@@ -0,0 +1,103 @@

+{
+  "best_metric": 0.7945205479452054,
+  "best_model_checkpoint": "tiny-bert-sst2-distilled/run-27/checkpoint-208",
+  "epoch": 4.0,
+  "eval_steps": 500,
+  "global_step": 208,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "grad_norm": 3.795090675354004,
+      "learning_rate": 0.0004299539034695828,
+      "loss": 0.5539,
+      "step": 52
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.7397260273972602,
+      "eval_f1": 0.7779632721202002,
+      "eval_loss": 0.49282991886138916,
+      "eval_precision": 0.6783114992721979,
+      "eval_recall": 0.9119373776908023,
+      "eval_runtime": 28.2474,
+      "eval_samples_per_second": 36.18,
+      "eval_steps_per_second": 1.133,
+      "step": 52
+    },
+    {
+      "epoch": 2.0,
+      "grad_norm": 2.3241050243377686,
+      "learning_rate": 0.0003582949195579857,
+      "loss": 0.4958,
+      "step": 104
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.776908023483366,
+      "eval_f1": 0.8074324324324325,
+      "eval_loss": 0.4643081724643707,
+      "eval_precision": 0.7102526002971769,
+      "eval_recall": 0.9354207436399217,
+      "eval_runtime": 28.4313,
+      "eval_samples_per_second": 35.946,
+      "eval_steps_per_second": 1.126,
+      "step": 104
+    },
+    {
+      "epoch": 3.0,
+      "grad_norm": 2.4190268516540527,
+      "learning_rate": 0.00028663593564638853,
+      "loss": 0.4714,
+      "step": 156
+    },
+    {
+      "epoch": 3.0,
+      "eval_accuracy": 0.7778864970645792,
+      "eval_f1": 0.8090832632464255,
+      "eval_loss": 0.4609759449958801,
+      "eval_precision": 0.7094395280235988,
+      "eval_recall": 0.9412915851272016,
+      "eval_runtime": 28.809,
+      "eval_samples_per_second": 35.475,
+      "eval_steps_per_second": 1.111,
+      "step": 156
+    },
+    {
+      "epoch": 4.0,
+      "grad_norm": 3.24399471282959,
+      "learning_rate": 0.0002149769517347914,
+      "loss": 0.4531,
+      "step": 208
+    },
+    {
+      "epoch": 4.0,
+      "eval_accuracy": 0.7945205479452054,
+      "eval_f1": 0.8111510791366907,
+      "eval_loss": 0.4340381920337677,
+      "eval_precision": 0.7504159733777038,
+      "eval_recall": 0.8825831702544031,
+      "eval_runtime": 28.4651,
+      "eval_samples_per_second": 35.904,
+      "eval_steps_per_second": 1.124,
+      "step": 208
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 364,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 7,
+  "save_steps": 500,
+  "total_flos": 942780789120.0,
+  "train_batch_size": 59,
+  "trial_name": null,
+  "trial_params": {
+    "alpha": 0.845201757467621,
+    "learning_rate": 0.00050161288738118,
+    "num_train_epochs": 7,
+    "per_device_train_batch_size": 59,
+    "temperature": 21
+  }
+}

run-27/checkpoint-208/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3427d367c6681566932cafa2f6b6a62ba9e8ebfdfa8d9ebafbc1230e1c415890
+size 4920

run-27/checkpoint-208/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-30/checkpoint-56/config.json ADDED Viewed

	@@ -0,0 +1,34 @@

+{
+  "_name_or_path": "google/bert_uncased_L-2_H-128_A-2",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 128,
+  "id2label": {
+    "0": "negative",
+    "1": "positive"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 512,
+  "label2id": {
+    "negative": "0",
+    "positive": "1"
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 2,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

run-30/checkpoint-56/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8a5c00c89f0bb46b19d00bad6f9ed991aca6501b6a0a0e554e5e51f028f745e7
+size 17549312

run-30/checkpoint-56/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4b38df252558245bda6818cd03784ce17df77370b0a874894f92db1f03eb4980
+size 35122746

run-30/checkpoint-56/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:246901d84b3447ae67c6e9126b5bbf4473c08da78ffc08c216b42ebe7054b997
+size 14054

run-30/checkpoint-56/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4df513a35f06ea0da7e195eadb1eb84530e3e52b103421b6a7f034aaf26c0265
+size 1064

run-30/checkpoint-56/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-30/checkpoint-56/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-30/checkpoint-56/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,57 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_basic_tokenize": true,
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "never_split": null,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

run-30/checkpoint-56/trainer_state.json ADDED Viewed

	@@ -0,0 +1,46 @@

+{
+  "best_metric": 0.7847358121330724,
+  "best_model_checkpoint": "tiny-bert-sst2-distilled/run-30/checkpoint-56",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 56,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "grad_norm": 2.488581895828247,
+      "learning_rate": 0.00035374495201026426,
+      "loss": 0.5645,
+      "step": 56
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.7847358121330724,
+      "eval_f1": 0.8049645390070922,
+      "eval_loss": 0.4679928421974182,
+      "eval_precision": 0.7358184764991896,
+      "eval_recall": 0.8884540117416829,
+      "eval_runtime": 28.8427,
+      "eval_samples_per_second": 35.434,
+      "eval_steps_per_second": 1.109,
+      "step": 56
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 392,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 7,
+  "save_steps": 500,
+  "total_flos": 235695197280.0,
+  "train_batch_size": 55,
+  "trial_name": null,
+  "trial_params": {
+    "alpha": 0.9318712276013821,
+    "learning_rate": 0.000412702444011975,
+    "num_train_epochs": 7,
+    "per_device_train_batch_size": 55,
+    "temperature": 27
+  }
+}

run-30/checkpoint-56/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:87c31c0ff5ab5419b10c4b045c98d73f4009f0b63f2ceac81514144c885ecd65
+size 4920

run-30/checkpoint-56/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:89efecad9561cc854d69fd70f328f321f6dd5b5b818174094a406c3a368090ff
+oid sha256:87c31c0ff5ab5419b10c4b045c98d73f4009f0b63f2ceac81514144c885ecd65
 size 4920