Commit
·
25e67aa
1
Parent(s):
53ebf5d
Initial commit of fine-tuned model
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- checkpoint-100/config.json +47 -0
- checkpoint-100/model.safetensors +3 -0
- checkpoint-100/optimizer.pt +3 -0
- checkpoint-100/rng_state.pth +3 -0
- checkpoint-100/scheduler.pt +3 -0
- checkpoint-100/special_tokens_map.json +7 -0
- checkpoint-100/tokenizer_config.json +64 -0
- checkpoint-100/trainer_state.json +32 -0
- checkpoint-100/training_args.bin +3 -0
- checkpoint-100/vocab.txt +0 -0
- checkpoint-1000/config.json +47 -0
- checkpoint-1000/model.safetensors +3 -0
- checkpoint-1000/optimizer.pt +3 -0
- checkpoint-1000/rng_state.pth +3 -0
- checkpoint-1000/scheduler.pt +3 -0
- checkpoint-1000/special_tokens_map.json +7 -0
- checkpoint-1000/tokenizer_config.json +64 -0
- checkpoint-1000/trainer_state.json +47 -0
- checkpoint-1000/training_args.bin +3 -0
- checkpoint-1000/vocab.txt +0 -0
- checkpoint-1200/config.json +47 -0
- checkpoint-1200/model.safetensors +3 -0
- checkpoint-1200/optimizer.pt +3 -0
- checkpoint-1200/rng_state.pth +3 -0
- checkpoint-1200/scheduler.pt +3 -0
- checkpoint-1200/special_tokens_map.json +7 -0
- checkpoint-1200/tokenizer_config.json +64 -0
- checkpoint-1200/trainer_state.json +47 -0
- checkpoint-1200/training_args.bin +3 -0
- checkpoint-1200/vocab.txt +0 -0
- checkpoint-500/config.json +47 -0
- checkpoint-500/model.safetensors +3 -0
- checkpoint-500/optimizer.pt +3 -0
- checkpoint-500/rng_state.pth +3 -0
- checkpoint-500/scheduler.pt +3 -0
- checkpoint-500/special_tokens_map.json +7 -0
- checkpoint-500/tokenizer_config.json +64 -0
- checkpoint-500/trainer_state.json +40 -0
- checkpoint-500/training_args.bin +3 -0
- checkpoint-500/vocab.txt +0 -0
- checkpoint-75/config.json +47 -0
- checkpoint-75/model.safetensors +3 -0
- checkpoint-75/optimizer.pt +3 -0
- checkpoint-75/rng_state.pth +3 -0
- checkpoint-75/scheduler.pt +3 -0
- checkpoint-75/special_tokens_map.json +7 -0
- checkpoint-75/tokenizer_config.json +64 -0
- checkpoint-75/trainer_state.json +32 -0
- checkpoint-75/training_args.bin +3 -0
- checkpoint-75/vocab.txt +0 -0
checkpoint-100/config.json
ADDED
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "tohoku-nlp/bert-base-japanese-v3",
|
3 |
+
"architectures": [
|
4 |
+
"BertForTokenClassification"
|
5 |
+
],
|
6 |
+
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"classifier_dropout": null,
|
8 |
+
"hidden_act": "gelu",
|
9 |
+
"hidden_dropout_prob": 0.1,
|
10 |
+
"hidden_size": 768,
|
11 |
+
"id2label": {
|
12 |
+
"0": "O",
|
13 |
+
"1": "B-POS",
|
14 |
+
"2": "I-POS",
|
15 |
+
"3": "B-PST",
|
16 |
+
"4": "I-PST",
|
17 |
+
"5": "B-NEG",
|
18 |
+
"6": "I-NEG",
|
19 |
+
"7": "B-NGT",
|
20 |
+
"8": "I-NGT"
|
21 |
+
},
|
22 |
+
"initializer_range": 0.02,
|
23 |
+
"intermediate_size": 3072,
|
24 |
+
"label2id": {
|
25 |
+
"B-NEG": 5,
|
26 |
+
"B-NGT": 7,
|
27 |
+
"B-POS": 1,
|
28 |
+
"B-PST": 3,
|
29 |
+
"I-NEG": 6,
|
30 |
+
"I-NGT": 8,
|
31 |
+
"I-POS": 2,
|
32 |
+
"I-PST": 4,
|
33 |
+
"O": 0
|
34 |
+
},
|
35 |
+
"layer_norm_eps": 1e-12,
|
36 |
+
"max_position_embeddings": 512,
|
37 |
+
"model_type": "bert",
|
38 |
+
"num_attention_heads": 12,
|
39 |
+
"num_hidden_layers": 12,
|
40 |
+
"pad_token_id": 0,
|
41 |
+
"position_embedding_type": "absolute",
|
42 |
+
"torch_dtype": "float32",
|
43 |
+
"transformers_version": "4.47.1",
|
44 |
+
"type_vocab_size": 2,
|
45 |
+
"use_cache": true,
|
46 |
+
"vocab_size": 32768
|
47 |
+
}
|
checkpoint-100/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ceb853309edc8d2a5034db0e99cb3b0e1d29fd5b4b6b6f31134175d0d3a64fb3
|
3 |
+
size 442517340
|
checkpoint-100/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6be533913e75ff7bd4e7fb6e3ad54af3038caefde8956f2b2130791e22335214
|
3 |
+
size 885154362
|
checkpoint-100/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ff8c58827d00a64816afe1f177dde7825b67d45deb2f884be0236869094cbf4
|
3 |
+
size 14244
|
checkpoint-100/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:beccfaf9bab963f178f24d893fd68585ea073339edab1cdcc5698c989a1dd81e
|
3 |
+
size 1064
|
checkpoint-100/special_tokens_map.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"cls_token": "[CLS]",
|
3 |
+
"mask_token": "[MASK]",
|
4 |
+
"pad_token": "[PAD]",
|
5 |
+
"sep_token": "[SEP]",
|
6 |
+
"unk_token": "[UNK]"
|
7 |
+
}
|
checkpoint-100/tokenizer_config.json
ADDED
@@ -0,0 +1,64 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"added_tokens_decoder": {
|
3 |
+
"0": {
|
4 |
+
"content": "[PAD]",
|
5 |
+
"lstrip": false,
|
6 |
+
"normalized": false,
|
7 |
+
"rstrip": false,
|
8 |
+
"single_word": false,
|
9 |
+
"special": true
|
10 |
+
},
|
11 |
+
"1": {
|
12 |
+
"content": "[UNK]",
|
13 |
+
"lstrip": false,
|
14 |
+
"normalized": false,
|
15 |
+
"rstrip": false,
|
16 |
+
"single_word": false,
|
17 |
+
"special": true
|
18 |
+
},
|
19 |
+
"2": {
|
20 |
+
"content": "[CLS]",
|
21 |
+
"lstrip": false,
|
22 |
+
"normalized": false,
|
23 |
+
"rstrip": false,
|
24 |
+
"single_word": false,
|
25 |
+
"special": true
|
26 |
+
},
|
27 |
+
"3": {
|
28 |
+
"content": "[SEP]",
|
29 |
+
"lstrip": false,
|
30 |
+
"normalized": false,
|
31 |
+
"rstrip": false,
|
32 |
+
"single_word": false,
|
33 |
+
"special": true
|
34 |
+
},
|
35 |
+
"4": {
|
36 |
+
"content": "[MASK]",
|
37 |
+
"lstrip": false,
|
38 |
+
"normalized": false,
|
39 |
+
"rstrip": false,
|
40 |
+
"single_word": false,
|
41 |
+
"special": true
|
42 |
+
}
|
43 |
+
},
|
44 |
+
"clean_up_tokenization_spaces": false,
|
45 |
+
"cls_token": "[CLS]",
|
46 |
+
"do_lower_case": false,
|
47 |
+
"do_subword_tokenize": true,
|
48 |
+
"do_word_tokenize": true,
|
49 |
+
"extra_special_tokens": {},
|
50 |
+
"jumanpp_kwargs": null,
|
51 |
+
"mask_token": "[MASK]",
|
52 |
+
"mecab_kwargs": {
|
53 |
+
"mecab_dic": "unidic_lite"
|
54 |
+
},
|
55 |
+
"model_max_length": 512,
|
56 |
+
"never_split": null,
|
57 |
+
"pad_token": "[PAD]",
|
58 |
+
"sep_token": "[SEP]",
|
59 |
+
"subword_tokenizer_type": "wordpiece",
|
60 |
+
"sudachi_kwargs": null,
|
61 |
+
"tokenizer_class": "BertJapaneseTokenizer",
|
62 |
+
"unk_token": "[UNK]",
|
63 |
+
"word_tokenizer_type": "mecab"
|
64 |
+
}
|
checkpoint-100/trainer_state.json
ADDED
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"best_metric": null,
|
3 |
+
"best_model_checkpoint": null,
|
4 |
+
"epoch": 4.0,
|
5 |
+
"eval_steps": 500,
|
6 |
+
"global_step": 100,
|
7 |
+
"is_hyper_param_search": false,
|
8 |
+
"is_local_process_zero": true,
|
9 |
+
"is_world_process_zero": true,
|
10 |
+
"log_history": [],
|
11 |
+
"logging_steps": 500,
|
12 |
+
"max_steps": 100,
|
13 |
+
"num_input_tokens_seen": 0,
|
14 |
+
"num_train_epochs": 4,
|
15 |
+
"save_steps": 500,
|
16 |
+
"stateful_callbacks": {
|
17 |
+
"TrainerControl": {
|
18 |
+
"args": {
|
19 |
+
"should_epoch_stop": false,
|
20 |
+
"should_evaluate": false,
|
21 |
+
"should_log": false,
|
22 |
+
"should_save": true,
|
23 |
+
"should_training_stop": true
|
24 |
+
},
|
25 |
+
"attributes": {}
|
26 |
+
}
|
27 |
+
},
|
28 |
+
"total_flos": 836202538598400.0,
|
29 |
+
"train_batch_size": 32,
|
30 |
+
"trial_name": null,
|
31 |
+
"trial_params": null
|
32 |
+
}
|
checkpoint-100/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e073bb423ca3c7a925f3b63620fc8c4cdeb162b5242b3d43a23a66e0e2ee732
|
3 |
+
size 5304
|
checkpoint-100/vocab.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
checkpoint-1000/config.json
ADDED
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "tohoku-nlp/bert-base-japanese-v3",
|
3 |
+
"architectures": [
|
4 |
+
"BertForTokenClassification"
|
5 |
+
],
|
6 |
+
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"classifier_dropout": null,
|
8 |
+
"hidden_act": "gelu",
|
9 |
+
"hidden_dropout_prob": 0.1,
|
10 |
+
"hidden_size": 768,
|
11 |
+
"id2label": {
|
12 |
+
"0": "O",
|
13 |
+
"1": "B-POS",
|
14 |
+
"2": "I-POS",
|
15 |
+
"3": "B-PST",
|
16 |
+
"4": "I-PST",
|
17 |
+
"5": "B-NEG",
|
18 |
+
"6": "I-NEG",
|
19 |
+
"7": "B-NGT",
|
20 |
+
"8": "I-NGT"
|
21 |
+
},
|
22 |
+
"initializer_range": 0.02,
|
23 |
+
"intermediate_size": 3072,
|
24 |
+
"label2id": {
|
25 |
+
"B-NEG": 5,
|
26 |
+
"B-NGT": 7,
|
27 |
+
"B-POS": 1,
|
28 |
+
"B-PST": 3,
|
29 |
+
"I-NEG": 6,
|
30 |
+
"I-NGT": 8,
|
31 |
+
"I-POS": 2,
|
32 |
+
"I-PST": 4,
|
33 |
+
"O": 0
|
34 |
+
},
|
35 |
+
"layer_norm_eps": 1e-12,
|
36 |
+
"max_position_embeddings": 512,
|
37 |
+
"model_type": "bert",
|
38 |
+
"num_attention_heads": 12,
|
39 |
+
"num_hidden_layers": 12,
|
40 |
+
"pad_token_id": 0,
|
41 |
+
"position_embedding_type": "absolute",
|
42 |
+
"torch_dtype": "float32",
|
43 |
+
"transformers_version": "4.47.1",
|
44 |
+
"type_vocab_size": 2,
|
45 |
+
"use_cache": true,
|
46 |
+
"vocab_size": 32768
|
47 |
+
}
|
checkpoint-1000/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b25847c52a4cb35f2dc3c63e151af4ea40a0593611ca8a203b467ec3fc06c80e
|
3 |
+
size 442517340
|
checkpoint-1000/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04624bbc71e6cdd276c0864ce270174bff8a5c09d48060b30b37c55eb8f4480a
|
3 |
+
size 885154362
|
checkpoint-1000/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f8e61c6e4521371c10c309f0301e6714e45aaf2365669ddc0f5c50abb6680c1
|
3 |
+
size 14244
|
checkpoint-1000/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09e1d146fa1811b6149157f0b84ed5e54fe5e0faf5ad56a1bbda57354ab4f6a8
|
3 |
+
size 1064
|
checkpoint-1000/special_tokens_map.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"cls_token": "[CLS]",
|
3 |
+
"mask_token": "[MASK]",
|
4 |
+
"pad_token": "[PAD]",
|
5 |
+
"sep_token": "[SEP]",
|
6 |
+
"unk_token": "[UNK]"
|
7 |
+
}
|
checkpoint-1000/tokenizer_config.json
ADDED
@@ -0,0 +1,64 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"added_tokens_decoder": {
|
3 |
+
"0": {
|
4 |
+
"content": "[PAD]",
|
5 |
+
"lstrip": false,
|
6 |
+
"normalized": false,
|
7 |
+
"rstrip": false,
|
8 |
+
"single_word": false,
|
9 |
+
"special": true
|
10 |
+
},
|
11 |
+
"1": {
|
12 |
+
"content": "[UNK]",
|
13 |
+
"lstrip": false,
|
14 |
+
"normalized": false,
|
15 |
+
"rstrip": false,
|
16 |
+
"single_word": false,
|
17 |
+
"special": true
|
18 |
+
},
|
19 |
+
"2": {
|
20 |
+
"content": "[CLS]",
|
21 |
+
"lstrip": false,
|
22 |
+
"normalized": false,
|
23 |
+
"rstrip": false,
|
24 |
+
"single_word": false,
|
25 |
+
"special": true
|
26 |
+
},
|
27 |
+
"3": {
|
28 |
+
"content": "[SEP]",
|
29 |
+
"lstrip": false,
|
30 |
+
"normalized": false,
|
31 |
+
"rstrip": false,
|
32 |
+
"single_word": false,
|
33 |
+
"special": true
|
34 |
+
},
|
35 |
+
"4": {
|
36 |
+
"content": "[MASK]",
|
37 |
+
"lstrip": false,
|
38 |
+
"normalized": false,
|
39 |
+
"rstrip": false,
|
40 |
+
"single_word": false,
|
41 |
+
"special": true
|
42 |
+
}
|
43 |
+
},
|
44 |
+
"clean_up_tokenization_spaces": false,
|
45 |
+
"cls_token": "[CLS]",
|
46 |
+
"do_lower_case": false,
|
47 |
+
"do_subword_tokenize": true,
|
48 |
+
"do_word_tokenize": true,
|
49 |
+
"extra_special_tokens": {},
|
50 |
+
"jumanpp_kwargs": null,
|
51 |
+
"mask_token": "[MASK]",
|
52 |
+
"mecab_kwargs": {
|
53 |
+
"mecab_dic": "unidic_lite"
|
54 |
+
},
|
55 |
+
"model_max_length": 512,
|
56 |
+
"never_split": null,
|
57 |
+
"pad_token": "[PAD]",
|
58 |
+
"sep_token": "[SEP]",
|
59 |
+
"subword_tokenizer_type": "wordpiece",
|
60 |
+
"sudachi_kwargs": null,
|
61 |
+
"tokenizer_class": "BertJapaneseTokenizer",
|
62 |
+
"unk_token": "[UNK]",
|
63 |
+
"word_tokenizer_type": "mecab"
|
64 |
+
}
|
checkpoint-1000/trainer_state.json
ADDED
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"best_metric": null,
|
3 |
+
"best_model_checkpoint": null,
|
4 |
+
"epoch": 2.5,
|
5 |
+
"eval_steps": 500,
|
6 |
+
"global_step": 1000,
|
7 |
+
"is_hyper_param_search": false,
|
8 |
+
"is_local_process_zero": true,
|
9 |
+
"is_world_process_zero": true,
|
10 |
+
"log_history": [
|
11 |
+
{
|
12 |
+
"epoch": 1.25,
|
13 |
+
"grad_norm": 0.5698992013931274,
|
14 |
+
"learning_rate": 1.2173913043478263e-05,
|
15 |
+
"loss": 0.2027,
|
16 |
+
"step": 500
|
17 |
+
},
|
18 |
+
{
|
19 |
+
"epoch": 2.5,
|
20 |
+
"grad_norm": 0.8053608536720276,
|
21 |
+
"learning_rate": 3.4782608695652175e-06,
|
22 |
+
"loss": 0.0731,
|
23 |
+
"step": 1000
|
24 |
+
}
|
25 |
+
],
|
26 |
+
"logging_steps": 500,
|
27 |
+
"max_steps": 1200,
|
28 |
+
"num_input_tokens_seen": 0,
|
29 |
+
"num_train_epochs": 3,
|
30 |
+
"save_steps": 500,
|
31 |
+
"stateful_callbacks": {
|
32 |
+
"TrainerControl": {
|
33 |
+
"args": {
|
34 |
+
"should_epoch_stop": false,
|
35 |
+
"should_evaluate": false,
|
36 |
+
"should_log": false,
|
37 |
+
"should_save": true,
|
38 |
+
"should_training_stop": false
|
39 |
+
},
|
40 |
+
"attributes": {}
|
41 |
+
}
|
42 |
+
},
|
43 |
+
"total_flos": 522626586624000.0,
|
44 |
+
"train_batch_size": 2,
|
45 |
+
"trial_name": null,
|
46 |
+
"trial_params": null
|
47 |
+
}
|
checkpoint-1000/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2a4ed7e5bedd6b0e0497f3bd37c67423068705a56fe53584376220f5215e05e
|
3 |
+
size 5304
|
checkpoint-1000/vocab.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
checkpoint-1200/config.json
ADDED
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "tohoku-nlp/bert-base-japanese-v3",
|
3 |
+
"architectures": [
|
4 |
+
"BertForTokenClassification"
|
5 |
+
],
|
6 |
+
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"classifier_dropout": null,
|
8 |
+
"hidden_act": "gelu",
|
9 |
+
"hidden_dropout_prob": 0.1,
|
10 |
+
"hidden_size": 768,
|
11 |
+
"id2label": {
|
12 |
+
"0": "O",
|
13 |
+
"1": "B-POS",
|
14 |
+
"2": "I-POS",
|
15 |
+
"3": "B-PST",
|
16 |
+
"4": "I-PST",
|
17 |
+
"5": "B-NEG",
|
18 |
+
"6": "I-NEG",
|
19 |
+
"7": "B-NGT",
|
20 |
+
"8": "I-NGT"
|
21 |
+
},
|
22 |
+
"initializer_range": 0.02,
|
23 |
+
"intermediate_size": 3072,
|
24 |
+
"label2id": {
|
25 |
+
"B-NEG": 5,
|
26 |
+
"B-NGT": 7,
|
27 |
+
"B-POS": 1,
|
28 |
+
"B-PST": 3,
|
29 |
+
"I-NEG": 6,
|
30 |
+
"I-NGT": 8,
|
31 |
+
"I-POS": 2,
|
32 |
+
"I-PST": 4,
|
33 |
+
"O": 0
|
34 |
+
},
|
35 |
+
"layer_norm_eps": 1e-12,
|
36 |
+
"max_position_embeddings": 512,
|
37 |
+
"model_type": "bert",
|
38 |
+
"num_attention_heads": 12,
|
39 |
+
"num_hidden_layers": 12,
|
40 |
+
"pad_token_id": 0,
|
41 |
+
"position_embedding_type": "absolute",
|
42 |
+
"torch_dtype": "float32",
|
43 |
+
"transformers_version": "4.47.1",
|
44 |
+
"type_vocab_size": 2,
|
45 |
+
"use_cache": true,
|
46 |
+
"vocab_size": 32768
|
47 |
+
}
|
checkpoint-1200/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0929aa6b57c343e3d27531d8b0b8cec4455d5901ea451dd3bd456884541a257
|
3 |
+
size 442517340
|
checkpoint-1200/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5e5adaa48dea5e747d924a18a13d2109766b113712bf10df5f9fa68fc2272a0
|
3 |
+
size 885154362
|
checkpoint-1200/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ff3b215993bb305f3da021b49a5969a508fd46447812b7c80a2cf22ad32af4d
|
3 |
+
size 14244
|
checkpoint-1200/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6dbcd8bb7627ff20a690e1dcef58b9babd947ff44c1ea4785784740fa416a427
|
3 |
+
size 1064
|
checkpoint-1200/special_tokens_map.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"cls_token": "[CLS]",
|
3 |
+
"mask_token": "[MASK]",
|
4 |
+
"pad_token": "[PAD]",
|
5 |
+
"sep_token": "[SEP]",
|
6 |
+
"unk_token": "[UNK]"
|
7 |
+
}
|
checkpoint-1200/tokenizer_config.json
ADDED
@@ -0,0 +1,64 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"added_tokens_decoder": {
|
3 |
+
"0": {
|
4 |
+
"content": "[PAD]",
|
5 |
+
"lstrip": false,
|
6 |
+
"normalized": false,
|
7 |
+
"rstrip": false,
|
8 |
+
"single_word": false,
|
9 |
+
"special": true
|
10 |
+
},
|
11 |
+
"1": {
|
12 |
+
"content": "[UNK]",
|
13 |
+
"lstrip": false,
|
14 |
+
"normalized": false,
|
15 |
+
"rstrip": false,
|
16 |
+
"single_word": false,
|
17 |
+
"special": true
|
18 |
+
},
|
19 |
+
"2": {
|
20 |
+
"content": "[CLS]",
|
21 |
+
"lstrip": false,
|
22 |
+
"normalized": false,
|
23 |
+
"rstrip": false,
|
24 |
+
"single_word": false,
|
25 |
+
"special": true
|
26 |
+
},
|
27 |
+
"3": {
|
28 |
+
"content": "[SEP]",
|
29 |
+
"lstrip": false,
|
30 |
+
"normalized": false,
|
31 |
+
"rstrip": false,
|
32 |
+
"single_word": false,
|
33 |
+
"special": true
|
34 |
+
},
|
35 |
+
"4": {
|
36 |
+
"content": "[MASK]",
|
37 |
+
"lstrip": false,
|
38 |
+
"normalized": false,
|
39 |
+
"rstrip": false,
|
40 |
+
"single_word": false,
|
41 |
+
"special": true
|
42 |
+
}
|
43 |
+
},
|
44 |
+
"clean_up_tokenization_spaces": false,
|
45 |
+
"cls_token": "[CLS]",
|
46 |
+
"do_lower_case": false,
|
47 |
+
"do_subword_tokenize": true,
|
48 |
+
"do_word_tokenize": true,
|
49 |
+
"extra_special_tokens": {},
|
50 |
+
"jumanpp_kwargs": null,
|
51 |
+
"mask_token": "[MASK]",
|
52 |
+
"mecab_kwargs": {
|
53 |
+
"mecab_dic": "unidic_lite"
|
54 |
+
},
|
55 |
+
"model_max_length": 512,
|
56 |
+
"never_split": null,
|
57 |
+
"pad_token": "[PAD]",
|
58 |
+
"sep_token": "[SEP]",
|
59 |
+
"subword_tokenizer_type": "wordpiece",
|
60 |
+
"sudachi_kwargs": null,
|
61 |
+
"tokenizer_class": "BertJapaneseTokenizer",
|
62 |
+
"unk_token": "[UNK]",
|
63 |
+
"word_tokenizer_type": "mecab"
|
64 |
+
}
|
checkpoint-1200/trainer_state.json
ADDED
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"best_metric": null,
|
3 |
+
"best_model_checkpoint": null,
|
4 |
+
"epoch": 3.0,
|
5 |
+
"eval_steps": 500,
|
6 |
+
"global_step": 1200,
|
7 |
+
"is_hyper_param_search": false,
|
8 |
+
"is_local_process_zero": true,
|
9 |
+
"is_world_process_zero": true,
|
10 |
+
"log_history": [
|
11 |
+
{
|
12 |
+
"epoch": 1.25,
|
13 |
+
"grad_norm": 0.5698992013931274,
|
14 |
+
"learning_rate": 1.2173913043478263e-05,
|
15 |
+
"loss": 0.2027,
|
16 |
+
"step": 500
|
17 |
+
},
|
18 |
+
{
|
19 |
+
"epoch": 2.5,
|
20 |
+
"grad_norm": 0.8053608536720276,
|
21 |
+
"learning_rate": 3.4782608695652175e-06,
|
22 |
+
"loss": 0.0731,
|
23 |
+
"step": 1000
|
24 |
+
}
|
25 |
+
],
|
26 |
+
"logging_steps": 500,
|
27 |
+
"max_steps": 1200,
|
28 |
+
"num_input_tokens_seen": 0,
|
29 |
+
"num_train_epochs": 3,
|
30 |
+
"save_steps": 500,
|
31 |
+
"stateful_callbacks": {
|
32 |
+
"TrainerControl": {
|
33 |
+
"args": {
|
34 |
+
"should_epoch_stop": false,
|
35 |
+
"should_evaluate": false,
|
36 |
+
"should_log": false,
|
37 |
+
"should_save": true,
|
38 |
+
"should_training_stop": true
|
39 |
+
},
|
40 |
+
"attributes": {}
|
41 |
+
}
|
42 |
+
},
|
43 |
+
"total_flos": 627151903948800.0,
|
44 |
+
"train_batch_size": 2,
|
45 |
+
"trial_name": null,
|
46 |
+
"trial_params": null
|
47 |
+
}
|
checkpoint-1200/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2a4ed7e5bedd6b0e0497f3bd37c67423068705a56fe53584376220f5215e05e
|
3 |
+
size 5304
|
checkpoint-1200/vocab.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
checkpoint-500/config.json
ADDED
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "tohoku-nlp/bert-base-japanese-v3",
|
3 |
+
"architectures": [
|
4 |
+
"BertForTokenClassification"
|
5 |
+
],
|
6 |
+
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"classifier_dropout": null,
|
8 |
+
"hidden_act": "gelu",
|
9 |
+
"hidden_dropout_prob": 0.1,
|
10 |
+
"hidden_size": 768,
|
11 |
+
"id2label": {
|
12 |
+
"0": "O",
|
13 |
+
"1": "B-POS",
|
14 |
+
"2": "I-POS",
|
15 |
+
"3": "B-PST",
|
16 |
+
"4": "I-PST",
|
17 |
+
"5": "B-NEG",
|
18 |
+
"6": "I-NEG",
|
19 |
+
"7": "B-NGT",
|
20 |
+
"8": "I-NGT"
|
21 |
+
},
|
22 |
+
"initializer_range": 0.02,
|
23 |
+
"intermediate_size": 3072,
|
24 |
+
"label2id": {
|
25 |
+
"B-NEG": 5,
|
26 |
+
"B-NGT": 7,
|
27 |
+
"B-POS": 1,
|
28 |
+
"B-PST": 3,
|
29 |
+
"I-NEG": 6,
|
30 |
+
"I-NGT": 8,
|
31 |
+
"I-POS": 2,
|
32 |
+
"I-PST": 4,
|
33 |
+
"O": 0
|
34 |
+
},
|
35 |
+
"layer_norm_eps": 1e-12,
|
36 |
+
"max_position_embeddings": 512,
|
37 |
+
"model_type": "bert",
|
38 |
+
"num_attention_heads": 12,
|
39 |
+
"num_hidden_layers": 12,
|
40 |
+
"pad_token_id": 0,
|
41 |
+
"position_embedding_type": "absolute",
|
42 |
+
"torch_dtype": "float32",
|
43 |
+
"transformers_version": "4.47.1",
|
44 |
+
"type_vocab_size": 2,
|
45 |
+
"use_cache": true,
|
46 |
+
"vocab_size": 32768
|
47 |
+
}
|
checkpoint-500/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3eea84a49bc17b78494dde70428a80ef7ebe516cd7eb79ae3d68e0c25580188
|
3 |
+
size 442517340
|
checkpoint-500/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d683cddd426a28fd74dc231df42d530f73233d44c756d3f0e6442e804cdb592
|
3 |
+
size 885154362
|
checkpoint-500/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bfe7e28914cf1759ae2d075a723f32809a485ad4b118cdc1ba3bf4f411ff3492
|
3 |
+
size 14244
|
checkpoint-500/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96aac63cbafeabe90e455718b58c392b5a1771a750af6acf49d636d38e47e57a
|
3 |
+
size 1064
|
checkpoint-500/special_tokens_map.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"cls_token": "[CLS]",
|
3 |
+
"mask_token": "[MASK]",
|
4 |
+
"pad_token": "[PAD]",
|
5 |
+
"sep_token": "[SEP]",
|
6 |
+
"unk_token": "[UNK]"
|
7 |
+
}
|
checkpoint-500/tokenizer_config.json
ADDED
@@ -0,0 +1,64 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"added_tokens_decoder": {
|
3 |
+
"0": {
|
4 |
+
"content": "[PAD]",
|
5 |
+
"lstrip": false,
|
6 |
+
"normalized": false,
|
7 |
+
"rstrip": false,
|
8 |
+
"single_word": false,
|
9 |
+
"special": true
|
10 |
+
},
|
11 |
+
"1": {
|
12 |
+
"content": "[UNK]",
|
13 |
+
"lstrip": false,
|
14 |
+
"normalized": false,
|
15 |
+
"rstrip": false,
|
16 |
+
"single_word": false,
|
17 |
+
"special": true
|
18 |
+
},
|
19 |
+
"2": {
|
20 |
+
"content": "[CLS]",
|
21 |
+
"lstrip": false,
|
22 |
+
"normalized": false,
|
23 |
+
"rstrip": false,
|
24 |
+
"single_word": false,
|
25 |
+
"special": true
|
26 |
+
},
|
27 |
+
"3": {
|
28 |
+
"content": "[SEP]",
|
29 |
+
"lstrip": false,
|
30 |
+
"normalized": false,
|
31 |
+
"rstrip": false,
|
32 |
+
"single_word": false,
|
33 |
+
"special": true
|
34 |
+
},
|
35 |
+
"4": {
|
36 |
+
"content": "[MASK]",
|
37 |
+
"lstrip": false,
|
38 |
+
"normalized": false,
|
39 |
+
"rstrip": false,
|
40 |
+
"single_word": false,
|
41 |
+
"special": true
|
42 |
+
}
|
43 |
+
},
|
44 |
+
"clean_up_tokenization_spaces": false,
|
45 |
+
"cls_token": "[CLS]",
|
46 |
+
"do_lower_case": false,
|
47 |
+
"do_subword_tokenize": true,
|
48 |
+
"do_word_tokenize": true,
|
49 |
+
"extra_special_tokens": {},
|
50 |
+
"jumanpp_kwargs": null,
|
51 |
+
"mask_token": "[MASK]",
|
52 |
+
"mecab_kwargs": {
|
53 |
+
"mecab_dic": "unidic_lite"
|
54 |
+
},
|
55 |
+
"model_max_length": 512,
|
56 |
+
"never_split": null,
|
57 |
+
"pad_token": "[PAD]",
|
58 |
+
"sep_token": "[SEP]",
|
59 |
+
"subword_tokenizer_type": "wordpiece",
|
60 |
+
"sudachi_kwargs": null,
|
61 |
+
"tokenizer_class": "BertJapaneseTokenizer",
|
62 |
+
"unk_token": "[UNK]",
|
63 |
+
"word_tokenizer_type": "mecab"
|
64 |
+
}
|
checkpoint-500/trainer_state.json
ADDED
@@ -0,0 +1,40 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"best_metric": null,
|
3 |
+
"best_model_checkpoint": null,
|
4 |
+
"epoch": 1.25,
|
5 |
+
"eval_steps": 500,
|
6 |
+
"global_step": 500,
|
7 |
+
"is_hyper_param_search": false,
|
8 |
+
"is_local_process_zero": true,
|
9 |
+
"is_world_process_zero": true,
|
10 |
+
"log_history": [
|
11 |
+
{
|
12 |
+
"epoch": 1.25,
|
13 |
+
"grad_norm": 0.5698992013931274,
|
14 |
+
"learning_rate": 1.2173913043478263e-05,
|
15 |
+
"loss": 0.2027,
|
16 |
+
"step": 500
|
17 |
+
}
|
18 |
+
],
|
19 |
+
"logging_steps": 500,
|
20 |
+
"max_steps": 1200,
|
21 |
+
"num_input_tokens_seen": 0,
|
22 |
+
"num_train_epochs": 3,
|
23 |
+
"save_steps": 500,
|
24 |
+
"stateful_callbacks": {
|
25 |
+
"TrainerControl": {
|
26 |
+
"args": {
|
27 |
+
"should_epoch_stop": false,
|
28 |
+
"should_evaluate": false,
|
29 |
+
"should_log": false,
|
30 |
+
"should_save": true,
|
31 |
+
"should_training_stop": false
|
32 |
+
},
|
33 |
+
"attributes": {}
|
34 |
+
}
|
35 |
+
},
|
36 |
+
"total_flos": 261313293312000.0,
|
37 |
+
"train_batch_size": 2,
|
38 |
+
"trial_name": null,
|
39 |
+
"trial_params": null
|
40 |
+
}
|
checkpoint-500/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2a4ed7e5bedd6b0e0497f3bd37c67423068705a56fe53584376220f5215e05e
|
3 |
+
size 5304
|
checkpoint-500/vocab.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
checkpoint-75/config.json
ADDED
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "tohoku-nlp/bert-base-japanese-v3",
|
3 |
+
"architectures": [
|
4 |
+
"BertForTokenClassification"
|
5 |
+
],
|
6 |
+
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"classifier_dropout": null,
|
8 |
+
"hidden_act": "gelu",
|
9 |
+
"hidden_dropout_prob": 0.1,
|
10 |
+
"hidden_size": 768,
|
11 |
+
"id2label": {
|
12 |
+
"0": "O",
|
13 |
+
"1": "B-POS",
|
14 |
+
"2": "I-POS",
|
15 |
+
"3": "B-PST",
|
16 |
+
"4": "I-PST",
|
17 |
+
"5": "B-NEG",
|
18 |
+
"6": "I-NEG",
|
19 |
+
"7": "B-NGT",
|
20 |
+
"8": "I-NGT"
|
21 |
+
},
|
22 |
+
"initializer_range": 0.02,
|
23 |
+
"intermediate_size": 3072,
|
24 |
+
"label2id": {
|
25 |
+
"B-NEG": 5,
|
26 |
+
"B-NGT": 7,
|
27 |
+
"B-POS": 1,
|
28 |
+
"B-PST": 3,
|
29 |
+
"I-NEG": 6,
|
30 |
+
"I-NGT": 8,
|
31 |
+
"I-POS": 2,
|
32 |
+
"I-PST": 4,
|
33 |
+
"O": 0
|
34 |
+
},
|
35 |
+
"layer_norm_eps": 1e-12,
|
36 |
+
"max_position_embeddings": 512,
|
37 |
+
"model_type": "bert",
|
38 |
+
"num_attention_heads": 12,
|
39 |
+
"num_hidden_layers": 12,
|
40 |
+
"pad_token_id": 0,
|
41 |
+
"position_embedding_type": "absolute",
|
42 |
+
"torch_dtype": "float32",
|
43 |
+
"transformers_version": "4.47.1",
|
44 |
+
"type_vocab_size": 2,
|
45 |
+
"use_cache": true,
|
46 |
+
"vocab_size": 32768
|
47 |
+
}
|
checkpoint-75/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99bec2f7f62f01913e8b1871c0ab247e83d9c8bd23ef355c2772cd820d053aee
|
3 |
+
size 442517340
|
checkpoint-75/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1ffeab4b02dbe1c162d2c586bc73d16b35c19be723831004461af869d37d9c3
|
3 |
+
size 885154362
|
checkpoint-75/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b6180bc217820e01c9ec907369a5c79179f9ead5fb8e05fbaecd18bec0a9a74b
|
3 |
+
size 14244
|
checkpoint-75/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f6003820aa1d9b0e6aa1d70309948568223b16abb8759408bc4ed8976518161
|
3 |
+
size 1064
|
checkpoint-75/special_tokens_map.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"cls_token": "[CLS]",
|
3 |
+
"mask_token": "[MASK]",
|
4 |
+
"pad_token": "[PAD]",
|
5 |
+
"sep_token": "[SEP]",
|
6 |
+
"unk_token": "[UNK]"
|
7 |
+
}
|
checkpoint-75/tokenizer_config.json
ADDED
@@ -0,0 +1,64 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"added_tokens_decoder": {
|
3 |
+
"0": {
|
4 |
+
"content": "[PAD]",
|
5 |
+
"lstrip": false,
|
6 |
+
"normalized": false,
|
7 |
+
"rstrip": false,
|
8 |
+
"single_word": false,
|
9 |
+
"special": true
|
10 |
+
},
|
11 |
+
"1": {
|
12 |
+
"content": "[UNK]",
|
13 |
+
"lstrip": false,
|
14 |
+
"normalized": false,
|
15 |
+
"rstrip": false,
|
16 |
+
"single_word": false,
|
17 |
+
"special": true
|
18 |
+
},
|
19 |
+
"2": {
|
20 |
+
"content": "[CLS]",
|
21 |
+
"lstrip": false,
|
22 |
+
"normalized": false,
|
23 |
+
"rstrip": false,
|
24 |
+
"single_word": false,
|
25 |
+
"special": true
|
26 |
+
},
|
27 |
+
"3": {
|
28 |
+
"content": "[SEP]",
|
29 |
+
"lstrip": false,
|
30 |
+
"normalized": false,
|
31 |
+
"rstrip": false,
|
32 |
+
"single_word": false,
|
33 |
+
"special": true
|
34 |
+
},
|
35 |
+
"4": {
|
36 |
+
"content": "[MASK]",
|
37 |
+
"lstrip": false,
|
38 |
+
"normalized": false,
|
39 |
+
"rstrip": false,
|
40 |
+
"single_word": false,
|
41 |
+
"special": true
|
42 |
+
}
|
43 |
+
},
|
44 |
+
"clean_up_tokenization_spaces": false,
|
45 |
+
"cls_token": "[CLS]",
|
46 |
+
"do_lower_case": false,
|
47 |
+
"do_subword_tokenize": true,
|
48 |
+
"do_word_tokenize": true,
|
49 |
+
"extra_special_tokens": {},
|
50 |
+
"jumanpp_kwargs": null,
|
51 |
+
"mask_token": "[MASK]",
|
52 |
+
"mecab_kwargs": {
|
53 |
+
"mecab_dic": "unidic_lite"
|
54 |
+
},
|
55 |
+
"model_max_length": 512,
|
56 |
+
"never_split": null,
|
57 |
+
"pad_token": "[PAD]",
|
58 |
+
"sep_token": "[SEP]",
|
59 |
+
"subword_tokenizer_type": "wordpiece",
|
60 |
+
"sudachi_kwargs": null,
|
61 |
+
"tokenizer_class": "BertJapaneseTokenizer",
|
62 |
+
"unk_token": "[UNK]",
|
63 |
+
"word_tokenizer_type": "mecab"
|
64 |
+
}
|
checkpoint-75/trainer_state.json
ADDED
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"best_metric": null,
|
3 |
+
"best_model_checkpoint": null,
|
4 |
+
"epoch": 3.0,
|
5 |
+
"eval_steps": 500,
|
6 |
+
"global_step": 75,
|
7 |
+
"is_hyper_param_search": false,
|
8 |
+
"is_local_process_zero": true,
|
9 |
+
"is_world_process_zero": true,
|
10 |
+
"log_history": [],
|
11 |
+
"logging_steps": 500,
|
12 |
+
"max_steps": 75,
|
13 |
+
"num_input_tokens_seen": 0,
|
14 |
+
"num_train_epochs": 3,
|
15 |
+
"save_steps": 500,
|
16 |
+
"stateful_callbacks": {
|
17 |
+
"TrainerControl": {
|
18 |
+
"args": {
|
19 |
+
"should_epoch_stop": false,
|
20 |
+
"should_evaluate": false,
|
21 |
+
"should_log": false,
|
22 |
+
"should_save": true,
|
23 |
+
"should_training_stop": true
|
24 |
+
},
|
25 |
+
"attributes": {}
|
26 |
+
}
|
27 |
+
},
|
28 |
+
"total_flos": 627151903948800.0,
|
29 |
+
"train_batch_size": 32,
|
30 |
+
"trial_name": null,
|
31 |
+
"trial_params": null
|
32 |
+
}
|
checkpoint-75/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:636218e449c6c1b6590a5a29c69568a90f5a537e70e0dc34506869cc17649bb2
|
3 |
+
size 5304
|
checkpoint-75/vocab.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|