Minata committed on
Commit
a52ed2c
·
1 Parent(s): ff65992

Training in progress, step 500

Browse files
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
config.json ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "uclanlp/plbart-large",
3
+ "activation_dropout": 0.0,
4
+ "activation_function": "gelu",
5
+ "architectures": [
6
+ "PLBartForConditionalGeneration"
7
+ ],
8
+ "attention_dropout": 0.1,
9
+ "bos_token_id": 0,
10
+ "classifier_dropout": 0.0,
11
+ "d_model": 1024,
12
+ "decoder_attention_heads": 16,
13
+ "decoder_ffn_dim": 4096,
14
+ "decoder_layerdrop": 0.0,
15
+ "decoder_layers": 12,
16
+ "dropout": 0.1,
17
+ "encoder_attention_heads": 16,
18
+ "encoder_ffn_dim": 4096,
19
+ "encoder_layerdrop": 0.0,
20
+ "encoder_layers": 12,
21
+ "eos_token_id": 2,
22
+ "forced_eos_token_id": 2,
23
+ "gradient_checkpointing": false,
24
+ "init_std": 0.02,
25
+ "is_encoder_decoder": true,
26
+ "max_position_embeddings": 1024,
27
+ "model_type": "plbart",
28
+ "num_hidden_layers": 12,
29
+ "pad_token_id": 1,
30
+ "scale_embedding": true,
31
+ "torch_dtype": "float32",
32
+ "transformers_version": "4.26.1",
33
+ "use_cache": true,
34
+ "vocab_size": 50005
35
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c544cf5aa2edd62d120b1c71af8539cc0138197260b3064aaadd1f24e07991a
3
+ size 1624475405
runs/Feb26_14-31-19_cbed3e0970a0/1677421894.0369194/events.out.tfevents.1677421894.cbed3e0970a0.5245.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:655bb0c81d1cd2419db4cfbb0ba749fd8adfa90ec89f9e7c2e896ab724cfd899
3
+ size 5957
runs/Feb26_14-31-19_cbed3e0970a0/events.out.tfevents.1677421894.cbed3e0970a0.5245.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab5d8d3ecc2f486f995eff7740469f37bbcc71872f5bc2908d03424740f48261
3
+ size 4237
runs/Feb26_14-34-06_cbed3e0970a0/1677422054.6514044/events.out.tfevents.1677422054.cbed3e0970a0.6949.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:292254fb3ad6fee59c3d3321e6a9f996d2da5aadc7162faa895380b60e2e0554
3
+ size 5957
runs/Feb26_14-34-06_cbed3e0970a0/events.out.tfevents.1677422054.cbed3e0970a0.6949.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8382b6914ec7b0818c633a4167ebc0987fbb1d251d7700c516b052c6ab232c52
3
+ size 6369
sentencepiece.bpe.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f72f5d040a176945623a255484d24066f8c0da89a294359154e226efbe494b80
3
+ size 985833
special_tokens_map.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "__java__",
4
+ "__python__",
5
+ "__en_XX__"
6
+ ],
7
+ "bos_token": "<s>",
8
+ "cls_token": "<s>",
9
+ "eos_token": "</s>",
10
+ "mask_token": {
11
+ "content": "<mask>",
12
+ "lstrip": true,
13
+ "normalized": true,
14
+ "rstrip": false,
15
+ "single_word": false
16
+ },
17
+ "pad_token": "<pad>",
18
+ "sep_token": "</s>",
19
+ "unk_token": "<unk>"
20
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": null,
3
+ "bos_token": "<s>",
4
+ "cls_token": "<s>",
5
+ "eos_token": "</s>",
6
+ "language_codes": "base",
7
+ "mask_token": {
8
+ "__type": "AddedToken",
9
+ "content": "<mask>",
10
+ "lstrip": true,
11
+ "normalized": true,
12
+ "rstrip": false,
13
+ "single_word": false
14
+ },
15
+ "model_max_length": 1024,
16
+ "name_or_path": "Minata/plbart-base-finetuned-ut-generator",
17
+ "pad_token": "<pad>",
18
+ "sep_token": "</s>",
19
+ "sp_model_kwargs": {},
20
+ "special_tokens_map_file": null,
21
+ "src_lang": null,
22
+ "tgt_lang": null,
23
+ "tokenizer_class": "PLBartTokenizer",
24
+ "unk_token": "<unk>"
25
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1251a72426143261c1d5a6a26e32c2e1b13173fda38739c6a38e6057b8c85566
3
+ size 3643