viahes committed on
Commit
586f8e8
·
verified ·
1 Parent(s): a4bb043

Upload folder using huggingface_hub

Browse files
added_tokens.json CHANGED
@@ -1,6 +1,4 @@
1
  {
2
- "<lang:ca>": 60002,
3
- "<lang:es>": 60003,
4
  "<mask>": 60000,
5
  "<text>": 60001
6
  }
 
1
  {
 
 
2
  "<mask>": 60000,
3
  "<text>": 60001
4
  }
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "./pre-nasca",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "architectures": [
@@ -42,8 +42,8 @@
42
  "pad_token_id": 0,
43
  "scale_embedding": false,
44
  "torch_dtype": "float32",
45
- "transformers_version": "4.27.4",
46
  "unk_token_id": 3,
47
  "use_cache": true,
48
- "vocab_size": 60004
49
  }
 
1
  {
2
+ "_name_or_path": "./NAS-bilingue",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "architectures": [
 
42
  "pad_token_id": 0,
43
  "scale_embedding": false,
44
  "torch_dtype": "float32",
45
+ "transformers_version": "4.26.1",
46
  "unk_token_id": 3,
47
  "use_cache": true,
48
+ "vocab_size": 60002
49
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9df303c733e557cd238216950c2f323fed37a202206277c807099d6026e1b433
3
- size 1661277005
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a31455ecbf8c898491f4668dc2b32fbe7f917b872651863d86ef4759dfdffeb5
3
+ size 1661268813
tokenizer.json CHANGED
@@ -1,7 +1,21 @@
1
  {
2
  "version": "1.0",
3
- "truncation": null,
4
- "padding": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  "added_tokens": [
6
  {
7
  "id": 0,
@@ -40,17 +54,17 @@
40
  "special": true
41
  },
42
  {
43
- "id": 60000,
44
- "content": "<mask>",
45
  "single_word": false,
46
- "lstrip": true,
47
  "rstrip": false,
48
- "normalized": true,
49
  "special": true
50
  },
51
  {
52
- "id": 60001,
53
- "content": "<text>",
54
  "single_word": false,
55
  "lstrip": false,
56
  "rstrip": false,
@@ -58,17 +72,17 @@
58
  "special": true
59
  },
60
  {
61
- "id": 60002,
62
- "content": "<lang:ca>",
63
  "single_word": false,
64
- "lstrip": false,
65
  "rstrip": false,
66
- "normalized": false,
67
  "special": true
68
  },
69
  {
70
- "id": 60003,
71
- "content": "<lang:es>",
72
  "single_word": false,
73
  "lstrip": false,
74
  "rstrip": false,
 
1
  {
2
  "version": "1.0",
3
+ "truncation": {
4
+ "direction": "Right",
5
+ "max_length": 512,
6
+ "strategy": "LongestFirst",
7
+ "stride": 0
8
+ },
9
+ "padding": {
10
+ "strategy": {
11
+ "Fixed": 512
12
+ },
13
+ "direction": "Right",
14
+ "pad_to_multiple_of": 8,
15
+ "pad_id": 0,
16
+ "pad_type_id": 0,
17
+ "pad_token": "<pad>"
18
+ },
19
  "added_tokens": [
20
  {
21
  "id": 0,
 
54
  "special": true
55
  },
56
  {
57
+ "id": 1633,
58
+ "content": "ES",
59
  "single_word": false,
60
+ "lstrip": false,
61
  "rstrip": false,
62
+ "normalized": false,
63
  "special": true
64
  },
65
  {
66
+ "id": 9559,
67
+ "content": "CA",
68
  "single_word": false,
69
  "lstrip": false,
70
  "rstrip": false,
 
72
  "special": true
73
  },
74
  {
75
+ "id": 60000,
76
+ "content": "<mask>",
77
  "single_word": false,
78
+ "lstrip": true,
79
  "rstrip": false,
80
+ "normalized": true,
81
  "special": true
82
  },
83
  {
84
+ "id": 60001,
85
+ "content": "<text>",
86
  "single_word": false,
87
  "lstrip": false,
88
  "rstrip": false,
tokenizer_config.json CHANGED
@@ -33,7 +33,8 @@
33
  "rstrip": false,
34
  "single_word": false
35
  },
36
- "model_max_length": 1000000000000000019884624838656,
 
37
  "pad_token": {
38
  "__type": "AddedToken",
39
  "content": "<pad>",
 
33
  "rstrip": false,
34
  "single_word": false
35
  },
36
+ "model_max_length": 512,
37
+ "name_or_path": "./NAS-bilingue",
38
  "pad_token": {
39
  "__type": "AddedToken",
40
  "content": "<pad>",
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81e3b61835cb9e885736d6b9d47f384fbb2e248cd8a93217b0f801e836862e29
3
+ size 3643