File size: 2,237 Bytes
1c9c7eb
594f96a
 
 
1c9c7eb
594f96a
1c9c7eb
594f96a
 
1c9c7eb
594f96a
 
1c9c7eb
594f96a
1c9c7eb
594f96a
 
1c9c7eb
594f96a
 
1c9c7eb
594f96a
1c9c7eb
594f96a
 
1c9c7eb
594f96a
 
1c9c7eb
594f96a
1c9c7eb
594f96a
 
1c9c7eb
594f96a
 
 
1c9c7eb
 
594f96a
 
1c9c7eb
594f96a
1c9c7eb
 
 
 
594f96a
 
1c9c7eb
594f96a
1c9c7eb
 
 
 
594f96a
 
1c9c7eb
594f96a
 
 
 
 
 
 
 
 
 
1c9c7eb
 
 
 
 
 
 
 
 
 
 
 
 
594f96a
 
1c9c7eb
 
 
 
 
 
 
594f96a
 
1c9c7eb
 
 
594f96a
1c9c7eb
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
{
  "added_tokens_decoder": {
    "0": {
      "content": "<s>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "1": {
      "content": "<pad>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "2": {
      "content": "</s>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "3": {
      "content": "<unk>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "32769": {
      "content": "<mask>",
      "lstrip": true,
      "normalized": true,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "32770": {
      "content": "<ent>",
      "lstrip": false,
      "normalized": true,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "32771": {
      "content": "<ent2>",
      "lstrip": false,
      "normalized": true,
      "rstrip": false,
      "single_word": false,
      "special": true
    }
  },
  "additional_special_tokens": [
    "<ent>",
    "<ent2>"
  ],
  "bos_token": "<s>",
  "clean_up_tokenization_spaces": true,
  "cls_token": "<s>",
  "entity_mask2_token": "[MASK2]",
  "entity_mask_token": "[MASK]",
  "entity_pad_token": "[PAD]",
  "entity_token_1": {
    "__type": "AddedToken",
    "content": "<ent>",
    "lstrip": false,
    "normalized": true,
    "rstrip": false,
    "single_word": false,
    "special": false
  },
  "entity_token_2": {
    "__type": "AddedToken",
    "content": "<ent2>",
    "lstrip": false,
    "normalized": true,
    "rstrip": false,
    "single_word": false,
    "special": false
  },
  "entity_unk_token": "[UNK]",
  "eos_token": "</s>",
  "mask_token": "<mask>",
  "max_entity_length": 32,
  "max_mention_length": 30,
  "model_max_length": 512,
  "pad_token": "<pad>",
  "sep_token": "</s>",
  "sp_model_kwargs": {},
  "task": null,
  "tokenizer_class": "MLukeTokenizer",
  "unk_token": "<unk>"
}