Upload tokenizer
Browse files- dna_vocab_list.txt +2 -1
- rna_vocab_list.txt +2 -1
dna_vocab_list.txt
CHANGED
@@ -30,4 +30,5 @@ O
|
|
30 |
.
|
31 |
-
|
32 |
<null_1>
|
33 |
-
<mask>
|
|
|
|
30 |
.
|
31 |
-
|
32 |
<null_1>
|
33 |
+
<mask>
|
34 |
+
<bos>
|
rna_vocab_list.txt
CHANGED
@@ -4103,4 +4103,5 @@ GGGGGG
|
|
4103 |
A
|
4104 |
U
|
4105 |
C
|
4106 |
-
G
|
|
|
|
4103 |
A
|
4104 |
U
|
4105 |
C
|
4106 |
+
G
|
4107 |
+
N
|