Commit
•
687c87b
1
Parent(s):
fa2ac91
Upload tokenizer
Browse files
- special_tokens_map.json +7 -0
- tokenizer_config.json +3 -0
- vocab.txt +26 -0
special_tokens_map.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"cls_token": "<cls>",
|
3 |
+
"eos_token": "<eos>",
|
4 |
+
"mask_token": "<mask>",
|
5 |
+
"pad_token": "A",
|
6 |
+
"unk_token": "<unk>"
|
7 |
+
}
|
tokenizer_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"tokenizer_class": "EsmTokenizer"
|
3 |
+
}
|
vocab.txt
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
A
|
2 |
+
R
|
3 |
+
N
|
4 |
+
D
|
5 |
+
C
|
6 |
+
Q
|
7 |
+
E
|
8 |
+
G
|
9 |
+
H
|
10 |
+
I
|
11 |
+
L
|
12 |
+
K
|
13 |
+
M
|
14 |
+
F
|
15 |
+
P
|
16 |
+
S
|
17 |
+
T
|
18 |
+
W
|
19 |
+
Y
|
20 |
+
V
|
21 |
+
X
|
22 |
+
<pad>
|
23 |
+
<mask>
|
24 |
+
<cls>
|
25 |
+
<sep>
|
26 |
+
<eos>
|