Commit
·
4ebf1d8
1
Parent(s):
8ced1bf
add tokenizer
Browse files- tokenizer.json +3 -3
- vocab.txt +1 -1
tokenizer.json
CHANGED
|
@@ -85,9 +85,9 @@
|
|
| 85 |
"G": 7,
|
| 86 |
"T": 8,
|
| 87 |
"##G": 9,
|
| 88 |
-
"##
|
| 89 |
-
"##
|
| 90 |
-
"##
|
| 91 |
"AA": 13,
|
| 92 |
"GA": 14,
|
| 93 |
"TT": 15,
|
|
|
|
| 85 |
"G": 7,
|
| 86 |
"T": 8,
|
| 87 |
"##G": 9,
|
| 88 |
+
"##A": 10,
|
| 89 |
+
"##C": 11,
|
| 90 |
+
"##T": 12,
|
| 91 |
"AA": 13,
|
| 92 |
"GA": 14,
|
| 93 |
"TT": 15,
|
vocab.txt
CHANGED
|
@@ -8,9 +8,9 @@ C
|
|
| 8 |
G
|
| 9 |
T
|
| 10 |
##G
|
|
|
|
| 11 |
##C
|
| 12 |
##T
|
| 13 |
-
##A
|
| 14 |
AA
|
| 15 |
GA
|
| 16 |
TT
|
|
|
|
| 8 |
G
|
| 9 |
T
|
| 10 |
##G
|
| 11 |
+
##A
|
| 12 |
##C
|
| 13 |
##T
|
|
|
|
| 14 |
AA
|
| 15 |
GA
|
| 16 |
TT
|