| { | |
| "special_token_str": { | |
| "bos": "<bos>", | |
| "eos": "<stop>", | |
| "pad": "<pad>", | |
| "unk": "<unk>" | |
| }, | |
| "vocab": { | |
| "<bos>": 2, | |
| "<pad>": 0, | |
| "<stop>": 3, | |
| "<unk>": 1, | |
| "AAA": 4, | |
| "AAC": 5, | |
| "AAG": 6, | |
| "AAT": 7, | |
| "ACA": 8, | |
| "ACC": 9, | |
| "ACG": 10, | |
| "ACT": 11, | |
| "AGA": 12, | |
| "AGC": 13, | |
| "AGG": 14, | |
| "AGT": 15, | |
| "ATA": 16, | |
| "ATC": 17, | |
| "ATG": 18, | |
| "ATT": 19, | |
| "CAA": 20, | |
| "CAC": 21, | |
| "CAG": 22, | |
| "CAT": 23, | |
| "CCA": 24, | |
| "CCC": 25, | |
| "CCG": 26, | |
| "CCT": 27, | |
| "CGA": 28, | |
| "CGC": 29, | |
| "CGG": 30, | |
| "CGT": 31, | |
| "CTA": 32, | |
| "CTC": 33, | |
| "CTG": 34, | |
| "CTT": 35, | |
| "GAA": 36, | |
| "GAC": 37, | |
| "GAG": 38, | |
| "GAT": 39, | |
| "GCA": 40, | |
| "GCC": 41, | |
| "GCG": 42, | |
| "GCT": 43, | |
| "GGA": 44, | |
| "GGC": 45, | |
| "GGG": 46, | |
| "GGT": 47, | |
| "GTA": 48, | |
| "GTC": 49, | |
| "GTG": 50, | |
| "GTT": 51, | |
| "TAA": 52, | |
| "TAC": 53, | |
| "TAG": 54, | |
| "TAT": 55, | |
| "TCA": 56, | |
| "TCC": 57, | |
| "TCG": 58, | |
| "TCT": 59, | |
| "TGA": 60, | |
| "TGC": 61, | |
| "TGG": 62, | |
| "TGT": 63, | |
| "TTA": 64, | |
| "TTC": 65, | |
| "TTG": 66, | |
| "TTT": 67 | |
| } | |
| } |