Delete Instadeep_NT_500M_CPT

#2
Instadeep_NT_500M_CPT/100k_testing_AUC.ipynb DELETED
@@ -1,106 +0,0 @@
1
- {
2
- "cells": [
3
- {
4
- "cell_type": "code",
5
- "execution_count": 26,
6
- "metadata": {},
7
- "outputs": [
8
- {
9
- "name": "stdout",
10
- "output_type": "stream",
11
- "text": [
12
- "\n",
13
- "========================================================================\n",
14
- "🏆 PATHOGENICITY LEADERBOARD — Bottom 100k ClinVar\n",
15
- "========================================================================\n",
16
- "Model | ROC-AUC | PR-AUC \n",
17
- "------------------------------------------------------------------------\n",
18
- "ClinPred | 0.9602 | 0.5921\n",
19
- "REVEL | 0.9554 | 0.5828\n",
20
- "AlphaMissense | 0.9526 | 0.5764\n",
21
- "ESM1b | 0.9440 | 0.5492\n",
22
- "BayesDel_addAF | 0.9355 | 0.6880\n",
23
- "PrimateAI | 0.9298 | 0.4834\n",
24
- "MPC | 0.9210 | 0.4960\n",
25
- "EVE | 0.9188 | 0.5107\n",
26
- "PathoPreter | 0.9123 | 0.6204\n",
27
- "CADD_raw | 0.8980 | 0.6566\n",
28
- "========================================================================\n"
29
- ]
30
- }
31
- ],
32
- "source": [
33
import numpy as np
import pandas as pd
from sklearn.metrics import roc_auc_score, average_precision_score

# ---------- inputs ----------
# Same file names / slice size as the inference notebook that wrote the
# probabilities, so this cell can run on a fresh kernel instead of relying on a
# `df` left behind by an earlier session.
PROBS_PATH = "100k_probs.npy"
PARQUET_900K = "900k_test.parquet"
BOTTOM_K = 100_000


def _label_from_text(value):
    """Map a ClinVar-style label string to 1 (path*), 0 (ben*) or NaN (anything else)."""
    if pd.isna(value):
        return np.nan
    text = str(value).lower()
    if text.startswith("path"):
        return 1
    if text.startswith("ben"):
        return 0
    return np.nan


def _load_labelled_bottom_k(parquet_path, k):
    """Return the last ``k`` rows of the parquet file that carry a usable label.

    Mirrors the row selection done before inference (tail -> map labels -> drop
    unlabelled rows), so row order lines up with the saved probability vector.
    """
    frame = pd.read_parquet(parquet_path).tail(k).reset_index(drop=True)
    frame["labels"] = frame["clean_label"].map(_label_from_text)
    frame = frame.loc[frame["labels"].notna()].reset_index(drop=True)
    frame["labels"] = frame["labels"].astype(int)
    return frame


def _roc_and_pr(y, scores):
    """Return (ROC-AUC, PR-AUC); (NaN, NaN) when sklearn rejects the input."""
    try:
        return roc_auc_score(y, scores), average_precision_score(y, scores)
    except ValueError:
        # e.g. only one class present; keep the row in the table as NaN
        return np.nan, np.nan


df = _load_labelled_bottom_k(PARQUET_900K, BOTTOM_K)
y_true = df["labels"].values

# Load saved PathoPreter probabilities
probs = np.load(PROBS_PATH)
if len(probs) != len(y_true):
    raise ValueError(
        f"{PROBS_PATH} has {len(probs)} scores but {len(y_true)} labelled rows were loaded; "
        "the probabilities do not belong to this slice."
    )

bench_cols = [
    "CADD_raw_rankscore","REVEL_rankscore","AlphaMissense_rankscore",
    "ClinPred_rankscore","PrimateAI_rankscore","MPC_rankscore",
    "BayesDel_addAF_rankscore","EVE_rankscore","ESM1b_rankscore"
]

bench_results = []

# PathoPreter first (errors here are real problems, so they are not swallowed)
bench_results.append((
    "PathoPreter",
    roc_auc_score(y_true, probs),
    average_precision_score(y_true, probs)
))

# DBNSFP models
for c in bench_cols:
    if c in df.columns:
        # NOTE(review): missing benchmark scores are replaced by 0.0, i.e. ranked
        # as "most benign". This keeps every model on the same rows but penalises
        # models with low coverage -- confirm this is the intended comparison.
        scores = np.nan_to_num(df[c].to_numpy(), nan=0.0)
        auc, pr = _roc_and_pr(y_true, scores)
        bench_results.append((c.replace("_rankscore",""), auc, pr))

# Sort by ROC-AUC, best first; NaN rows are treated as 0.0 so they sink to the bottom
bench_results = sorted(
    bench_results,
    key=lambda row: 0.0 if np.isnan(row[1]) else float(row[1]),
    reverse=True
)

# Print leaderboard
print("\n" + "="*72)
print("🏆 PATHOGENICITY LEADERBOARD — Bottom 100k ClinVar")
print("="*72)
print(f"{'Model':20s} | {'ROC-AUC':8s} | {'PR-AUC':8s}")
print("-"*72)
for name, auc, pr in bench_results:
    print(f"{name:20s} | {auc:8.4f} | {pr:8.4f}")
print("="*72)
82
- ]
83
- }
84
- ],
85
- "metadata": {
86
- "kernelspec": {
87
- "display_name": ".venv",
88
- "language": "python",
89
- "name": "python3"
90
- },
91
- "language_info": {
92
- "codemirror_mode": {
93
- "name": "ipython",
94
- "version": 3
95
- },
96
- "file_extension": ".py",
97
- "mimetype": "text/x-python",
98
- "name": "python",
99
- "nbconvert_exporter": "python",
100
- "pygments_lexer": "ipython3",
101
- "version": "3.10.11"
102
- }
103
- },
104
- "nbformat": 4,
105
- "nbformat_minor": 2
106
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
Instadeep_NT_500M_CPT/100k_testing_recall.ipynb DELETED
@@ -1,315 +0,0 @@
1
- {
2
- "cells": [
3
- {
4
- "cell_type": "code",
5
- "execution_count": null,
6
- "metadata": {},
7
- "outputs": [
8
- {
9
- "name": "stderr",
10
- "output_type": "stream",
11
- "text": [
12
- "Inference @128: 100%|██████████| 782/782 [4:10:15<00:00, 19.20s/it] \n"
13
- ]
14
- },
15
- {
16
- "name": "stdout",
17
- "output_type": "stream",
18
- "text": [
19
- "Finished inference with batch=128 in 250.25 min\n",
20
- "Saved probabilities to 100k_probs.npy\n",
21
- "\n",
22
- "bottom-100000 metrics: ROC-AUC=0.9123 | PR-AUC=0.6204 (batch=128)\n",
23
- "Confusion (thr=0.5):\n",
24
- " [[83418 9395]\n",
25
- " [ 1097 6090]]\n",
26
- "Best-F1 thr=0.5832 -> Confusion:\n",
27
- " [[89911 2902]\n",
28
- " [ 2323 4864]]\n",
29
- "Brier score: 0.1676\n",
30
- "Recall@Top1%: 0.11172951161819951\n",
31
- "Recall@Top5%: 0.4886600807012661\n",
32
- "Recall@Top10%: 0.7528871573674689\n",
33
- "Recall @ FPR=1%: 0.3568 (thr=0.6822442412376404)\n"
34
- ]
35
- }
36
- ],
37
- "source": [
38
- "# =============================\n",
39
- "# RUN: Bottom-100k Evaluation (single cell)\n",
40
- "# - loads model + feat scalers\n",
41
- "# - takes the last 100k rows from 900k_test.parquet\n",
42
- "# - normalizes features exactly like training\n",
43
- "# - batched tokenization & inference with GPU-safe fallback\n",
44
- "# - metrics, leaderboard, ROC/PR, calibration, ranking metrics\n",
45
- "# =============================\n",
46
- "\n",
47
- "import os, time, gc, json\n",
48
- "from tqdm.auto import tqdm\n",
49
- "import numpy as np\n",
50
- "import pandas as pd\n",
51
- "import torch\n",
52
- "import torch.nn as nn\n",
53
- "import matplotlib.pyplot as plt\n",
54
- "import seaborn as sns\n",
55
- "from safetensors.torch import load_file\n",
56
- "from transformers import AutoTokenizer, AutoModel\n",
57
- "from sklearn.metrics import (\n",
58
- " roc_auc_score, average_precision_score, roc_curve,\n",
59
- " precision_recall_curve, confusion_matrix, brier_score_loss\n",
60
- ")\n",
61
- "from sklearn.calibration import calibration_curve\n",
62
- "\n",
63
# ---------- CONFIG ----------
# Paths and sizes used by the rest of the notebook.
MODEL_DIR = "PathoPreter_Ready_V1"      # directory with weights, metadata and scalers
PARQUET_900K = "900k_test.parquet"      # evaluation table
BOTTOM_K = 100_000                      # number of trailing rows to evaluate
OUT_PROBS = "100k_probs.npy"            # where predicted probabilities are written

# Tabular inputs fed to the classifier next to the sequence embedding.
# Order matters: it has to line up with feat_means / feat_stds.
feature_cols = [
    "gnomad_af",
    "GERP++_RS_rankscore",
    "GERP_91_mammals_rankscore",
    "phyloP100way_vertebrate_rankscore",
    "phyloP470way_mammalian_rankscore",
    "phyloP17way_primate_rankscore",
    "phastCons100way_vertebrate_rankscore",
    "phastCons470way_mammalian_rankscore",
    "phastCons17way_primate_rankscore",
]

# Third-party predictor columns used for the comparison leaderboard.
bench_cols = [
    "CADD_raw_rankscore",
    "REVEL_rankscore",
    "AlphaMissense_rankscore",
    "ClinPred_rankscore",
    "PrimateAI_rankscore",
    "MPC_rankscore",
    "BayesDel_addAF_rankscore",
    "EVE_rankscore",
    "ESM1b_rankscore",
]

# Prefer the GPU when one is visible to torch, otherwise fall back to CPU.
if torch.cuda.is_available():
    DEVICE = torch.device("cuda")
else:
    DEVICE = torch.device("cpu")
print("Device:", DEVICE)
if DEVICE.type == "cuda":
    print(torch.cuda.get_device_properties(0))
92
- "\n",
93
- "# ---------- helpers ----------\n",
94
def map_label_str(x):
    """Convert a textual clinical label into a binary target.

    Returns 1 when the lower-cased text starts with "path", 0 when it starts
    with "ben", and NaN for missing values or any other text.
    """
    if pd.isna(x):
        return np.nan
    lowered = str(x).lower()
    # prefixes are mutually exclusive, so lookup order does not matter
    for prefix, target in (("path", 1), ("ben", 0)):
        if lowered.startswith(prefix):
            return target
    return np.nan
100
- "\n",
101
class SequenceClassificationWithFeatures(nn.Module):
    """Encoder plus MLP head that classifies from pooled token states and extra features.

    The encoder output is mean-pooled over the positions selected by
    ``attention_mask``, concatenated with ``features`` along dim 1, and passed
    through a Linear -> GELU -> Dropout(0.1) -> Linear head.
    """

    def __init__(self, encoder, hidden_size, feature_dim, num_labels):
        super().__init__()
        self.encoder = encoder
        fused_width = hidden_size + feature_dim
        # layer order is part of the checkpoint layout (classifier.0 / classifier.3)
        head_layers = [
            nn.Linear(fused_width, hidden_size),
            nn.GELU(),
            nn.Dropout(0.1),
            nn.Linear(hidden_size, num_labels),
        ]
        self.classifier = nn.Sequential(*head_layers)

    def forward(self, input_ids=None, attention_mask=None, features=None):
        """Return the raw logits tensor for a batch."""
        encoded = self.encoder(
            input_ids=input_ids,
            attention_mask=attention_mask,
            return_dict=True,
        )
        token_states = encoded.last_hidden_state
        keep = attention_mask.unsqueeze(-1)
        # masked mean: sum of kept token states divided by number of kept tokens
        summed = (token_states * keep).sum(1)
        counts = keep.sum(1).clamp(min=1e-9)
        pooled = summed / counts
        # align the tabular features with the pooled embedding before concatenating
        features = features.to(pooled.device).to(pooled.dtype)
        fused = torch.cat([pooled, features], dim=1)
        return self.classifier(fused)
119
- "\n",
120
# ---------- load metadata + scalers + tokenizer ----------
print("Loading model metadata and scalers...")
meta_path = os.path.join(MODEL_DIR, "model_metadata.json")
if not os.path.exists(meta_path):
    raise FileNotFoundError("Missing model metadata: " + meta_path)
with open(meta_path, "r") as f:
    meta = json.load(f)

feat_means_path = os.path.join(MODEL_DIR, "feat_means.npy")
feat_stds_path = os.path.join(MODEL_DIR, "feat_stds.npy")
if not (os.path.exists(feat_means_path) and os.path.exists(feat_stds_path)):
    raise FileNotFoundError("Missing feat_means.npy or feat_stds.npy in model directory.")
feat_means = np.load(feat_means_path)
feat_stds = np.load(feat_stds_path)

# sanity check feature lengths
if len(feat_means) != len(feature_cols):
    print("Warning: feat_means length != feature_cols. Using feature_cols from meta if present.")
    if "feature_cols" in meta:
        feature_cols = meta["feature_cols"]
        print("Using meta feature_cols length:", len(feature_cols))
    else:
        raise RuntimeError("feature_cols mismatch; check model metadata.")

# Re-check after the possible fallback: the scalers are applied column-wise, so
# all three must have the same length or normalisation would fail or broadcast wrongly.
if not (len(feat_means) == len(feat_stds) == len(feature_cols)):
    raise RuntimeError(
        "feature_cols mismatch; check model metadata. "
        f"(means={len(feat_means)}, stds={len(feat_stds)}, feature_cols={len(feature_cols)})"
    )

print("Loading tokenizer...")
tokenizer = AutoTokenizer.from_pretrained("InstaDeepAI/nucleotide-transformer-500m-human-ref", trust_remote_code=True)

# ---------- load model weights safely ----------
print("Loading encoder and model weights (safetensors)...")
base_encoder = AutoModel.from_pretrained(MODEL_DIR, trust_remote_code=True)
hidden_size = base_encoder.config.hidden_size
FEATURE_DIM = len(feature_cols)
NUM_LABELS = meta.get("num_labels", 2)

model = SequenceClassificationWithFeatures(base_encoder, hidden_size, FEATURE_DIM, NUM_LABELS)
state_path = os.path.join(MODEL_DIR, "model.safetensors")
if not os.path.exists(state_path):
    raise FileNotFoundError("Missing model.safetensors in " + MODEL_DIR)
# load_file already returns torch tensors, so the dict can be passed on directly
state = load_file(state_path)
missing, unexpected = model.load_state_dict(state, strict=False)
print("Loaded weights (strict=False). Missing keys:", len(missing), "Unexpected keys:", len(unexpected))
# Show what was skipped instead of only counting it, so a partial load is visible.
if missing:
    print("  missing (first 10):", list(missing)[:10])
if unexpected:
    print("  unexpected (first 10):", list(unexpected)[:10])
# A classifier head that was not restored would stay randomly initialised and
# every metric below would be meaningless, so that case is a hard error.
head_missing = [key for key in missing if key.startswith("classifier.")]
if head_missing:
    raise RuntimeError(
        "Classifier weights were not found in " + state_path + ": " + ", ".join(head_missing)
    )
model.to(DEVICE).eval()
torch.cuda.empty_cache()
164
- "\n",
165
# ---------- prepare bottom-100k dataframe ----------
# Read the full table, keep only the trailing BOTTOM_K rows, then release the rest.
print(f"\nLoading {PARQUET_900K} and slicing last {BOTTOM_K} rows (bottom)...")
if not os.path.exists(PARQUET_900K):
    raise FileNotFoundError("Missing parquet file: " + PARQUET_900K)
df_all = pd.read_parquet(PARQUET_900K)
print("Total rows in file:", len(df_all))
df = df_all.tail(BOTTOM_K).reset_index(drop=True)
print("Sliced rows:", len(df))
del df_all
gc.collect()

# Map text labels to 0/1 and drop rows whose label could not be mapped.
df["labels"] = df["clean_label"].map(map_label_str)
valid_mask = df["labels"].notna()
print("Rows with labels present:", valid_mask.sum())
df = (
    df[valid_mask]
    .reset_index(drop=True)
    .assign(labels=lambda kept: kept["labels"].astype(int))
)
182
- "\n",
183
- "# ---------- inference routine ----------\n",
184
def run_inference_on_df(df, name="bottom100k", batch_candidates=(2048,1536,1024,768,512,256,128)):
    """Score every row of ``df`` with the hybrid model and print evaluation metrics.

    Uses the module-level ``tokenizer``, ``model``, ``DEVICE``, ``feature_cols``,
    ``feat_means``, ``feat_stds`` and ``OUT_PROBS``.

    Args:
        df: frame with a ``raw_sequence`` column, the ``feature_cols`` columns and
            an integer ``labels`` column.
        name: label used in the printed messages.
        batch_candidates: batch sizes to try in order; the next one is tried only
            when the current one runs out of memory.

    Side effects:
        Saves the class-1 probabilities to ``OUT_PROBS`` and prints ROC-AUC,
        PR-AUC, confusion matrices, Brier score and ranking metrics.

    Raises:
        ValueError: if ``df`` is empty.
        RuntimeError: if every batch size fails, or on any non-OOM runtime error.
    """
    if len(df) == 0:
        raise ValueError("run_inference_on_df received an empty dataframe.")

    print(f"\nStarting inference on {name} ({len(df)} rows)")
    # prepare sequences and features
    seqs = df["raw_sequence"].astype(str).tolist()
    feats = df[feature_cols].copy()
    # impute missing with training means (becomes 0 after normalisation)
    feats = feats.fillna(pd.Series(feat_means, index=feature_cols))
    feats_arr = feats.values.astype(np.float32)
    feats_norm = (feats_arr - feat_means.reshape(1,-1)) / (feat_stds.reshape(1,-1) + 1e-9)
    feats_tensor = torch.from_numpy(feats_norm)

    y_true = df["labels"].values

    # Only genuine allocation failures justify retrying with a smaller batch.
    # Matching on "cuda" alone would also retry (and hide) device-side asserts,
    # illegal memory accesses, driver errors, etc.
    oom_markers = ("out of memory", "alloc_failed")

    probs = None
    chosen_bs = None
    for bs in batch_candidates:
        try:
            print(f"\nTrying batch size {bs} ...")
            probs_chunks = []
            t0 = time.time()
            for i in tqdm(range(0, len(seqs), bs), desc=f"Inference @{bs}"):
                j = min(len(seqs), i+bs)
                batch_seqs = seqs[i:j]
                # NOTE(review): padding="max_length" pads every batch to the
                # tokenizer maximum; dynamic padding would likely be faster but
                # is left unchanged to keep results identical.
                tok = tokenizer(batch_seqs, padding="max_length", truncation=True,
                                max_length=tokenizer.model_max_length, return_tensors="pt")
                ids = tok["input_ids"].to(DEVICE)
                mask = tok["attention_mask"].to(DEVICE)
                feats_batch = feats_tensor[i:j].to(DEVICE, non_blocking=True)

                with torch.no_grad():
                    logits = model(ids, mask, feats_batch)
                    # probability of class index 1
                    probs_batch = torch.softmax(logits, dim=1)[:, 1].cpu()
                    probs_chunks.append(probs_batch)

                # cleanup
                del ids, mask, feats_batch, tok, logits, probs_batch
                torch.cuda.empty_cache()

            probs = torch.cat(probs_chunks).numpy()
            chosen_bs = bs
            elapsed = (time.time() - t0) / 60.0
            print(f"Finished inference with batch={bs} in {elapsed:.2f} min")
            break

        except RuntimeError as e:
            msg = str(e).lower()
            print(f"RuntimeError at bs={bs}: {msg}")
            if not any(marker in msg for marker in oom_markers):
                raise
            print("  -> OOM, clearing cache and trying next smaller batch")
            torch.cuda.empty_cache(); gc.collect(); time.sleep(2)
            continue

    if probs is None:
        raise RuntimeError("All batch sizes failed.")

    # save probs
    np.save(OUT_PROBS, probs)
    print("Saved probabilities to", OUT_PROBS)

    # metrics
    roc = roc_auc_score(y_true, probs)
    ap = average_precision_score(y_true, probs)
    print(f"\n{name} metrics: ROC-AUC={roc:.4f} | PR-AUC={ap:.4f} (batch={chosen_bs})")

    # confusion at 0.5
    y_pred05 = (probs >= 0.5).astype(int)
    cm05 = confusion_matrix(y_true, y_pred05)
    print("Confusion (thr=0.5):\n", cm05)

    # best F1 threshold via precision-recall curve
    prec, rec, thr = precision_recall_curve(y_true, probs)
    f1 = 2 * prec * rec / (prec + rec + 1e-12)
    if len(thr) > 0:
        # prec/rec have one more entry than thr; drop the final point, which has no threshold
        best_idx = np.nanargmax(f1[:-1])
        best_thr = thr[best_idx]
    else:
        best_thr = 0.5
    y_pred_best = (probs >= best_thr).astype(int)
    cm_best = confusion_matrix(y_true, y_pred_best)
    print(f"Best-F1 thr={best_thr:.4f} -> Confusion:\n", cm_best)

    # calibration (summary statistic only; nothing downstream used the binned curve)
    brier = brier_score_loss(y_true, probs)
    print(f"Brier score: {brier:.4f}")

    # ranking metrics
    def recall_at_top_frac(scores, labels, frac):
        """Fraction of all positives found among the top ``frac`` highest scores."""
        k = max(1, int(len(scores) * frac))
        idx = np.argsort(scores)[-k:]
        return labels[idx].sum() / (labels.sum() + 1e-12)

    print("Recall@Top1%:", recall_at_top_frac(probs, y_true, 0.01))
    print("Recall@Top5%:", recall_at_top_frac(probs, y_true, 0.05))
    print("Recall@Top10%:", recall_at_top_frac(probs, y_true, 0.10))

    # recall at fixed FPR=1%: best TPR among ROC points whose FPR does not exceed 1%
    fpr_vals, tpr_vals, t_thresh = roc_curve(y_true, probs)
    valid = np.where(fpr_vals <= 0.01)[0]
    if len(valid) > 0:
        idx = valid[np.argmax(tpr_vals[valid])]
        rec_at_1pct, thr_at_1pct = tpr_vals[idx], t_thresh[idx]
    else:
        rec_at_1pct, thr_at_1pct = 0.0, None
    print(f"Recall @ FPR=1%: {rec_at_1pct:.4f} (thr={thr_at_1pct})")
291
- ]
292
- }
293
- ],
294
- "metadata": {
295
- "kernelspec": {
296
- "display_name": ".venv",
297
- "language": "python",
298
- "name": "python3"
299
- },
300
- "language_info": {
301
- "codemirror_mode": {
302
- "name": "ipython",
303
- "version": 3
304
- },
305
- "file_extension": ".py",
306
- "mimetype": "text/x-python",
307
- "name": "python",
308
- "nbconvert_exporter": "python",
309
- "pygments_lexer": "ipython3",
310
- "version": "3.10.11"
311
- }
312
- },
313
- "nbformat": 4,
314
- "nbformat_minor": 2
315
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
Instadeep_NT_500M_CPT/Neucletide_transformer.ipynb DELETED
The diff for this file is too large to render. See raw diff
 
Instadeep_NT_500M_CPT/PathScan/README.txt DELETED
@@ -1,24 +0,0 @@
1
-
2
- PATHO-PRETER v1 (A100 Fine-Tune)
3
- ================================
4
- Trained by: Rohit
5
- Base Model: Nucleotide Transformer 500M
6
- Architecture: Hybrid (DNA Sequence + 9 Conservation Scores)
7
-
8
- HOW TO LOAD:
9
- 1. Unzip this folder.
10
- 2. Place 'modeling_pathopreter.py' on your Python path (for example, next to your script).
11
- 3. Run:
12
-
13
- from modeling_pathopreter import SequenceClassificationWithFeatures
14
- import numpy as np
15
-
16
- # Load Model (call model.eval() before inference so dropout is disabled)
17
- model = SequenceClassificationWithFeatures.from_pretrained("./PathoPreter_Final_A100")
18
-
19
- # Load Scalers (Crucial for inference!)
20
- means = np.load("./PathoPreter_Final_A100/feat_means.npy")
21
- stds = np.load("./PathoPreter_Final_A100/feat_stds.npy")
22
-
23
- # Preprocessing
24
- # features_norm = (features - means) / (stds + 1e-9)   # small epsilon guards against a zero std
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
Instadeep_NT_500M_CPT/PathScan/config.json DELETED
@@ -1,30 +0,0 @@
1
- {
2
- "architectures": [
3
- "SequenceClassificationWithFeatures"
4
- ],
5
- "attention_probs_dropout_prob": 0.0,
6
- "custom_feature_dim": 9,
7
- "custom_num_labels": 2,
8
- "dtype": "float32",
9
- "emb_layer_norm_before": false,
10
- "esmfold_config": null,
11
- "hidden_dropout_prob": 0.0,
12
- "hidden_size": 1280,
13
- "initializer_range": 0.02,
14
- "intermediate_size": 5120,
15
- "is_folding_model": false,
16
- "layer_norm_eps": 1e-12,
17
- "mask_token_id": 2,
18
- "max_position_embeddings": 1002,
19
- "model_type": "esm",
20
- "num_attention_heads": 20,
21
- "num_hidden_layers": 24,
22
- "pad_token_id": 1,
23
- "position_embedding_type": "absolute",
24
- "tie_word_embeddings": false,
25
- "token_dropout": true,
26
- "transformers_version": "4.57.4",
27
- "use_cache": false,
28
- "vocab_list": null,
29
- "vocab_size": 4105
30
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
Instadeep_NT_500M_CPT/PathScan/feat_means.npy DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:c55660bf4e0dbedc093efc8625eec3d08b6a82a1a791fa0734d77b4550b0d2d8
3
- size 164
 
 
 
 
Instadeep_NT_500M_CPT/PathScan/feat_stds.npy DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:39717a36811a53b5043ebf2892993e148bf3082e88f1a0c4066955b23cb57579
3
- size 164
 
 
 
 
Instadeep_NT_500M_CPT/PathScan/model.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:b4f8c7bb2fccb923fbbfe3fbe8e88e9cbb0539cb36a1989caedbcd5131855365
3
- size 1928412764
 
 
 
 
Instadeep_NT_500M_CPT/PathScan/model_metadata.json DELETED
@@ -1,17 +0,0 @@
1
- {
2
- "feature_cols": [
3
- "gnomad_af",
4
- "GERP++_RS_rankscore",
5
- "GERP_91_mammals_rankscore",
6
- "phyloP100way_vertebrate_rankscore",
7
- "phyloP470way_mammalian_rankscore",
8
- "phyloP17way_primate_rankscore",
9
- "phastCons100way_vertebrate_rankscore",
10
- "phastCons470way_mammalian_rankscore",
11
- "phastCons17way_primate_rankscore"
12
- ],
13
- "num_labels": 2,
14
- "feature_dim": 9,
15
- "model_type": "nt-500m-hybrid",
16
- "base_model": "InstaDeepAI/nucleotide-transformer-500m-human-ref"
17
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
Instadeep_NT_500M_CPT/PathScan/modeling_pathopreter.py DELETED
@@ -1,65 +0,0 @@
1
-
2
- import torch
3
- import torch.nn as nn
4
- from transformers import AutoModel
5
- from transformers.modeling_outputs import SequenceClassifierOutput
6
-
7
class SequenceClassificationWithFeatures(nn.Module):
    """Sequence encoder with an MLP head that also consumes per-example features.

    The pooled encoder representation is concatenated with ``features`` along
    dim 1 and passed through Linear -> GELU -> Dropout(0.1) -> Linear.

    Args:
        encoder: module called as ``encoder(input_ids=..., attention_mask=...,
            return_dict=True)`` whose output exposes ``last_hidden_state`` and
            optionally ``pooler_output``.
        hidden_size: width of the encoder's pooled representation.
        feature_dim: number of extra feature columns per example.
        num_labels: number of output classes.
    """

    def __init__(self, encoder, hidden_size, feature_dim, num_labels):
        super().__init__()
        self.encoder = encoder
        self.feature_dim = feature_dim
        self.classifier = nn.Sequential(
            nn.Linear(hidden_size + feature_dim, hidden_size),
            nn.GELU(),
            nn.Dropout(0.1),
            nn.Linear(hidden_size, num_labels)
        )

    @classmethod
    def from_pretrained(cls, path, device="cpu"):
        """Build the model from a directory and return it on ``device`` in eval mode.

        Reads ``model_metadata.json`` (keys ``feature_dim`` and ``num_labels``) and
        ``model.safetensors`` from ``path``; the encoder is created with
        ``AutoModel.from_pretrained(path)``.

        The returned model is switched to evaluation mode so the classifier's
        dropout is inactive for inference; call ``.train()`` before fine-tuning.
        """
        import json
        import os
        from safetensors.torch import load_file

        # Load Config
        with open(os.path.join(path, "model_metadata.json"), "r") as f:
            meta = json.load(f)

        # Load Encoder
        encoder = AutoModel.from_pretrained(path, trust_remote_code=True)

        # Init Model
        model = cls(
            encoder=encoder,
            hidden_size=encoder.config.hidden_size,
            feature_dim=meta["feature_dim"],
            num_labels=meta["num_labels"]
        )

        # Load Weights (strict: every parameter must be present in the checkpoint)
        state_dict = load_file(os.path.join(path, "model.safetensors"))
        model.load_state_dict(state_dict)

        # A freshly constructed nn.Module is in training mode; without this the
        # Dropout layer in the head would stay active for callers who only predict.
        model.eval()

        return model.to(device)

    def forward(self, input_ids=None, attention_mask=None, features=None, labels=None):
        """Return a ``SequenceClassifierOutput`` with ``logits`` and, if ``labels`` is given, ``loss``.

        Raises:
            ValueError: if ``features`` is missing or is not shaped
                ``(batch, feature_dim)``.
        """
        # Validate up front so a missing/mis-shaped feature tensor yields a clear
        # message instead of an AttributeError or a matmul shape error later on.
        if features is None:
            raise ValueError("`features` is required: pass a (batch, feature_dim) tensor.")
        if features.dim() != 2 or features.shape[1] != self.feature_dim:
            raise ValueError(
                f"`features` must have shape (batch, {self.feature_dim}), got {tuple(features.shape)}."
            )

        out = self.encoder(input_ids=input_ids, attention_mask=attention_mask, return_dict=True)

        # NOTE(review): the pooler output is preferred when the encoder provides
        # one, whereas the evaluation notebook in this repo always uses masked
        # mean pooling -- confirm which pooling the checkpoint was trained with.
        if hasattr(out, "pooler_output") and out.pooler_output is not None:
            pooled = out.pooler_output
        else:
            last = out.last_hidden_state
            if attention_mask is None:
                # no mask supplied: treat every position as a real token
                attention_mask = torch.ones(last.shape[:2], dtype=last.dtype, device=last.device)
            mask = attention_mask.unsqueeze(-1)
            # masked mean over the sequence dimension
            pooled = (last * mask).sum(1) / mask.sum(1).clamp(min=1e-9)

        # Cast features to match model dtype/device
        features = features.to(pooled.device).to(pooled.dtype)
        x = torch.cat([pooled, features], dim=1)
        logits = self.classifier(x)

        loss = None
        if labels is not None:
            loss = nn.CrossEntropyLoss()(logits, labels)

        return SequenceClassifierOutput(loss=loss, logits=logits)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
Instadeep_NT_500M_CPT/PathScan/special_tokens_map.json DELETED
@@ -1,6 +0,0 @@
1
- {
2
- "cls_token": "<cls>",
3
- "mask_token": "<mask>",
4
- "pad_token": "<pad>",
5
- "unk_token": "<unk>"
6
- }
 
 
 
 
 
 
 
Instadeep_NT_500M_CPT/PathScan/tokenizer_config.json DELETED
@@ -1,45 +0,0 @@
1
- {
2
- "added_tokens_decoder": {
3
- "0": {
4
- "content": "<unk>",
5
- "lstrip": false,
6
- "normalized": false,
7
- "rstrip": false,
8
- "single_word": false,
9
- "special": true
10
- },
11
- "1": {
12
- "content": "<pad>",
13
- "lstrip": false,
14
- "normalized": false,
15
- "rstrip": false,
16
- "single_word": false,
17
- "special": true
18
- },
19
- "2": {
20
- "content": "<mask>",
21
- "lstrip": false,
22
- "normalized": false,
23
- "rstrip": false,
24
- "single_word": false,
25
- "special": true
26
- },
27
- "3": {
28
- "content": "<cls>",
29
- "lstrip": false,
30
- "normalized": false,
31
- "rstrip": false,
32
- "single_word": false,
33
- "special": true
34
- }
35
- },
36
- "clean_up_tokenization_spaces": true,
37
- "cls_token": "<cls>",
38
- "eos_token": null,
39
- "extra_special_tokens": {},
40
- "mask_token": "<mask>",
41
- "model_max_length": 1000,
42
- "pad_token": "<pad>",
43
- "tokenizer_class": "EsmTokenizer",
44
- "unk_token": "<unk>"
45
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
Instadeep_NT_500M_CPT/PathScan/vocab.txt DELETED
@@ -1,4107 +0,0 @@
1
- <unk>
2
- <pad>
3
- <mask>
4
- <cls>
5
- AAAAAA
6
- AAAAAT
7
- AAAAAC
8
- AAAAAG
9
- AAAATA
10
- AAAATT
11
- AAAATC
12
- AAAATG
13
- AAAACA
14
- AAAACT
15
- AAAACC
16
- AAAACG
17
- AAAAGA
18
- AAAAGT
19
- AAAAGC
20
- AAAAGG
21
- AAATAA
22
- AAATAT
23
- AAATAC
24
- AAATAG
25
- AAATTA
26
- AAATTT
27
- AAATTC
28
- AAATTG
29
- AAATCA
30
- AAATCT
31
- AAATCC
32
- AAATCG
33
- AAATGA
34
- AAATGT
35
- AAATGC
36
- AAATGG
37
- AAACAA
38
- AAACAT
39
- AAACAC
40
- AAACAG
41
- AAACTA
42
- AAACTT
43
- AAACTC
44
- AAACTG
45
- AAACCA
46
- AAACCT
47
- AAACCC
48
- AAACCG
49
- AAACGA
50
- AAACGT
51
- AAACGC
52
- AAACGG
53
- AAAGAA
54
- AAAGAT
55
- AAAGAC
56
- AAAGAG
57
- AAAGTA
58
- AAAGTT
59
- AAAGTC
60
- AAAGTG
61
- AAAGCA
62
- AAAGCT
63
- AAAGCC
64
- AAAGCG
65
- AAAGGA
66
- AAAGGT
67
- AAAGGC
68
- AAAGGG
69
- AATAAA
70
- AATAAT
71
- AATAAC
72
- AATAAG
73
- AATATA
74
- AATATT
75
- AATATC
76
- AATATG
77
- AATACA
78
- AATACT
79
- AATACC
80
- AATACG
81
- AATAGA
82
- AATAGT
83
- AATAGC
84
- AATAGG
85
- AATTAA
86
- AATTAT
87
- AATTAC
88
- AATTAG
89
- AATTTA
90
- AATTTT
91
- AATTTC
92
- AATTTG
93
- AATTCA
94
- AATTCT
95
- AATTCC
96
- AATTCG
97
- AATTGA
98
- AATTGT
99
- AATTGC
100
- AATTGG
101
- AATCAA
102
- AATCAT
103
- AATCAC
104
- AATCAG
105
- AATCTA
106
- AATCTT
107
- AATCTC
108
- AATCTG
109
- AATCCA
110
- AATCCT
111
- AATCCC
112
- AATCCG
113
- AATCGA
114
- AATCGT
115
- AATCGC
116
- AATCGG
117
- AATGAA
118
- AATGAT
119
- AATGAC
120
- AATGAG
121
- AATGTA
122
- AATGTT
123
- AATGTC
124
- AATGTG
125
- AATGCA
126
- AATGCT
127
- AATGCC
128
- AATGCG
129
- AATGGA
130
- AATGGT
131
- AATGGC
132
- AATGGG
133
- AACAAA
134
- AACAAT
135
- AACAAC
136
- AACAAG
137
- AACATA
138
- AACATT
139
- AACATC
140
- AACATG
141
- AACACA
142
- AACACT
143
- AACACC
144
- AACACG
145
- AACAGA
146
- AACAGT
147
- AACAGC
148
- AACAGG
149
- AACTAA
150
- AACTAT
151
- AACTAC
152
- AACTAG
153
- AACTTA
154
- AACTTT
155
- AACTTC
156
- AACTTG
157
- AACTCA
158
- AACTCT
159
- AACTCC
160
- AACTCG
161
- AACTGA
162
- AACTGT
163
- AACTGC
164
- AACTGG
165
- AACCAA
166
- AACCAT
167
- AACCAC
168
- AACCAG
169
- AACCTA
170
- AACCTT
171
- AACCTC
172
- AACCTG
173
- AACCCA
174
- AACCCT
175
- AACCCC
176
- AACCCG
177
- AACCGA
178
- AACCGT
179
- AACCGC
180
- AACCGG
181
- AACGAA
182
- AACGAT
183
- AACGAC
184
- AACGAG
185
- AACGTA
186
- AACGTT
187
- AACGTC
188
- AACGTG
189
- AACGCA
190
- AACGCT
191
- AACGCC
192
- AACGCG
193
- AACGGA
194
- AACGGT
195
- AACGGC
196
- AACGGG
197
- AAGAAA
198
- AAGAAT
199
- AAGAAC
200
- AAGAAG
201
- AAGATA
202
- AAGATT
203
- AAGATC
204
- AAGATG
205
- AAGACA
206
- AAGACT
207
- AAGACC
208
- AAGACG
209
- AAGAGA
210
- AAGAGT
211
- AAGAGC
212
- AAGAGG
213
- AAGTAA
214
- AAGTAT
215
- AAGTAC
216
- AAGTAG
217
- AAGTTA
218
- AAGTTT
219
- AAGTTC
220
- AAGTTG
221
- AAGTCA
222
- AAGTCT
223
- AAGTCC
224
- AAGTCG
225
- AAGTGA
226
- AAGTGT
227
- AAGTGC
228
- AAGTGG
229
- AAGCAA
230
- AAGCAT
231
- AAGCAC
232
- AAGCAG
233
- AAGCTA
234
- AAGCTT
235
- AAGCTC
236
- AAGCTG
237
- AAGCCA
238
- AAGCCT
239
- AAGCCC
240
- AAGCCG
241
- AAGCGA
242
- AAGCGT
243
- AAGCGC
244
- AAGCGG
245
- AAGGAA
246
- AAGGAT
247
- AAGGAC
248
- AAGGAG
249
- AAGGTA
250
- AAGGTT
251
- AAGGTC
252
- AAGGTG
253
- AAGGCA
254
- AAGGCT
255
- AAGGCC
256
- AAGGCG
257
- AAGGGA
258
- AAGGGT
259
- AAGGGC
260
- AAGGGG
261
- ATAAAA
262
- ATAAAT
263
- ATAAAC
264
- ATAAAG
265
- ATAATA
266
- ATAATT
267
- ATAATC
268
- ATAATG
269
- ATAACA
270
- ATAACT
271
- ATAACC
272
- ATAACG
273
- ATAAGA
274
- ATAAGT
275
- ATAAGC
276
- ATAAGG
277
- ATATAA
278
- ATATAT
279
- ATATAC
280
- ATATAG
281
- ATATTA
282
- ATATTT
283
- ATATTC
284
- ATATTG
285
- ATATCA
286
- ATATCT
287
- ATATCC
288
- ATATCG
289
- ATATGA
290
- ATATGT
291
- ATATGC
292
- ATATGG
293
- ATACAA
294
- ATACAT
295
- ATACAC
296
- ATACAG
297
- ATACTA
298
- ATACTT
299
- ATACTC
300
- ATACTG
301
- ATACCA
302
- ATACCT
303
- ATACCC
304
- ATACCG
305
- ATACGA
306
- ATACGT
307
- ATACGC
308
- ATACGG
309
- ATAGAA
310
- ATAGAT
311
- ATAGAC
312
- ATAGAG
313
- ATAGTA
314
- ATAGTT
315
- ATAGTC
316
- ATAGTG
317
- ATAGCA
318
- ATAGCT
319
- ATAGCC
320
- ATAGCG
321
- ATAGGA
322
- ATAGGT
323
- ATAGGC
324
- ATAGGG
325
- ATTAAA
326
- ATTAAT
327
- ATTAAC
328
- ATTAAG
329
- ATTATA
330
- ATTATT
331
- ATTATC
332
- ATTATG
333
- ATTACA
334
- ATTACT
335
- ATTACC
336
- ATTACG
337
- ATTAGA
338
- ATTAGT
339
- ATTAGC
340
- ATTAGG
341
- ATTTAA
342
- ATTTAT
343
- ATTTAC
344
- ATTTAG
345
- ATTTTA
346
- ATTTTT
347
- ATTTTC
348
- ATTTTG
349
- ATTTCA
350
- ATTTCT
351
- ATTTCC
352
- ATTTCG
353
- ATTTGA
354
- ATTTGT
355
- ATTTGC
356
- ATTTGG
357
- ATTCAA
358
- ATTCAT
359
- ATTCAC
360
- ATTCAG
361
- ATTCTA
362
- ATTCTT
363
- ATTCTC
364
- ATTCTG
365
- ATTCCA
366
- ATTCCT
367
- ATTCCC
368
- ATTCCG
369
- ATTCGA
370
- ATTCGT
371
- ATTCGC
372
- ATTCGG
373
- ATTGAA
374
- ATTGAT
375
- ATTGAC
376
- ATTGAG
377
- ATTGTA
378
- ATTGTT
379
- ATTGTC
380
- ATTGTG
381
- ATTGCA
382
- ATTGCT
383
- ATTGCC
384
- ATTGCG
385
- ATTGGA
386
- ATTGGT
387
- ATTGGC
388
- ATTGGG
389
- ATCAAA
390
- ATCAAT
391
- ATCAAC
392
- ATCAAG
393
- ATCATA
394
- ATCATT
395
- ATCATC
396
- ATCATG
397
- ATCACA
398
- ATCACT
399
- ATCACC
400
- ATCACG
401
- ATCAGA
402
- ATCAGT
403
- ATCAGC
404
- ATCAGG
405
- ATCTAA
406
- ATCTAT
407
- ATCTAC
408
- ATCTAG
409
- ATCTTA
410
- ATCTTT
411
- ATCTTC
412
- ATCTTG
413
- ATCTCA
414
- ATCTCT
415
- ATCTCC
416
- ATCTCG
417
- ATCTGA
418
- ATCTGT
419
- ATCTGC
420
- ATCTGG
421
- ATCCAA
422
- ATCCAT
423
- ATCCAC
424
- ATCCAG
425
- ATCCTA
426
- ATCCTT
427
- ATCCTC
428
- ATCCTG
429
- ATCCCA
430
- ATCCCT
431
- ATCCCC
432
- ATCCCG
433
- ATCCGA
434
- ATCCGT
435
- ATCCGC
436
- ATCCGG
437
- ATCGAA
438
- ATCGAT
439
- ATCGAC
440
- ATCGAG
441
- ATCGTA
442
- ATCGTT
443
- ATCGTC
444
- ATCGTG
445
- ATCGCA
446
- ATCGCT
447
- ATCGCC
448
- ATCGCG
449
- ATCGGA
450
- ATCGGT
451
- ATCGGC
452
- ATCGGG
453
- ATGAAA
454
- ATGAAT
455
- ATGAAC
456
- ATGAAG
457
- ATGATA
458
- ATGATT
459
- ATGATC
460
- ATGATG
461
- ATGACA
462
- ATGACT
463
- ATGACC
464
- ATGACG
465
- ATGAGA
466
- ATGAGT
467
- ATGAGC
468
- ATGAGG
469
- ATGTAA
470
- ATGTAT
471
- ATGTAC
472
- ATGTAG
473
- ATGTTA
474
- ATGTTT
475
- ATGTTC
476
- ATGTTG
477
- ATGTCA
478
- ATGTCT
479
- ATGTCC
480
- ATGTCG
481
- ATGTGA
482
- ATGTGT
483
- ATGTGC
484
- ATGTGG
485
- ATGCAA
486
- ATGCAT
487
- ATGCAC
488
- ATGCAG
489
- ATGCTA
490
- ATGCTT
491
- ATGCTC
492
- ATGCTG
493
- ATGCCA
494
- ATGCCT
495
- ATGCCC
496
- ATGCCG
497
- ATGCGA
498
- ATGCGT
499
- ATGCGC
500
- ATGCGG
501
- ATGGAA
502
- ATGGAT
503
- ATGGAC
504
- ATGGAG
505
- ATGGTA
506
- ATGGTT
507
- ATGGTC
508
- ATGGTG
509
- ATGGCA
510
- ATGGCT
511
- ATGGCC
512
- ATGGCG
513
- ATGGGA
514
- ATGGGT
515
- ATGGGC
516
- ATGGGG
517
- ACAAAA
518
- ACAAAT
519
- ACAAAC
520
- ACAAAG
521
- ACAATA
522
- ACAATT
523
- ACAATC
524
- ACAATG
525
- ACAACA
526
- ACAACT
527
- ACAACC
528
- ACAACG
529
- ACAAGA
530
- ACAAGT
531
- ACAAGC
532
- ACAAGG
533
- ACATAA
534
- ACATAT
535
- ACATAC
536
- ACATAG
537
- ACATTA
538
- ACATTT
539
- ACATTC
540
- ACATTG
541
- ACATCA
542
- ACATCT
543
- ACATCC
544
- ACATCG
545
- ACATGA
546
- ACATGT
547
- ACATGC
548
- ACATGG
549
- ACACAA
550
- ACACAT
551
- ACACAC
552
- ACACAG
553
- ACACTA
554
- ACACTT
555
- ACACTC
556
- ACACTG
557
- ACACCA
558
- ACACCT
559
- ACACCC
560
- ACACCG
561
- ACACGA
562
- ACACGT
563
- ACACGC
564
- ACACGG
565
- ACAGAA
566
- ACAGAT
567
- ACAGAC
568
- ACAGAG
569
- ACAGTA
570
- ACAGTT
571
- ACAGTC
572
- ACAGTG
573
- ACAGCA
574
- ACAGCT
575
- ACAGCC
576
- ACAGCG
577
- ACAGGA
578
- ACAGGT
579
- ACAGGC
580
- ACAGGG
581
- ACTAAA
582
- ACTAAT
583
- ACTAAC
584
- ACTAAG
585
- ACTATA
586
- ACTATT
587
- ACTATC
588
- ACTATG
589
- ACTACA
590
- ACTACT
591
- ACTACC
592
- ACTACG
593
- ACTAGA
594
- ACTAGT
595
- ACTAGC
596
- ACTAGG
597
- ACTTAA
598
- ACTTAT
599
- ACTTAC
600
- ACTTAG
601
- ACTTTA
602
- ACTTTT
603
- ACTTTC
604
- ACTTTG
605
- ACTTCA
606
- ACTTCT
607
- ACTTCC
608
- ACTTCG
609
- ACTTGA
610
- ACTTGT
611
- ACTTGC
612
- ACTTGG
613
- ACTCAA
614
- ACTCAT
615
- ACTCAC
616
- ACTCAG
617
- ACTCTA
618
- ACTCTT
619
- ACTCTC
620
- ACTCTG
621
- ACTCCA
622
- ACTCCT
623
- ACTCCC
624
- ACTCCG
625
- ACTCGA
626
- ACTCGT
627
- ACTCGC
628
- ACTCGG
629
- ACTGAA
630
- ACTGAT
631
- ACTGAC
632
- ACTGAG
633
- ACTGTA
634
- ACTGTT
635
- ACTGTC
636
- ACTGTG
637
- ACTGCA
638
- ACTGCT
639
- ACTGCC
640
- ACTGCG
641
- ACTGGA
642
- ACTGGT
643
- ACTGGC
644
- ACTGGG
645
- ACCAAA
646
- ACCAAT
647
- ACCAAC
648
- ACCAAG
649
- ACCATA
650
- ACCATT
651
- ACCATC
652
- ACCATG
653
- ACCACA
654
- ACCACT
655
- ACCACC
656
- ACCACG
657
- ACCAGA
658
- ACCAGT
659
- ACCAGC
660
- ACCAGG
661
- ACCTAA
662
- ACCTAT
663
- ACCTAC
664
- ACCTAG
665
- ACCTTA
666
- ACCTTT
667
- ACCTTC
668
- ACCTTG
669
- ACCTCA
670
- ACCTCT
671
- ACCTCC
672
- ACCTCG
673
- ACCTGA
674
- ACCTGT
675
- ACCTGC
676
- ACCTGG
677
- ACCCAA
678
- ACCCAT
679
- ACCCAC
680
- ACCCAG
681
- ACCCTA
682
- ACCCTT
683
- ACCCTC
684
- ACCCTG
685
- ACCCCA
686
- ACCCCT
687
- ACCCCC
688
- ACCCCG
689
- ACCCGA
690
- ACCCGT
691
- ACCCGC
692
- ACCCGG
693
- ACCGAA
694
- ACCGAT
695
- ACCGAC
696
- ACCGAG
697
- ACCGTA
698
- ACCGTT
699
- ACCGTC
700
- ACCGTG
701
- ACCGCA
702
- ACCGCT
703
- ACCGCC
704
- ACCGCG
705
- ACCGGA
706
- ACCGGT
707
- ACCGGC
708
- ACCGGG
709
- ACGAAA
710
- ACGAAT
711
- ACGAAC
712
- ACGAAG
713
- ACGATA
714
- ACGATT
715
- ACGATC
716
- ACGATG
717
- ACGACA
718
- ACGACT
719
- ACGACC
720
- ACGACG
721
- ACGAGA
722
- ACGAGT
723
- ACGAGC
724
- ACGAGG
725
- ACGTAA
726
- ACGTAT
727
- ACGTAC
728
- ACGTAG
729
- ACGTTA
730
- ACGTTT
731
- ACGTTC
732
- ACGTTG
733
- ACGTCA
734
- ACGTCT
735
- ACGTCC
736
- ACGTCG
737
- ACGTGA
738
- ACGTGT
739
- ACGTGC
740
- ACGTGG
741
- ACGCAA
742
- ACGCAT
743
- ACGCAC
744
- ACGCAG
745
- ACGCTA
746
- ACGCTT
747
- ACGCTC
748
- ACGCTG
749
- ACGCCA
750
- ACGCCT
751
- ACGCCC
752
- ACGCCG
753
- ACGCGA
754
- ACGCGT
755
- ACGCGC
756
- ACGCGG
757
- ACGGAA
758
- ACGGAT
759
- ACGGAC
760
- ACGGAG
761
- ACGGTA
762
- ACGGTT
763
- ACGGTC
764
- ACGGTG
765
- ACGGCA
766
- ACGGCT
767
- ACGGCC
768
- ACGGCG
769
- ACGGGA
770
- ACGGGT
771
- ACGGGC
772
- ACGGGG
773
- AGAAAA
774
- AGAAAT
775
- AGAAAC
776
- AGAAAG
777
- AGAATA
778
- AGAATT
779
- AGAATC
780
- AGAATG
781
- AGAACA
782
- AGAACT
783
- AGAACC
784
- AGAACG
785
- AGAAGA
786
- AGAAGT
787
- AGAAGC
788
- AGAAGG
789
- AGATAA
790
- AGATAT
791
- AGATAC
792
- AGATAG
793
- AGATTA
794
- AGATTT
795
- AGATTC
796
- AGATTG
797
- AGATCA
798
- AGATCT
799
- AGATCC
800
- AGATCG
801
- AGATGA
802
- AGATGT
803
- AGATGC
804
- AGATGG
805
- AGACAA
806
- AGACAT
807
- AGACAC
808
- AGACAG
809
- AGACTA
810
- AGACTT
811
- AGACTC
812
- AGACTG
813
- AGACCA
814
- AGACCT
815
- AGACCC
816
- AGACCG
817
- AGACGA
818
- AGACGT
819
- AGACGC
820
- AGACGG
821
- AGAGAA
822
- AGAGAT
823
- AGAGAC
824
- AGAGAG
825
- AGAGTA
826
- AGAGTT
827
- AGAGTC
828
- AGAGTG
829
- AGAGCA
830
- AGAGCT
831
- AGAGCC
832
- AGAGCG
833
- AGAGGA
834
- AGAGGT
835
- AGAGGC
836
- AGAGGG
837
- AGTAAA
838
- AGTAAT
839
- AGTAAC
840
- AGTAAG
841
- AGTATA
842
- AGTATT
843
- AGTATC
844
- AGTATG
845
- AGTACA
846
- AGTACT
847
- AGTACC
848
- AGTACG
849
- AGTAGA
850
- AGTAGT
851
- AGTAGC
852
- AGTAGG
853
- AGTTAA
854
- AGTTAT
855
- AGTTAC
856
- AGTTAG
857
- AGTTTA
858
- AGTTTT
859
- AGTTTC
860
- AGTTTG
861
- AGTTCA
862
- AGTTCT
863
- AGTTCC
864
- AGTTCG
865
- AGTTGA
866
- AGTTGT
867
- AGTTGC
868
- AGTTGG
869
- AGTCAA
870
- AGTCAT
871
- AGTCAC
872
- AGTCAG
873
- AGTCTA
874
- AGTCTT
875
- AGTCTC
876
- AGTCTG
877
- AGTCCA
878
- AGTCCT
879
- AGTCCC
880
- AGTCCG
881
- AGTCGA
882
- AGTCGT
883
- AGTCGC
884
- AGTCGG
885
- AGTGAA
886
- AGTGAT
887
- AGTGAC
888
- AGTGAG
889
- AGTGTA
890
- AGTGTT
891
- AGTGTC
892
- AGTGTG
893
- AGTGCA
894
- AGTGCT
895
- AGTGCC
896
- AGTGCG
897
- AGTGGA
898
- AGTGGT
899
- AGTGGC
900
- AGTGGG
901
- AGCAAA
902
- AGCAAT
903
- AGCAAC
904
- AGCAAG
905
- AGCATA
906
- AGCATT
907
- AGCATC
908
- AGCATG
909
- AGCACA
910
- AGCACT
911
- AGCACC
912
- AGCACG
913
- AGCAGA
914
- AGCAGT
915
- AGCAGC
916
- AGCAGG
917
- AGCTAA
918
- AGCTAT
919
- AGCTAC
920
- AGCTAG
921
- AGCTTA
922
- AGCTTT
923
- AGCTTC
924
- AGCTTG
925
- AGCTCA
926
- AGCTCT
927
- AGCTCC
928
- AGCTCG
929
- AGCTGA
930
- AGCTGT
931
- AGCTGC
932
- AGCTGG
933
- AGCCAA
934
- AGCCAT
935
- AGCCAC
936
- AGCCAG
937
- AGCCTA
938
- AGCCTT
939
- AGCCTC
940
- AGCCTG
941
- AGCCCA
942
- AGCCCT
943
- AGCCCC
944
- AGCCCG
945
- AGCCGA
946
- AGCCGT
947
- AGCCGC
948
- AGCCGG
949
- AGCGAA
950
- AGCGAT
951
- AGCGAC
952
- AGCGAG
953
- AGCGTA
954
- AGCGTT
955
- AGCGTC
956
- AGCGTG
957
- AGCGCA
958
- AGCGCT
959
- AGCGCC
960
- AGCGCG
961
- AGCGGA
962
- AGCGGT
963
- AGCGGC
964
- AGCGGG
965
- AGGAAA
966
- AGGAAT
967
- AGGAAC
968
- AGGAAG
969
- AGGATA
970
- AGGATT
971
- AGGATC
972
- AGGATG
973
- AGGACA
974
- AGGACT
975
- AGGACC
976
- AGGACG
977
- AGGAGA
978
- AGGAGT
979
- AGGAGC
980
- AGGAGG
981
- AGGTAA
982
- AGGTAT
983
- AGGTAC
984
- AGGTAG
985
- AGGTTA
986
- AGGTTT
987
- AGGTTC
988
- AGGTTG
989
- AGGTCA
990
- AGGTCT
991
- AGGTCC
992
- AGGTCG
993
- AGGTGA
994
- AGGTGT
995
- AGGTGC
996
- AGGTGG
997
- AGGCAA
998
- AGGCAT
999
- AGGCAC
1000
- AGGCAG
1001
- AGGCTA
1002
- AGGCTT
1003
- AGGCTC
1004
- AGGCTG
1005
- AGGCCA
1006
- AGGCCT
1007
- AGGCCC
1008
- AGGCCG
1009
- AGGCGA
1010
- AGGCGT
1011
- AGGCGC
1012
- AGGCGG
1013
- AGGGAA
1014
- AGGGAT
1015
- AGGGAC
1016
- AGGGAG
1017
- AGGGTA
1018
- AGGGTT
1019
- AGGGTC
1020
- AGGGTG
1021
- AGGGCA
1022
- AGGGCT
1023
- AGGGCC
1024
- AGGGCG
1025
- AGGGGA
1026
- AGGGGT
1027
- AGGGGC
1028
- AGGGGG
1029
- TAAAAA
1030
- TAAAAT
1031
- TAAAAC
1032
- TAAAAG
1033
- TAAATA
1034
- TAAATT
1035
- TAAATC
1036
- TAAATG
1037
- TAAACA
1038
- TAAACT
1039
- TAAACC
1040
- TAAACG
1041
- TAAAGA
1042
- TAAAGT
1043
- TAAAGC
1044
- TAAAGG
1045
- TAATAA
1046
- TAATAT
1047
- TAATAC
1048
- TAATAG
1049
- TAATTA
1050
- TAATTT
1051
- TAATTC
1052
- TAATTG
1053
- TAATCA
1054
- TAATCT
1055
- TAATCC
1056
- TAATCG
1057
- TAATGA
1058
- TAATGT
1059
- TAATGC
1060
- TAATGG
1061
- TAACAA
1062
- TAACAT
1063
- TAACAC
1064
- TAACAG
1065
- TAACTA
1066
- TAACTT
1067
- TAACTC
1068
- TAACTG
1069
- TAACCA
1070
- TAACCT
1071
- TAACCC
1072
- TAACCG
1073
- TAACGA
1074
- TAACGT
1075
- TAACGC
1076
- TAACGG
1077
- TAAGAA
1078
- TAAGAT
1079
- TAAGAC
1080
- TAAGAG
1081
- TAAGTA
1082
- TAAGTT
1083
- TAAGTC
1084
- TAAGTG
1085
- TAAGCA
1086
- TAAGCT
1087
- TAAGCC
1088
- TAAGCG
1089
- TAAGGA
1090
- TAAGGT
1091
- TAAGGC
1092
- TAAGGG
1093
- TATAAA
1094
- TATAAT
1095
- TATAAC
1096
- TATAAG
1097
- TATATA
1098
- TATATT
1099
- TATATC
1100
- TATATG
1101
- TATACA
1102
- TATACT
1103
- TATACC
1104
- TATACG
1105
- TATAGA
1106
- TATAGT
1107
- TATAGC
1108
- TATAGG
1109
- TATTAA
1110
- TATTAT
1111
- TATTAC
1112
- TATTAG
1113
- TATTTA
1114
- TATTTT
1115
- TATTTC
1116
- TATTTG
1117
- TATTCA
1118
- TATTCT
1119
- TATTCC
1120
- TATTCG
1121
- TATTGA
1122
- TATTGT
1123
- TATTGC
1124
- TATTGG
1125
- TATCAA
1126
- TATCAT
1127
- TATCAC
1128
- TATCAG
1129
- TATCTA
1130
- TATCTT
1131
- TATCTC
1132
- TATCTG
1133
- TATCCA
1134
- TATCCT
1135
- TATCCC
1136
- TATCCG
1137
- TATCGA
1138
- TATCGT
1139
- TATCGC
1140
- TATCGG
1141
- TATGAA
1142
- TATGAT
1143
- TATGAC
1144
- TATGAG
1145
- TATGTA
1146
- TATGTT
1147
- TATGTC
1148
- TATGTG
1149
- TATGCA
1150
- TATGCT
1151
- TATGCC
1152
- TATGCG
1153
- TATGGA
1154
- TATGGT
1155
- TATGGC
1156
- TATGGG
1157
- TACAAA
1158
- TACAAT
1159
- TACAAC
1160
- TACAAG
1161
- TACATA
1162
- TACATT
1163
- TACATC
1164
- TACATG
1165
- TACACA
1166
- TACACT
1167
- TACACC
1168
- TACACG
1169
- TACAGA
1170
- TACAGT
1171
- TACAGC
1172
- TACAGG
1173
- TACTAA
1174
- TACTAT
1175
- TACTAC
1176
- TACTAG
1177
- TACTTA
1178
- TACTTT
1179
- TACTTC
1180
- TACTTG
1181
- TACTCA
1182
- TACTCT
1183
- TACTCC
1184
- TACTCG
1185
- TACTGA
1186
- TACTGT
1187
- TACTGC
1188
- TACTGG
1189
- TACCAA
1190
- TACCAT
1191
- TACCAC
1192
- TACCAG
1193
- TACCTA
1194
- TACCTT
1195
- TACCTC
1196
- TACCTG
1197
- TACCCA
1198
- TACCCT
1199
- TACCCC
1200
- TACCCG
1201
- TACCGA
1202
- TACCGT
1203
- TACCGC
1204
- TACCGG
1205
- TACGAA
1206
- TACGAT
1207
- TACGAC
1208
- TACGAG
1209
- TACGTA
1210
- TACGTT
1211
- TACGTC
1212
- TACGTG
1213
- TACGCA
1214
- TACGCT
1215
- TACGCC
1216
- TACGCG
1217
- TACGGA
1218
- TACGGT
1219
- TACGGC
1220
- TACGGG
1221
- TAGAAA
1222
- TAGAAT
1223
- TAGAAC
1224
- TAGAAG
1225
- TAGATA
1226
- TAGATT
1227
- TAGATC
1228
- TAGATG
1229
- TAGACA
1230
- TAGACT
1231
- TAGACC
1232
- TAGACG
1233
- TAGAGA
1234
- TAGAGT
1235
- TAGAGC
1236
- TAGAGG
1237
- TAGTAA
1238
- TAGTAT
1239
- TAGTAC
1240
- TAGTAG
1241
- TAGTTA
1242
- TAGTTT
1243
- TAGTTC
1244
- TAGTTG
1245
- TAGTCA
1246
- TAGTCT
1247
- TAGTCC
1248
- TAGTCG
1249
- TAGTGA
1250
- TAGTGT
1251
- TAGTGC
1252
- TAGTGG
1253
- TAGCAA
1254
- TAGCAT
1255
- TAGCAC
1256
- TAGCAG
1257
- TAGCTA
1258
- TAGCTT
1259
- TAGCTC
1260
- TAGCTG
1261
- TAGCCA
1262
- TAGCCT
1263
- TAGCCC
1264
- TAGCCG
1265
- TAGCGA
1266
- TAGCGT
1267
- TAGCGC
1268
- TAGCGG
1269
- TAGGAA
1270
- TAGGAT
1271
- TAGGAC
1272
- TAGGAG
1273
- TAGGTA
1274
- TAGGTT
1275
- TAGGTC
1276
- TAGGTG
1277
- TAGGCA
1278
- TAGGCT
1279
- TAGGCC
1280
- TAGGCG
1281
- TAGGGA
1282
- TAGGGT
1283
- TAGGGC
1284
- TAGGGG
1285
- TTAAAA
1286
- TTAAAT
1287
- TTAAAC
1288
- TTAAAG
1289
- TTAATA
1290
- TTAATT
1291
- TTAATC
1292
- TTAATG
1293
- TTAACA
1294
- TTAACT
1295
- TTAACC
1296
- TTAACG
1297
- TTAAGA
1298
- TTAAGT
1299
- TTAAGC
1300
- TTAAGG
1301
- TTATAA
1302
- TTATAT
1303
- TTATAC
1304
- TTATAG
1305
- TTATTA
1306
- TTATTT
1307
- TTATTC
1308
- TTATTG
1309
- TTATCA
1310
- TTATCT
1311
- TTATCC
1312
- TTATCG
1313
- TTATGA
1314
- TTATGT
1315
- TTATGC
1316
- TTATGG
1317
- TTACAA
1318
- TTACAT
1319
- TTACAC
1320
- TTACAG
1321
- TTACTA
1322
- TTACTT
1323
- TTACTC
1324
- TTACTG
1325
- TTACCA
1326
- TTACCT
1327
- TTACCC
1328
- TTACCG
1329
- TTACGA
1330
- TTACGT
1331
- TTACGC
1332
- TTACGG
1333
- TTAGAA
1334
- TTAGAT
1335
- TTAGAC
1336
- TTAGAG
1337
- TTAGTA
1338
- TTAGTT
1339
- TTAGTC
1340
- TTAGTG
1341
- TTAGCA
1342
- TTAGCT
1343
- TTAGCC
1344
- TTAGCG
1345
- TTAGGA
1346
- TTAGGT
1347
- TTAGGC
1348
- TTAGGG
1349
- TTTAAA
1350
- TTTAAT
1351
- TTTAAC
1352
- TTTAAG
1353
- TTTATA
1354
- TTTATT
1355
- TTTATC
1356
- TTTATG
1357
- TTTACA
1358
- TTTACT
1359
- TTTACC
1360
- TTTACG
1361
- TTTAGA
1362
- TTTAGT
1363
- TTTAGC
1364
- TTTAGG
1365
- TTTTAA
1366
- TTTTAT
1367
- TTTTAC
1368
- TTTTAG
1369
- TTTTTA
1370
- TTTTTT
1371
- TTTTTC
1372
- TTTTTG
1373
- TTTTCA
1374
- TTTTCT
1375
- TTTTCC
1376
- TTTTCG
1377
- TTTTGA
1378
- TTTTGT
1379
- TTTTGC
1380
- TTTTGG
1381
- TTTCAA
1382
- TTTCAT
1383
- TTTCAC
1384
- TTTCAG
1385
- TTTCTA
1386
- TTTCTT
1387
- TTTCTC
1388
- TTTCTG
1389
- TTTCCA
1390
- TTTCCT
1391
- TTTCCC
1392
- TTTCCG
1393
- TTTCGA
1394
- TTTCGT
1395
- TTTCGC
1396
- TTTCGG
1397
- TTTGAA
1398
- TTTGAT
1399
- TTTGAC
1400
- TTTGAG
1401
- TTTGTA
1402
- TTTGTT
1403
- TTTGTC
1404
- TTTGTG
1405
- TTTGCA
1406
- TTTGCT
1407
- TTTGCC
1408
- TTTGCG
1409
- TTTGGA
1410
- TTTGGT
1411
- TTTGGC
1412
- TTTGGG
1413
- TTCAAA
1414
- TTCAAT
1415
- TTCAAC
1416
- TTCAAG
1417
- TTCATA
1418
- TTCATT
1419
- TTCATC
1420
- TTCATG
1421
- TTCACA
1422
- TTCACT
1423
- TTCACC
1424
- TTCACG
1425
- TTCAGA
1426
- TTCAGT
1427
- TTCAGC
1428
- TTCAGG
1429
- TTCTAA
1430
- TTCTAT
1431
- TTCTAC
1432
- TTCTAG
1433
- TTCTTA
1434
- TTCTTT
1435
- TTCTTC
1436
- TTCTTG
1437
- TTCTCA
1438
- TTCTCT
1439
- TTCTCC
1440
- TTCTCG
1441
- TTCTGA
1442
- TTCTGT
1443
- TTCTGC
1444
- TTCTGG
1445
- TTCCAA
1446
- TTCCAT
1447
- TTCCAC
1448
- TTCCAG
1449
- TTCCTA
1450
- TTCCTT
1451
- TTCCTC
1452
- TTCCTG
1453
- TTCCCA
1454
- TTCCCT
1455
- TTCCCC
1456
- TTCCCG
1457
- TTCCGA
1458
- TTCCGT
1459
- TTCCGC
1460
- TTCCGG
1461
- TTCGAA
1462
- TTCGAT
1463
- TTCGAC
1464
- TTCGAG
1465
- TTCGTA
1466
- TTCGTT
1467
- TTCGTC
1468
- TTCGTG
1469
- TTCGCA
1470
- TTCGCT
1471
- TTCGCC
1472
- TTCGCG
1473
- TTCGGA
1474
- TTCGGT
1475
- TTCGGC
1476
- TTCGGG
1477
- TTGAAA
1478
- TTGAAT
1479
- TTGAAC
1480
- TTGAAG
1481
- TTGATA
1482
- TTGATT
1483
- TTGATC
1484
- TTGATG
1485
- TTGACA
1486
- TTGACT
1487
- TTGACC
1488
- TTGACG
1489
- TTGAGA
1490
- TTGAGT
1491
- TTGAGC
1492
- TTGAGG
1493
- TTGTAA
1494
- TTGTAT
1495
- TTGTAC
1496
- TTGTAG
1497
- TTGTTA
1498
- TTGTTT
1499
- TTGTTC
1500
- TTGTTG
1501
- TTGTCA
1502
- TTGTCT
1503
- TTGTCC
1504
- TTGTCG
1505
- TTGTGA
1506
- TTGTGT
1507
- TTGTGC
1508
- TTGTGG
1509
- TTGCAA
1510
- TTGCAT
1511
- TTGCAC
1512
- TTGCAG
1513
- TTGCTA
1514
- TTGCTT
1515
- TTGCTC
1516
- TTGCTG
1517
- TTGCCA
1518
- TTGCCT
1519
- TTGCCC
1520
- TTGCCG
1521
- TTGCGA
1522
- TTGCGT
1523
- TTGCGC
1524
- TTGCGG
1525
- TTGGAA
1526
- TTGGAT
1527
- TTGGAC
1528
- TTGGAG
1529
- TTGGTA
1530
- TTGGTT
1531
- TTGGTC
1532
- TTGGTG
1533
- TTGGCA
1534
- TTGGCT
1535
- TTGGCC
1536
- TTGGCG
1537
- TTGGGA
1538
- TTGGGT
1539
- TTGGGC
1540
- TTGGGG
1541
- TCAAAA
1542
- TCAAAT
1543
- TCAAAC
1544
- TCAAAG
1545
- TCAATA
1546
- TCAATT
1547
- TCAATC
1548
- TCAATG
1549
- TCAACA
1550
- TCAACT
1551
- TCAACC
1552
- TCAACG
1553
- TCAAGA
1554
- TCAAGT
1555
- TCAAGC
1556
- TCAAGG
1557
- TCATAA
1558
- TCATAT
1559
- TCATAC
1560
- TCATAG
1561
- TCATTA
1562
- TCATTT
1563
- TCATTC
1564
- TCATTG
1565
- TCATCA
1566
- TCATCT
1567
- TCATCC
1568
- TCATCG
1569
- TCATGA
1570
- TCATGT
1571
- TCATGC
1572
- TCATGG
1573
- TCACAA
1574
- TCACAT
1575
- TCACAC
1576
- TCACAG
1577
- TCACTA
1578
- TCACTT
1579
- TCACTC
1580
- TCACTG
1581
- TCACCA
1582
- TCACCT
1583
- TCACCC
1584
- TCACCG
1585
- TCACGA
1586
- TCACGT
1587
- TCACGC
1588
- TCACGG
1589
- TCAGAA
1590
- TCAGAT
1591
- TCAGAC
1592
- TCAGAG
1593
- TCAGTA
1594
- TCAGTT
1595
- TCAGTC
1596
- TCAGTG
1597
- TCAGCA
1598
- TCAGCT
1599
- TCAGCC
1600
- TCAGCG
1601
- TCAGGA
1602
- TCAGGT
1603
- TCAGGC
1604
- TCAGGG
1605
- TCTAAA
1606
- TCTAAT
1607
- TCTAAC
1608
- TCTAAG
1609
- TCTATA
1610
- TCTATT
1611
- TCTATC
1612
- TCTATG
1613
- TCTACA
1614
- TCTACT
1615
- TCTACC
1616
- TCTACG
1617
- TCTAGA
1618
- TCTAGT
1619
- TCTAGC
1620
- TCTAGG
1621
- TCTTAA
1622
- TCTTAT
1623
- TCTTAC
1624
- TCTTAG
1625
- TCTTTA
1626
- TCTTTT
1627
- TCTTTC
1628
- TCTTTG
1629
- TCTTCA
1630
- TCTTCT
1631
- TCTTCC
1632
- TCTTCG
1633
- TCTTGA
1634
- TCTTGT
1635
- TCTTGC
1636
- TCTTGG
1637
- TCTCAA
1638
- TCTCAT
1639
- TCTCAC
1640
- TCTCAG
1641
- TCTCTA
1642
- TCTCTT
1643
- TCTCTC
1644
- TCTCTG
1645
- TCTCCA
1646
- TCTCCT
1647
- TCTCCC
1648
- TCTCCG
1649
- TCTCGA
1650
- TCTCGT
1651
- TCTCGC
1652
- TCTCGG
1653
- TCTGAA
1654
- TCTGAT
1655
- TCTGAC
1656
- TCTGAG
1657
- TCTGTA
1658
- TCTGTT
1659
- TCTGTC
1660
- TCTGTG
1661
- TCTGCA
1662
- TCTGCT
1663
- TCTGCC
1664
- TCTGCG
1665
- TCTGGA
1666
- TCTGGT
1667
- TCTGGC
1668
- TCTGGG
1669
- TCCAAA
1670
- TCCAAT
1671
- TCCAAC
1672
- TCCAAG
1673
- TCCATA
1674
- TCCATT
1675
- TCCATC
1676
- TCCATG
1677
- TCCACA
1678
- TCCACT
1679
- TCCACC
1680
- TCCACG
1681
- TCCAGA
1682
- TCCAGT
1683
- TCCAGC
1684
- TCCAGG
1685
- TCCTAA
1686
- TCCTAT
1687
- TCCTAC
1688
- TCCTAG
1689
- TCCTTA
1690
- TCCTTT
1691
- TCCTTC
1692
- TCCTTG
1693
- TCCTCA
1694
- TCCTCT
1695
- TCCTCC
1696
- TCCTCG
1697
- TCCTGA
1698
- TCCTGT
1699
- TCCTGC
1700
- TCCTGG
1701
- TCCCAA
1702
- TCCCAT
1703
- TCCCAC
1704
- TCCCAG
1705
- TCCCTA
1706
- TCCCTT
1707
- TCCCTC
1708
- TCCCTG
1709
- TCCCCA
1710
- TCCCCT
1711
- TCCCCC
1712
- TCCCCG
1713
- TCCCGA
1714
- TCCCGT
1715
- TCCCGC
1716
- TCCCGG
1717
- TCCGAA
1718
- TCCGAT
1719
- TCCGAC
1720
- TCCGAG
1721
- TCCGTA
1722
- TCCGTT
1723
- TCCGTC
1724
- TCCGTG
1725
- TCCGCA
1726
- TCCGCT
1727
- TCCGCC
1728
- TCCGCG
1729
- TCCGGA
1730
- TCCGGT
1731
- TCCGGC
1732
- TCCGGG
1733
- TCGAAA
1734
- TCGAAT
1735
- TCGAAC
1736
- TCGAAG
1737
- TCGATA
1738
- TCGATT
1739
- TCGATC
1740
- TCGATG
1741
- TCGACA
1742
- TCGACT
1743
- TCGACC
1744
- TCGACG
1745
- TCGAGA
1746
- TCGAGT
1747
- TCGAGC
1748
- TCGAGG
1749
- TCGTAA
1750
- TCGTAT
1751
- TCGTAC
1752
- TCGTAG
1753
- TCGTTA
1754
- TCGTTT
1755
- TCGTTC
1756
- TCGTTG
1757
- TCGTCA
1758
- TCGTCT
1759
- TCGTCC
1760
- TCGTCG
1761
- TCGTGA
1762
- TCGTGT
1763
- TCGTGC
1764
- TCGTGG
1765
- TCGCAA
1766
- TCGCAT
1767
- TCGCAC
1768
- TCGCAG
1769
- TCGCTA
1770
- TCGCTT
1771
- TCGCTC
1772
- TCGCTG
1773
- TCGCCA
1774
- TCGCCT
1775
- TCGCCC
1776
- TCGCCG
1777
- TCGCGA
1778
- TCGCGT
1779
- TCGCGC
1780
- TCGCGG
1781
- TCGGAA
1782
- TCGGAT
1783
- TCGGAC
1784
- TCGGAG
1785
- TCGGTA
1786
- TCGGTT
1787
- TCGGTC
1788
- TCGGTG
1789
- TCGGCA
1790
- TCGGCT
1791
- TCGGCC
1792
- TCGGCG
1793
- TCGGGA
1794
- TCGGGT
1795
- TCGGGC
1796
- TCGGGG
1797
- TGAAAA
1798
- TGAAAT
1799
- TGAAAC
1800
- TGAAAG
1801
- TGAATA
1802
- TGAATT
1803
- TGAATC
1804
- TGAATG
1805
- TGAACA
1806
- TGAACT
1807
- TGAACC
1808
- TGAACG
1809
- TGAAGA
1810
- TGAAGT
1811
- TGAAGC
1812
- TGAAGG
1813
- TGATAA
1814
- TGATAT
1815
- TGATAC
1816
- TGATAG
1817
- TGATTA
1818
- TGATTT
1819
- TGATTC
1820
- TGATTG
1821
- TGATCA
1822
- TGATCT
1823
- TGATCC
1824
- TGATCG
1825
- TGATGA
1826
- TGATGT
1827
- TGATGC
1828
- TGATGG
1829
- TGACAA
1830
- TGACAT
1831
- TGACAC
1832
- TGACAG
1833
- TGACTA
1834
- TGACTT
1835
- TGACTC
1836
- TGACTG
1837
- TGACCA
1838
- TGACCT
1839
- TGACCC
1840
- TGACCG
1841
- TGACGA
1842
- TGACGT
1843
- TGACGC
1844
- TGACGG
1845
- TGAGAA
1846
- TGAGAT
1847
- TGAGAC
1848
- TGAGAG
1849
- TGAGTA
1850
- TGAGTT
1851
- TGAGTC
1852
- TGAGTG
1853
- TGAGCA
1854
- TGAGCT
1855
- TGAGCC
1856
- TGAGCG
1857
- TGAGGA
1858
- TGAGGT
1859
- TGAGGC
1860
- TGAGGG
1861
- TGTAAA
1862
- TGTAAT
1863
- TGTAAC
1864
- TGTAAG
1865
- TGTATA
1866
- TGTATT
1867
- TGTATC
1868
- TGTATG
1869
- TGTACA
1870
- TGTACT
1871
- TGTACC
1872
- TGTACG
1873
- TGTAGA
1874
- TGTAGT
1875
- TGTAGC
1876
- TGTAGG
1877
- TGTTAA
1878
- TGTTAT
1879
- TGTTAC
1880
- TGTTAG
1881
- TGTTTA
1882
- TGTTTT
1883
- TGTTTC
1884
- TGTTTG
1885
- TGTTCA
1886
- TGTTCT
1887
- TGTTCC
1888
- TGTTCG
1889
- TGTTGA
1890
- TGTTGT
1891
- TGTTGC
1892
- TGTTGG
1893
- TGTCAA
1894
- TGTCAT
1895
- TGTCAC
1896
- TGTCAG
1897
- TGTCTA
1898
- TGTCTT
1899
- TGTCTC
1900
- TGTCTG
1901
- TGTCCA
1902
- TGTCCT
1903
- TGTCCC
1904
- TGTCCG
1905
- TGTCGA
1906
- TGTCGT
1907
- TGTCGC
1908
- TGTCGG
1909
- TGTGAA
1910
- TGTGAT
1911
- TGTGAC
1912
- TGTGAG
1913
- TGTGTA
1914
- TGTGTT
1915
- TGTGTC
1916
- TGTGTG
1917
- TGTGCA
1918
- TGTGCT
1919
- TGTGCC
1920
- TGTGCG
1921
- TGTGGA
1922
- TGTGGT
1923
- TGTGGC
1924
- TGTGGG
1925
- TGCAAA
1926
- TGCAAT
1927
- TGCAAC
1928
- TGCAAG
1929
- TGCATA
1930
- TGCATT
1931
- TGCATC
1932
- TGCATG
1933
- TGCACA
1934
- TGCACT
1935
- TGCACC
1936
- TGCACG
1937
- TGCAGA
1938
- TGCAGT
1939
- TGCAGC
1940
- TGCAGG
1941
- TGCTAA
1942
- TGCTAT
1943
- TGCTAC
1944
- TGCTAG
1945
- TGCTTA
1946
- TGCTTT
1947
- TGCTTC
1948
- TGCTTG
1949
- TGCTCA
1950
- TGCTCT
1951
- TGCTCC
1952
- TGCTCG
1953
- TGCTGA
1954
- TGCTGT
1955
- TGCTGC
1956
- TGCTGG
1957
- TGCCAA
1958
- TGCCAT
1959
- TGCCAC
1960
- TGCCAG
1961
- TGCCTA
1962
- TGCCTT
1963
- TGCCTC
1964
- TGCCTG
1965
- TGCCCA
1966
- TGCCCT
1967
- TGCCCC
1968
- TGCCCG
1969
- TGCCGA
1970
- TGCCGT
1971
- TGCCGC
1972
- TGCCGG
1973
- TGCGAA
1974
- TGCGAT
1975
- TGCGAC
1976
- TGCGAG
1977
- TGCGTA
1978
- TGCGTT
1979
- TGCGTC
1980
- TGCGTG
1981
- TGCGCA
1982
- TGCGCT
1983
- TGCGCC
1984
- TGCGCG
1985
- TGCGGA
1986
- TGCGGT
1987
- TGCGGC
1988
- TGCGGG
1989
- TGGAAA
1990
- TGGAAT
1991
- TGGAAC
1992
- TGGAAG
1993
- TGGATA
1994
- TGGATT
1995
- TGGATC
1996
- TGGATG
1997
- TGGACA
1998
- TGGACT
1999
- TGGACC
2000
- TGGACG
2001
- TGGAGA
2002
- TGGAGT
2003
- TGGAGC
2004
- TGGAGG
2005
- TGGTAA
2006
- TGGTAT
2007
- TGGTAC
2008
- TGGTAG
2009
- TGGTTA
2010
- TGGTTT
2011
- TGGTTC
2012
- TGGTTG
2013
- TGGTCA
2014
- TGGTCT
2015
- TGGTCC
2016
- TGGTCG
2017
- TGGTGA
2018
- TGGTGT
2019
- TGGTGC
2020
- TGGTGG
2021
- TGGCAA
2022
- TGGCAT
2023
- TGGCAC
2024
- TGGCAG
2025
- TGGCTA
2026
- TGGCTT
2027
- TGGCTC
2028
- TGGCTG
2029
- TGGCCA
2030
- TGGCCT
2031
- TGGCCC
2032
- TGGCCG
2033
- TGGCGA
2034
- TGGCGT
2035
- TGGCGC
2036
- TGGCGG
2037
- TGGGAA
2038
- TGGGAT
2039
- TGGGAC
2040
- TGGGAG
2041
- TGGGTA
2042
- TGGGTT
2043
- TGGGTC
2044
- TGGGTG
2045
- TGGGCA
2046
- TGGGCT
2047
- TGGGCC
2048
- TGGGCG
2049
- TGGGGA
2050
- TGGGGT
2051
- TGGGGC
2052
- TGGGGG
2053
- CAAAAA
2054
- CAAAAT
2055
- CAAAAC
2056
- CAAAAG
2057
- CAAATA
2058
- CAAATT
2059
- CAAATC
2060
- CAAATG
2061
- CAAACA
2062
- CAAACT
2063
- CAAACC
2064
- CAAACG
2065
- CAAAGA
2066
- CAAAGT
2067
- CAAAGC
2068
- CAAAGG
2069
- CAATAA
2070
- CAATAT
2071
- CAATAC
2072
- CAATAG
2073
- CAATTA
2074
- CAATTT
2075
- CAATTC
2076
- CAATTG
2077
- CAATCA
2078
- CAATCT
2079
- CAATCC
2080
- CAATCG
2081
- CAATGA
2082
- CAATGT
2083
- CAATGC
2084
- CAATGG
2085
- CAACAA
2086
- CAACAT
2087
- CAACAC
2088
- CAACAG
2089
- CAACTA
2090
- CAACTT
2091
- CAACTC
2092
- CAACTG
2093
- CAACCA
2094
- CAACCT
2095
- CAACCC
2096
- CAACCG
2097
- CAACGA
2098
- CAACGT
2099
- CAACGC
2100
- CAACGG
2101
- CAAGAA
2102
- CAAGAT
2103
- CAAGAC
2104
- CAAGAG
2105
- CAAGTA
2106
- CAAGTT
2107
- CAAGTC
2108
- CAAGTG
2109
- CAAGCA
2110
- CAAGCT
2111
- CAAGCC
2112
- CAAGCG
2113
- CAAGGA
2114
- CAAGGT
2115
- CAAGGC
2116
- CAAGGG
2117
- CATAAA
2118
- CATAAT
2119
- CATAAC
2120
- CATAAG
2121
- CATATA
2122
- CATATT
2123
- CATATC
2124
- CATATG
2125
- CATACA
2126
- CATACT
2127
- CATACC
2128
- CATACG
2129
- CATAGA
2130
- CATAGT
2131
- CATAGC
2132
- CATAGG
2133
- CATTAA
2134
- CATTAT
2135
- CATTAC
2136
- CATTAG
2137
- CATTTA
2138
- CATTTT
2139
- CATTTC
2140
- CATTTG
2141
- CATTCA
2142
- CATTCT
2143
- CATTCC
2144
- CATTCG
2145
- CATTGA
2146
- CATTGT
2147
- CATTGC
2148
- CATTGG
2149
- CATCAA
2150
- CATCAT
2151
- CATCAC
2152
- CATCAG
2153
- CATCTA
2154
- CATCTT
2155
- CATCTC
2156
- CATCTG
2157
- CATCCA
2158
- CATCCT
2159
- CATCCC
2160
- CATCCG
2161
- CATCGA
2162
- CATCGT
2163
- CATCGC
2164
- CATCGG
2165
- CATGAA
2166
- CATGAT
2167
- CATGAC
2168
- CATGAG
2169
- CATGTA
2170
- CATGTT
2171
- CATGTC
2172
- CATGTG
2173
- CATGCA
2174
- CATGCT
2175
- CATGCC
2176
- CATGCG
2177
- CATGGA
2178
- CATGGT
2179
- CATGGC
2180
- CATGGG
2181
- CACAAA
2182
- CACAAT
2183
- CACAAC
2184
- CACAAG
2185
- CACATA
2186
- CACATT
2187
- CACATC
2188
- CACATG
2189
- CACACA
2190
- CACACT
2191
- CACACC
2192
- CACACG
2193
- CACAGA
2194
- CACAGT
2195
- CACAGC
2196
- CACAGG
2197
- CACTAA
2198
- CACTAT
2199
- CACTAC
2200
- CACTAG
2201
- CACTTA
2202
- CACTTT
2203
- CACTTC
2204
- CACTTG
2205
- CACTCA
2206
- CACTCT
2207
- CACTCC
2208
- CACTCG
2209
- CACTGA
2210
- CACTGT
2211
- CACTGC
2212
- CACTGG
2213
- CACCAA
2214
- CACCAT
2215
- CACCAC
2216
- CACCAG
2217
- CACCTA
2218
- CACCTT
2219
- CACCTC
2220
- CACCTG
2221
- CACCCA
2222
- CACCCT
2223
- CACCCC
2224
- CACCCG
2225
- CACCGA
2226
- CACCGT
2227
- CACCGC
2228
- CACCGG
2229
- CACGAA
2230
- CACGAT
2231
- CACGAC
2232
- CACGAG
2233
- CACGTA
2234
- CACGTT
2235
- CACGTC
2236
- CACGTG
2237
- CACGCA
2238
- CACGCT
2239
- CACGCC
2240
- CACGCG
2241
- CACGGA
2242
- CACGGT
2243
- CACGGC
2244
- CACGGG
2245
- CAGAAA
2246
- CAGAAT
2247
- CAGAAC
2248
- CAGAAG
2249
- CAGATA
2250
- CAGATT
2251
- CAGATC
2252
- CAGATG
2253
- CAGACA
2254
- CAGACT
2255
- CAGACC
2256
- CAGACG
2257
- CAGAGA
2258
- CAGAGT
2259
- CAGAGC
2260
- CAGAGG
2261
- CAGTAA
2262
- CAGTAT
2263
- CAGTAC
2264
- CAGTAG
2265
- CAGTTA
2266
- CAGTTT
2267
- CAGTTC
2268
- CAGTTG
2269
- CAGTCA
2270
- CAGTCT
2271
- CAGTCC
2272
- CAGTCG
2273
- CAGTGA
2274
- CAGTGT
2275
- CAGTGC
2276
- CAGTGG
2277
- CAGCAA
2278
- CAGCAT
2279
- CAGCAC
2280
- CAGCAG
2281
- CAGCTA
2282
- CAGCTT
2283
- CAGCTC
2284
- CAGCTG
2285
- CAGCCA
2286
- CAGCCT
2287
- CAGCCC
2288
- CAGCCG
2289
- CAGCGA
2290
- CAGCGT
2291
- CAGCGC
2292
- CAGCGG
2293
- CAGGAA
2294
- CAGGAT
2295
- CAGGAC
2296
- CAGGAG
2297
- CAGGTA
2298
- CAGGTT
2299
- CAGGTC
2300
- CAGGTG
2301
- CAGGCA
2302
- CAGGCT
2303
- CAGGCC
2304
- CAGGCG
2305
- CAGGGA
2306
- CAGGGT
2307
- CAGGGC
2308
- CAGGGG
2309
- CTAAAA
2310
- CTAAAT
2311
- CTAAAC
2312
- CTAAAG
2313
- CTAATA
2314
- CTAATT
2315
- CTAATC
2316
- CTAATG
2317
- CTAACA
2318
- CTAACT
2319
- CTAACC
2320
- CTAACG
2321
- CTAAGA
2322
- CTAAGT
2323
- CTAAGC
2324
- CTAAGG
2325
- CTATAA
2326
- CTATAT
2327
- CTATAC
2328
- CTATAG
2329
- CTATTA
2330
- CTATTT
2331
- CTATTC
2332
- CTATTG
2333
- CTATCA
2334
- CTATCT
2335
- CTATCC
2336
- CTATCG
2337
- CTATGA
2338
- CTATGT
2339
- CTATGC
2340
- CTATGG
2341
- CTACAA
2342
- CTACAT
2343
- CTACAC
2344
- CTACAG
2345
- CTACTA
2346
- CTACTT
2347
- CTACTC
2348
- CTACTG
2349
- CTACCA
2350
- CTACCT
2351
- CTACCC
2352
- CTACCG
2353
- CTACGA
2354
- CTACGT
2355
- CTACGC
2356
- CTACGG
2357
- CTAGAA
2358
- CTAGAT
2359
- CTAGAC
2360
- CTAGAG
2361
- CTAGTA
2362
- CTAGTT
2363
- CTAGTC
2364
- CTAGTG
2365
- CTAGCA
2366
- CTAGCT
2367
- CTAGCC
2368
- CTAGCG
2369
- CTAGGA
2370
- CTAGGT
2371
- CTAGGC
2372
- CTAGGG
2373
- CTTAAA
2374
- CTTAAT
2375
- CTTAAC
2376
- CTTAAG
2377
- CTTATA
2378
- CTTATT
2379
- CTTATC
2380
- CTTATG
2381
- CTTACA
2382
- CTTACT
2383
- CTTACC
2384
- CTTACG
2385
- CTTAGA
2386
- CTTAGT
2387
- CTTAGC
2388
- CTTAGG
2389
- CTTTAA
2390
- CTTTAT
2391
- CTTTAC
2392
- CTTTAG
2393
- CTTTTA
2394
- CTTTTT
2395
- CTTTTC
2396
- CTTTTG
2397
- CTTTCA
2398
- CTTTCT
2399
- CTTTCC
2400
- CTTTCG
2401
- CTTTGA
2402
- CTTTGT
2403
- CTTTGC
2404
- CTTTGG
2405
- CTTCAA
2406
- CTTCAT
2407
- CTTCAC
2408
- CTTCAG
2409
- CTTCTA
2410
- CTTCTT
2411
- CTTCTC
2412
- CTTCTG
2413
- CTTCCA
2414
- CTTCCT
2415
- CTTCCC
2416
- CTTCCG
2417
- CTTCGA
2418
- CTTCGT
2419
- CTTCGC
2420
- CTTCGG
2421
- CTTGAA
2422
- CTTGAT
2423
- CTTGAC
2424
- CTTGAG
2425
- CTTGTA
2426
- CTTGTT
2427
- CTTGTC
2428
- CTTGTG
2429
- CTTGCA
2430
- CTTGCT
2431
- CTTGCC
2432
- CTTGCG
2433
- CTTGGA
2434
- CTTGGT
2435
- CTTGGC
2436
- CTTGGG
2437
- CTCAAA
2438
- CTCAAT
2439
- CTCAAC
2440
- CTCAAG
2441
- CTCATA
2442
- CTCATT
2443
- CTCATC
2444
- CTCATG
2445
- CTCACA
2446
- CTCACT
2447
- CTCACC
2448
- CTCACG
2449
- CTCAGA
2450
- CTCAGT
2451
- CTCAGC
2452
- CTCAGG
2453
- CTCTAA
2454
- CTCTAT
2455
- CTCTAC
2456
- CTCTAG
2457
- CTCTTA
2458
- CTCTTT
2459
- CTCTTC
2460
- CTCTTG
2461
- CTCTCA
2462
- CTCTCT
2463
- CTCTCC
2464
- CTCTCG
2465
- CTCTGA
2466
- CTCTGT
2467
- CTCTGC
2468
- CTCTGG
2469
- CTCCAA
2470
- CTCCAT
2471
- CTCCAC
2472
- CTCCAG
2473
- CTCCTA
2474
- CTCCTT
2475
- CTCCTC
2476
- CTCCTG
2477
- CTCCCA
2478
- CTCCCT
2479
- CTCCCC
2480
- CTCCCG
2481
- CTCCGA
2482
- CTCCGT
2483
- CTCCGC
2484
- CTCCGG
2485
- CTCGAA
2486
- CTCGAT
2487
- CTCGAC
2488
- CTCGAG
2489
- CTCGTA
2490
- CTCGTT
2491
- CTCGTC
2492
- CTCGTG
2493
- CTCGCA
2494
- CTCGCT
2495
- CTCGCC
2496
- CTCGCG
2497
- CTCGGA
2498
- CTCGGT
2499
- CTCGGC
2500
- CTCGGG
2501
- CTGAAA
2502
- CTGAAT
2503
- CTGAAC
2504
- CTGAAG
2505
- CTGATA
2506
- CTGATT
2507
- CTGATC
2508
- CTGATG
2509
- CTGACA
2510
- CTGACT
2511
- CTGACC
2512
- CTGACG
2513
- CTGAGA
2514
- CTGAGT
2515
- CTGAGC
2516
- CTGAGG
2517
- CTGTAA
2518
- CTGTAT
2519
- CTGTAC
2520
- CTGTAG
2521
- CTGTTA
2522
- CTGTTT
2523
- CTGTTC
2524
- CTGTTG
2525
- CTGTCA
2526
- CTGTCT
2527
- CTGTCC
2528
- CTGTCG
2529
- CTGTGA
2530
- CTGTGT
2531
- CTGTGC
2532
- CTGTGG
2533
- CTGCAA
2534
- CTGCAT
2535
- CTGCAC
2536
- CTGCAG
2537
- CTGCTA
2538
- CTGCTT
2539
- CTGCTC
2540
- CTGCTG
2541
- CTGCCA
2542
- CTGCCT
2543
- CTGCCC
2544
- CTGCCG
2545
- CTGCGA
2546
- CTGCGT
2547
- CTGCGC
2548
- CTGCGG
2549
- CTGGAA
2550
- CTGGAT
2551
- CTGGAC
2552
- CTGGAG
2553
- CTGGTA
2554
- CTGGTT
2555
- CTGGTC
2556
- CTGGTG
2557
- CTGGCA
2558
- CTGGCT
2559
- CTGGCC
2560
- CTGGCG
2561
- CTGGGA
2562
- CTGGGT
2563
- CTGGGC
2564
- CTGGGG
2565
- CCAAAA
2566
- CCAAAT
2567
- CCAAAC
2568
- CCAAAG
2569
- CCAATA
2570
- CCAATT
2571
- CCAATC
2572
- CCAATG
2573
- CCAACA
2574
- CCAACT
2575
- CCAACC
2576
- CCAACG
2577
- CCAAGA
2578
- CCAAGT
2579
- CCAAGC
2580
- CCAAGG
2581
- CCATAA
2582
- CCATAT
2583
- CCATAC
2584
- CCATAG
2585
- CCATTA
2586
- CCATTT
2587
- CCATTC
2588
- CCATTG
2589
- CCATCA
2590
- CCATCT
2591
- CCATCC
2592
- CCATCG
2593
- CCATGA
2594
- CCATGT
2595
- CCATGC
2596
- CCATGG
2597
- CCACAA
2598
- CCACAT
2599
- CCACAC
2600
- CCACAG
2601
- CCACTA
2602
- CCACTT
2603
- CCACTC
2604
- CCACTG
2605
- CCACCA
2606
- CCACCT
2607
- CCACCC
2608
- CCACCG
2609
- CCACGA
2610
- CCACGT
2611
- CCACGC
2612
- CCACGG
2613
- CCAGAA
2614
- CCAGAT
2615
- CCAGAC
2616
- CCAGAG
2617
- CCAGTA
2618
- CCAGTT
2619
- CCAGTC
2620
- CCAGTG
2621
- CCAGCA
2622
- CCAGCT
2623
- CCAGCC
2624
- CCAGCG
2625
- CCAGGA
2626
- CCAGGT
2627
- CCAGGC
2628
- CCAGGG
2629
- CCTAAA
2630
- CCTAAT
2631
- CCTAAC
2632
- CCTAAG
2633
- CCTATA
2634
- CCTATT
2635
- CCTATC
2636
- CCTATG
2637
- CCTACA
2638
- CCTACT
2639
- CCTACC
2640
- CCTACG
2641
- CCTAGA
2642
- CCTAGT
2643
- CCTAGC
2644
- CCTAGG
2645
- CCTTAA
2646
- CCTTAT
2647
- CCTTAC
2648
- CCTTAG
2649
- CCTTTA
2650
- CCTTTT
2651
- CCTTTC
2652
- CCTTTG
2653
- CCTTCA
2654
- CCTTCT
2655
- CCTTCC
2656
- CCTTCG
2657
- CCTTGA
2658
- CCTTGT
2659
- CCTTGC
2660
- CCTTGG
2661
- CCTCAA
2662
- CCTCAT
2663
- CCTCAC
2664
- CCTCAG
2665
- CCTCTA
2666
- CCTCTT
2667
- CCTCTC
2668
- CCTCTG
2669
- CCTCCA
2670
- CCTCCT
2671
- CCTCCC
2672
- CCTCCG
2673
- CCTCGA
2674
- CCTCGT
2675
- CCTCGC
2676
- CCTCGG
2677
- CCTGAA
2678
- CCTGAT
2679
- CCTGAC
2680
- CCTGAG
2681
- CCTGTA
2682
- CCTGTT
2683
- CCTGTC
2684
- CCTGTG
2685
- CCTGCA
2686
- CCTGCT
2687
- CCTGCC
2688
- CCTGCG
2689
- CCTGGA
2690
- CCTGGT
2691
- CCTGGC
2692
- CCTGGG
2693
- CCCAAA
2694
- CCCAAT
2695
- CCCAAC
2696
- CCCAAG
2697
- CCCATA
2698
- CCCATT
2699
- CCCATC
2700
- CCCATG
2701
- CCCACA
2702
- CCCACT
2703
- CCCACC
2704
- CCCACG
2705
- CCCAGA
2706
- CCCAGT
2707
- CCCAGC
2708
- CCCAGG
2709
- CCCTAA
2710
- CCCTAT
2711
- CCCTAC
2712
- CCCTAG
2713
- CCCTTA
2714
- CCCTTT
2715
- CCCTTC
2716
- CCCTTG
2717
- CCCTCA
2718
- CCCTCT
2719
- CCCTCC
2720
- CCCTCG
2721
- CCCTGA
2722
- CCCTGT
2723
- CCCTGC
2724
- CCCTGG
2725
- CCCCAA
2726
- CCCCAT
2727
- CCCCAC
2728
- CCCCAG
2729
- CCCCTA
2730
- CCCCTT
2731
- CCCCTC
2732
- CCCCTG
2733
- CCCCCA
2734
- CCCCCT
2735
- CCCCCC
2736
- CCCCCG
2737
- CCCCGA
2738
- CCCCGT
2739
- CCCCGC
2740
- CCCCGG
2741
- CCCGAA
2742
- CCCGAT
2743
- CCCGAC
2744
- CCCGAG
2745
- CCCGTA
2746
- CCCGTT
2747
- CCCGTC
2748
- CCCGTG
2749
- CCCGCA
2750
- CCCGCT
2751
- CCCGCC
2752
- CCCGCG
2753
- CCCGGA
2754
- CCCGGT
2755
- CCCGGC
2756
- CCCGGG
2757
- CCGAAA
2758
- CCGAAT
2759
- CCGAAC
2760
- CCGAAG
2761
- CCGATA
2762
- CCGATT
2763
- CCGATC
2764
- CCGATG
2765
- CCGACA
2766
- CCGACT
2767
- CCGACC
2768
- CCGACG
2769
- CCGAGA
2770
- CCGAGT
2771
- CCGAGC
2772
- CCGAGG
2773
- CCGTAA
2774
- CCGTAT
2775
- CCGTAC
2776
- CCGTAG
2777
- CCGTTA
2778
- CCGTTT
2779
- CCGTTC
2780
- CCGTTG
2781
- CCGTCA
2782
- CCGTCT
2783
- CCGTCC
2784
- CCGTCG
2785
- CCGTGA
2786
- CCGTGT
2787
- CCGTGC
2788
- CCGTGG
2789
- CCGCAA
2790
- CCGCAT
2791
- CCGCAC
2792
- CCGCAG
2793
- CCGCTA
2794
- CCGCTT
2795
- CCGCTC
2796
- CCGCTG
2797
- CCGCCA
2798
- CCGCCT
2799
- CCGCCC
2800
- CCGCCG
2801
- CCGCGA
2802
- CCGCGT
2803
- CCGCGC
2804
- CCGCGG
2805
- CCGGAA
2806
- CCGGAT
2807
- CCGGAC
2808
- CCGGAG
2809
- CCGGTA
2810
- CCGGTT
2811
- CCGGTC
2812
- CCGGTG
2813
- CCGGCA
2814
- CCGGCT
2815
- CCGGCC
2816
- CCGGCG
2817
- CCGGGA
2818
- CCGGGT
2819
- CCGGGC
2820
- CCGGGG
2821
- CGAAAA
2822
- CGAAAT
2823
- CGAAAC
2824
- CGAAAG
2825
- CGAATA
2826
- CGAATT
2827
- CGAATC
2828
- CGAATG
2829
- CGAACA
2830
- CGAACT
2831
- CGAACC
2832
- CGAACG
2833
- CGAAGA
2834
- CGAAGT
2835
- CGAAGC
2836
- CGAAGG
2837
- CGATAA
2838
- CGATAT
2839
- CGATAC
2840
- CGATAG
2841
- CGATTA
2842
- CGATTT
2843
- CGATTC
2844
- CGATTG
2845
- CGATCA
2846
- CGATCT
2847
- CGATCC
2848
- CGATCG
2849
- CGATGA
2850
- CGATGT
2851
- CGATGC
2852
- CGATGG
2853
- CGACAA
2854
- CGACAT
2855
- CGACAC
2856
- CGACAG
2857
- CGACTA
2858
- CGACTT
2859
- CGACTC
2860
- CGACTG
2861
- CGACCA
2862
- CGACCT
2863
- CGACCC
2864
- CGACCG
2865
- CGACGA
2866
- CGACGT
2867
- CGACGC
2868
- CGACGG
2869
- CGAGAA
2870
- CGAGAT
2871
- CGAGAC
2872
- CGAGAG
2873
- CGAGTA
2874
- CGAGTT
2875
- CGAGTC
2876
- CGAGTG
2877
- CGAGCA
2878
- CGAGCT
2879
- CGAGCC
2880
- CGAGCG
2881
- CGAGGA
2882
- CGAGGT
2883
- CGAGGC
2884
- CGAGGG
2885
- CGTAAA
2886
- CGTAAT
2887
- CGTAAC
2888
- CGTAAG
2889
- CGTATA
2890
- CGTATT
2891
- CGTATC
2892
- CGTATG
2893
- CGTACA
2894
- CGTACT
2895
- CGTACC
2896
- CGTACG
2897
- CGTAGA
2898
- CGTAGT
2899
- CGTAGC
2900
- CGTAGG
2901
- CGTTAA
2902
- CGTTAT
2903
- CGTTAC
2904
- CGTTAG
2905
- CGTTTA
2906
- CGTTTT
2907
- CGTTTC
2908
- CGTTTG
2909
- CGTTCA
2910
- CGTTCT
2911
- CGTTCC
2912
- CGTTCG
2913
- CGTTGA
2914
- CGTTGT
2915
- CGTTGC
2916
- CGTTGG
2917
- CGTCAA
2918
- CGTCAT
2919
- CGTCAC
2920
- CGTCAG
2921
- CGTCTA
2922
- CGTCTT
2923
- CGTCTC
2924
- CGTCTG
2925
- CGTCCA
2926
- CGTCCT
2927
- CGTCCC
2928
- CGTCCG
2929
- CGTCGA
2930
- CGTCGT
2931
- CGTCGC
2932
- CGTCGG
2933
- CGTGAA
2934
- CGTGAT
2935
- CGTGAC
2936
- CGTGAG
2937
- CGTGTA
2938
- CGTGTT
2939
- CGTGTC
2940
- CGTGTG
2941
- CGTGCA
2942
- CGTGCT
2943
- CGTGCC
2944
- CGTGCG
2945
- CGTGGA
2946
- CGTGGT
2947
- CGTGGC
2948
- CGTGGG
2949
- CGCAAA
2950
- CGCAAT
2951
- CGCAAC
2952
- CGCAAG
2953
- CGCATA
2954
- CGCATT
2955
- CGCATC
2956
- CGCATG
2957
- CGCACA
2958
- CGCACT
2959
- CGCACC
2960
- CGCACG
2961
- CGCAGA
2962
- CGCAGT
2963
- CGCAGC
2964
- CGCAGG
2965
- CGCTAA
2966
- CGCTAT
2967
- CGCTAC
2968
- CGCTAG
2969
- CGCTTA
2970
- CGCTTT
2971
- CGCTTC
2972
- CGCTTG
2973
- CGCTCA
2974
- CGCTCT
2975
- CGCTCC
2976
- CGCTCG
2977
- CGCTGA
2978
- CGCTGT
2979
- CGCTGC
2980
- CGCTGG
2981
- CGCCAA
2982
- CGCCAT
2983
- CGCCAC
2984
- CGCCAG
2985
- CGCCTA
2986
- CGCCTT
2987
- CGCCTC
2988
- CGCCTG
2989
- CGCCCA
2990
- CGCCCT
2991
- CGCCCC
2992
- CGCCCG
2993
- CGCCGA
2994
- CGCCGT
2995
- CGCCGC
2996
- CGCCGG
2997
- CGCGAA
2998
- CGCGAT
2999
- CGCGAC
3000
- CGCGAG
3001
- CGCGTA
3002
- CGCGTT
3003
- CGCGTC
3004
- CGCGTG
3005
- CGCGCA
3006
- CGCGCT
3007
- CGCGCC
3008
- CGCGCG
3009
- CGCGGA
3010
- CGCGGT
3011
- CGCGGC
3012
- CGCGGG
3013
- CGGAAA
3014
- CGGAAT
3015
- CGGAAC
3016
- CGGAAG
3017
- CGGATA
3018
- CGGATT
3019
- CGGATC
3020
- CGGATG
3021
- CGGACA
3022
- CGGACT
3023
- CGGACC
3024
- CGGACG
3025
- CGGAGA
3026
- CGGAGT
3027
- CGGAGC
3028
- CGGAGG
3029
- CGGTAA
3030
- CGGTAT
3031
- CGGTAC
3032
- CGGTAG
3033
- CGGTTA
3034
- CGGTTT
3035
- CGGTTC
3036
- CGGTTG
3037
- CGGTCA
3038
- CGGTCT
3039
- CGGTCC
3040
- CGGTCG
3041
- CGGTGA
3042
- CGGTGT
3043
- CGGTGC
3044
- CGGTGG
3045
- CGGCAA
3046
- CGGCAT
3047
- CGGCAC
3048
- CGGCAG
3049
- CGGCTA
3050
- CGGCTT
3051
- CGGCTC
3052
- CGGCTG
3053
- CGGCCA
3054
- CGGCCT
3055
- CGGCCC
3056
- CGGCCG
3057
- CGGCGA
3058
- CGGCGT
3059
- CGGCGC
3060
- CGGCGG
3061
- CGGGAA
3062
- CGGGAT
3063
- CGGGAC
3064
- CGGGAG
3065
- CGGGTA
3066
- CGGGTT
3067
- CGGGTC
3068
- CGGGTG
3069
- CGGGCA
3070
- CGGGCT
3071
- CGGGCC
3072
- CGGGCG
3073
- CGGGGA
3074
- CGGGGT
3075
- CGGGGC
3076
- CGGGGG
3077
- GAAAAA
3078
- GAAAAT
3079
- GAAAAC
3080
- GAAAAG
3081
- GAAATA
3082
- GAAATT
3083
- GAAATC
3084
- GAAATG
3085
- GAAACA
3086
- GAAACT
3087
- GAAACC
3088
- GAAACG
3089
- GAAAGA
3090
- GAAAGT
3091
- GAAAGC
3092
- GAAAGG
3093
- GAATAA
3094
- GAATAT
3095
- GAATAC
3096
- GAATAG
3097
- GAATTA
3098
- GAATTT
3099
- GAATTC
3100
- GAATTG
3101
- GAATCA
3102
- GAATCT
3103
- GAATCC
3104
- GAATCG
3105
- GAATGA
3106
- GAATGT
3107
- GAATGC
3108
- GAATGG
3109
- GAACAA
3110
- GAACAT
3111
- GAACAC
3112
- GAACAG
3113
- GAACTA
3114
- GAACTT
3115
- GAACTC
3116
- GAACTG
3117
- GAACCA
3118
- GAACCT
3119
- GAACCC
3120
- GAACCG
3121
- GAACGA
3122
- GAACGT
3123
- GAACGC
3124
- GAACGG
3125
- GAAGAA
3126
- GAAGAT
3127
- GAAGAC
3128
- GAAGAG
3129
- GAAGTA
3130
- GAAGTT
3131
- GAAGTC
3132
- GAAGTG
3133
- GAAGCA
3134
- GAAGCT
3135
- GAAGCC
3136
- GAAGCG
3137
- GAAGGA
3138
- GAAGGT
3139
- GAAGGC
3140
- GAAGGG
3141
- GATAAA
3142
- GATAAT
3143
- GATAAC
3144
- GATAAG
3145
- GATATA
3146
- GATATT
3147
- GATATC
3148
- GATATG
3149
- GATACA
3150
- GATACT
3151
- GATACC
3152
- GATACG
3153
- GATAGA
3154
- GATAGT
3155
- GATAGC
3156
- GATAGG
3157
- GATTAA
3158
- GATTAT
3159
- GATTAC
3160
- GATTAG
3161
- GATTTA
3162
- GATTTT
3163
- GATTTC
3164
- GATTTG
3165
- GATTCA
3166
- GATTCT
3167
- GATTCC
3168
- GATTCG
3169
- GATTGA
3170
- GATTGT
3171
- GATTGC
3172
- GATTGG
3173
- GATCAA
3174
- GATCAT
3175
- GATCAC
3176
- GATCAG
3177
- GATCTA
3178
- GATCTT
3179
- GATCTC
3180
- GATCTG
3181
- GATCCA
3182
- GATCCT
3183
- GATCCC
3184
- GATCCG
3185
- GATCGA
3186
- GATCGT
3187
- GATCGC
3188
- GATCGG
3189
- GATGAA
3190
- GATGAT
3191
- GATGAC
3192
- GATGAG
3193
- GATGTA
3194
- GATGTT
3195
- GATGTC
3196
- GATGTG
3197
- GATGCA
3198
- GATGCT
3199
- GATGCC
3200
- GATGCG
3201
- GATGGA
3202
- GATGGT
3203
- GATGGC
3204
- GATGGG
3205
- GACAAA
3206
- GACAAT
3207
- GACAAC
3208
- GACAAG
3209
- GACATA
3210
- GACATT
3211
- GACATC
3212
- GACATG
3213
- GACACA
3214
- GACACT
3215
- GACACC
3216
- GACACG
3217
- GACAGA
3218
- GACAGT
3219
- GACAGC
3220
- GACAGG
3221
- GACTAA
3222
- GACTAT
3223
- GACTAC
3224
- GACTAG
3225
- GACTTA
3226
- GACTTT
3227
- GACTTC
3228
- GACTTG
3229
- GACTCA
3230
- GACTCT
3231
- GACTCC
3232
- GACTCG
3233
- GACTGA
3234
- GACTGT
3235
- GACTGC
3236
- GACTGG
3237
- GACCAA
3238
- GACCAT
3239
- GACCAC
3240
- GACCAG
3241
- GACCTA
3242
- GACCTT
3243
- GACCTC
3244
- GACCTG
3245
- GACCCA
3246
- GACCCT
3247
- GACCCC
3248
- GACCCG
3249
- GACCGA
3250
- GACCGT
3251
- GACCGC
3252
- GACCGG
3253
- GACGAA
3254
- GACGAT
3255
- GACGAC
3256
- GACGAG
3257
- GACGTA
3258
- GACGTT
3259
- GACGTC
3260
- GACGTG
3261
- GACGCA
3262
- GACGCT
3263
- GACGCC
3264
- GACGCG
3265
- GACGGA
3266
- GACGGT
3267
- GACGGC
3268
- GACGGG
3269
- GAGAAA
3270
- GAGAAT
3271
- GAGAAC
3272
- GAGAAG
3273
- GAGATA
3274
- GAGATT
3275
- GAGATC
3276
- GAGATG
3277
- GAGACA
3278
- GAGACT
3279
- GAGACC
3280
- GAGACG
3281
- GAGAGA
3282
- GAGAGT
3283
- GAGAGC
3284
- GAGAGG
3285
- GAGTAA
3286
- GAGTAT
3287
- GAGTAC
3288
- GAGTAG
3289
- GAGTTA
3290
- GAGTTT
3291
- GAGTTC
3292
- GAGTTG
3293
- GAGTCA
3294
- GAGTCT
3295
- GAGTCC
3296
- GAGTCG
3297
- GAGTGA
3298
- GAGTGT
3299
- GAGTGC
3300
- GAGTGG
3301
- GAGCAA
3302
- GAGCAT
3303
- GAGCAC
3304
- GAGCAG
3305
- GAGCTA
3306
- GAGCTT
3307
- GAGCTC
3308
- GAGCTG
3309
- GAGCCA
3310
- GAGCCT
3311
- GAGCCC
3312
- GAGCCG
3313
- GAGCGA
3314
- GAGCGT
3315
- GAGCGC
3316
- GAGCGG
3317
- GAGGAA
3318
- GAGGAT
3319
- GAGGAC
3320
- GAGGAG
3321
- GAGGTA
3322
- GAGGTT
3323
- GAGGTC
3324
- GAGGTG
3325
- GAGGCA
3326
- GAGGCT
3327
- GAGGCC
3328
- GAGGCG
3329
- GAGGGA
3330
- GAGGGT
3331
- GAGGGC
3332
- GAGGGG
3333
- GTAAAA
3334
- GTAAAT
3335
- GTAAAC
3336
- GTAAAG
3337
- GTAATA
3338
- GTAATT
3339
- GTAATC
3340
- GTAATG
3341
- GTAACA
3342
- GTAACT
3343
- GTAACC
3344
- GTAACG
3345
- GTAAGA
3346
- GTAAGT
3347
- GTAAGC
3348
- GTAAGG
3349
- GTATAA
3350
- GTATAT
3351
- GTATAC
3352
- GTATAG
3353
- GTATTA
3354
- GTATTT
3355
- GTATTC
3356
- GTATTG
3357
- GTATCA
3358
- GTATCT
3359
- GTATCC
3360
- GTATCG
3361
- GTATGA
3362
- GTATGT
3363
- GTATGC
3364
- GTATGG
3365
- GTACAA
3366
- GTACAT
3367
- GTACAC
3368
- GTACAG
3369
- GTACTA
3370
- GTACTT
3371
- GTACTC
3372
- GTACTG
3373
- GTACCA
3374
- GTACCT
3375
- GTACCC
3376
- GTACCG
3377
- GTACGA
3378
- GTACGT
3379
- GTACGC
3380
- GTACGG
3381
- GTAGAA
3382
- GTAGAT
3383
- GTAGAC
3384
- GTAGAG
3385
- GTAGTA
3386
- GTAGTT
3387
- GTAGTC
3388
- GTAGTG
3389
- GTAGCA
3390
- GTAGCT
3391
- GTAGCC
3392
- GTAGCG
3393
- GTAGGA
3394
- GTAGGT
3395
- GTAGGC
3396
- GTAGGG
3397
- GTTAAA
3398
- GTTAAT
3399
- GTTAAC
3400
- GTTAAG
3401
- GTTATA
3402
- GTTATT
3403
- GTTATC
3404
- GTTATG
3405
- GTTACA
3406
- GTTACT
3407
- GTTACC
3408
- GTTACG
3409
- GTTAGA
3410
- GTTAGT
3411
- GTTAGC
3412
- GTTAGG
3413
- GTTTAA
3414
- GTTTAT
3415
- GTTTAC
3416
- GTTTAG
3417
- GTTTTA
3418
- GTTTTT
3419
- GTTTTC
3420
- GTTTTG
3421
- GTTTCA
3422
- GTTTCT
3423
- GTTTCC
3424
- GTTTCG
3425
- GTTTGA
3426
- GTTTGT
3427
- GTTTGC
3428
- GTTTGG
3429
- GTTCAA
3430
- GTTCAT
3431
- GTTCAC
3432
- GTTCAG
3433
- GTTCTA
3434
- GTTCTT
3435
- GTTCTC
3436
- GTTCTG
3437
- GTTCCA
3438
- GTTCCT
3439
- GTTCCC
3440
- GTTCCG
3441
- GTTCGA
3442
- GTTCGT
3443
- GTTCGC
3444
- GTTCGG
3445
- GTTGAA
3446
- GTTGAT
3447
- GTTGAC
3448
- GTTGAG
3449
- GTTGTA
3450
- GTTGTT
3451
- GTTGTC
3452
- GTTGTG
3453
- GTTGCA
3454
- GTTGCT
3455
- GTTGCC
3456
- GTTGCG
3457
- GTTGGA
3458
- GTTGGT
3459
- GTTGGC
3460
- GTTGGG
3461
- GTCAAA
3462
- GTCAAT
3463
- GTCAAC
3464
- GTCAAG
3465
- GTCATA
3466
- GTCATT
3467
- GTCATC
3468
- GTCATG
3469
- GTCACA
3470
- GTCACT
3471
- GTCACC
3472
- GTCACG
3473
- GTCAGA
3474
- GTCAGT
3475
- GTCAGC
3476
- GTCAGG
3477
- GTCTAA
3478
- GTCTAT
3479
- GTCTAC
3480
- GTCTAG
3481
- GTCTTA
3482
- GTCTTT
3483
- GTCTTC
3484
- GTCTTG
3485
- GTCTCA
3486
- GTCTCT
3487
- GTCTCC
3488
- GTCTCG
3489
- GTCTGA
3490
- GTCTGT
3491
- GTCTGC
3492
- GTCTGG
3493
- GTCCAA
3494
- GTCCAT
3495
- GTCCAC
3496
- GTCCAG
3497
- GTCCTA
3498
- GTCCTT
3499
- GTCCTC
3500
- GTCCTG
3501
- GTCCCA
3502
- GTCCCT
3503
- GTCCCC
3504
- GTCCCG
3505
- GTCCGA
3506
- GTCCGT
3507
- GTCCGC
3508
- GTCCGG
3509
- GTCGAA
3510
- GTCGAT
3511
- GTCGAC
3512
- GTCGAG
3513
- GTCGTA
3514
- GTCGTT
3515
- GTCGTC
3516
- GTCGTG
3517
- GTCGCA
3518
- GTCGCT
3519
- GTCGCC
3520
- GTCGCG
3521
- GTCGGA
3522
- GTCGGT
3523
- GTCGGC
3524
- GTCGGG
3525
- GTGAAA
3526
- GTGAAT
3527
- GTGAAC
3528
- GTGAAG
3529
- GTGATA
3530
- GTGATT
3531
- GTGATC
3532
- GTGATG
3533
- GTGACA
3534
- GTGACT
3535
- GTGACC
3536
- GTGACG
3537
- GTGAGA
3538
- GTGAGT
3539
- GTGAGC
3540
- GTGAGG
3541
- GTGTAA
3542
- GTGTAT
3543
- GTGTAC
3544
- GTGTAG
3545
- GTGTTA
3546
- GTGTTT
3547
- GTGTTC
3548
- GTGTTG
3549
- GTGTCA
3550
- GTGTCT
3551
- GTGTCC
3552
- GTGTCG
3553
- GTGTGA
3554
- GTGTGT
3555
- GTGTGC
3556
- GTGTGG
3557
- GTGCAA
3558
- GTGCAT
3559
- GTGCAC
3560
- GTGCAG
3561
- GTGCTA
3562
- GTGCTT
3563
- GTGCTC
3564
- GTGCTG
3565
- GTGCCA
3566
- GTGCCT
3567
- GTGCCC
3568
- GTGCCG
3569
- GTGCGA
3570
- GTGCGT
3571
- GTGCGC
3572
- GTGCGG
3573
- GTGGAA
3574
- GTGGAT
3575
- GTGGAC
3576
- GTGGAG
3577
- GTGGTA
3578
- GTGGTT
3579
- GTGGTC
3580
- GTGGTG
3581
- GTGGCA
3582
- GTGGCT
3583
- GTGGCC
3584
- GTGGCG
3585
- GTGGGA
3586
- GTGGGT
3587
- GTGGGC
3588
- GTGGGG
3589
- GCAAAA
3590
- GCAAAT
3591
- GCAAAC
3592
- GCAAAG
3593
- GCAATA
3594
- GCAATT
3595
- GCAATC
3596
- GCAATG
3597
- GCAACA
3598
- GCAACT
3599
- GCAACC
3600
- GCAACG
3601
- GCAAGA
3602
- GCAAGT
3603
- GCAAGC
3604
- GCAAGG
3605
- GCATAA
3606
- GCATAT
3607
- GCATAC
3608
- GCATAG
3609
- GCATTA
3610
- GCATTT
3611
- GCATTC
3612
- GCATTG
3613
- GCATCA
3614
- GCATCT
3615
- GCATCC
3616
- GCATCG
3617
- GCATGA
3618
- GCATGT
3619
- GCATGC
3620
- GCATGG
3621
- GCACAA
3622
- GCACAT
3623
- GCACAC
3624
- GCACAG
3625
- GCACTA
3626
- GCACTT
3627
- GCACTC
3628
- GCACTG
3629
- GCACCA
3630
- GCACCT
3631
- GCACCC
3632
- GCACCG
3633
- GCACGA
3634
- GCACGT
3635
- GCACGC
3636
- GCACGG
3637
- GCAGAA
3638
- GCAGAT
3639
- GCAGAC
3640
- GCAGAG
3641
- GCAGTA
3642
- GCAGTT
3643
- GCAGTC
3644
- GCAGTG
3645
- GCAGCA
3646
- GCAGCT
3647
- GCAGCC
3648
- GCAGCG
3649
- GCAGGA
3650
- GCAGGT
3651
- GCAGGC
3652
- GCAGGG
3653
- GCTAAA
3654
- GCTAAT
3655
- GCTAAC
3656
- GCTAAG
3657
- GCTATA
3658
- GCTATT
3659
- GCTATC
3660
- GCTATG
3661
- GCTACA
3662
- GCTACT
3663
- GCTACC
3664
- GCTACG
3665
- GCTAGA
3666
- GCTAGT
3667
- GCTAGC
3668
- GCTAGG
3669
- GCTTAA
3670
- GCTTAT
3671
- GCTTAC
3672
- GCTTAG
3673
- GCTTTA
3674
- GCTTTT
3675
- GCTTTC
3676
- GCTTTG
3677
- GCTTCA
3678
- GCTTCT
3679
- GCTTCC
3680
- GCTTCG
3681
- GCTTGA
3682
- GCTTGT
3683
- GCTTGC
3684
- GCTTGG
3685
- GCTCAA
3686
- GCTCAT
3687
- GCTCAC
3688
- GCTCAG
3689
- GCTCTA
3690
- GCTCTT
3691
- GCTCTC
3692
- GCTCTG
3693
- GCTCCA
3694
- GCTCCT
3695
- GCTCCC
3696
- GCTCCG
3697
- GCTCGA
3698
- GCTCGT
3699
- GCTCGC
3700
- GCTCGG
3701
- GCTGAA
3702
- GCTGAT
3703
- GCTGAC
3704
- GCTGAG
3705
- GCTGTA
3706
- GCTGTT
3707
- GCTGTC
3708
- GCTGTG
3709
- GCTGCA
3710
- GCTGCT
3711
- GCTGCC
3712
- GCTGCG
3713
- GCTGGA
3714
- GCTGGT
3715
- GCTGGC
3716
- GCTGGG
3717
- GCCAAA
3718
- GCCAAT
3719
- GCCAAC
3720
- GCCAAG
3721
- GCCATA
3722
- GCCATT
3723
- GCCATC
3724
- GCCATG
3725
- GCCACA
3726
- GCCACT
3727
- GCCACC
3728
- GCCACG
3729
- GCCAGA
3730
- GCCAGT
3731
- GCCAGC
3732
- GCCAGG
3733
- GCCTAA
3734
- GCCTAT
3735
- GCCTAC
3736
- GCCTAG
3737
- GCCTTA
3738
- GCCTTT
3739
- GCCTTC
3740
- GCCTTG
3741
- GCCTCA
3742
- GCCTCT
3743
- GCCTCC
3744
- GCCTCG
3745
- GCCTGA
3746
- GCCTGT
3747
- GCCTGC
3748
- GCCTGG
3749
- GCCCAA
3750
- GCCCAT
3751
- GCCCAC
3752
- GCCCAG
3753
- GCCCTA
3754
- GCCCTT
3755
- GCCCTC
3756
- GCCCTG
3757
- GCCCCA
3758
- GCCCCT
3759
- GCCCCC
3760
- GCCCCG
3761
- GCCCGA
3762
- GCCCGT
3763
- GCCCGC
3764
- GCCCGG
3765
- GCCGAA
3766
- GCCGAT
3767
- GCCGAC
3768
- GCCGAG
3769
- GCCGTA
3770
- GCCGTT
3771
- GCCGTC
3772
- GCCGTG
3773
- GCCGCA
3774
- GCCGCT
3775
- GCCGCC
3776
- GCCGCG
3777
- GCCGGA
3778
- GCCGGT
3779
- GCCGGC
3780
- GCCGGG
3781
- GCGAAA
3782
- GCGAAT
3783
- GCGAAC
3784
- GCGAAG
3785
- GCGATA
3786
- GCGATT
3787
- GCGATC
3788
- GCGATG
3789
- GCGACA
3790
- GCGACT
3791
- GCGACC
3792
- GCGACG
3793
- GCGAGA
3794
- GCGAGT
3795
- GCGAGC
3796
- GCGAGG
3797
- GCGTAA
3798
- GCGTAT
3799
- GCGTAC
3800
- GCGTAG
3801
- GCGTTA
3802
- GCGTTT
3803
- GCGTTC
3804
- GCGTTG
3805
- GCGTCA
3806
- GCGTCT
3807
- GCGTCC
3808
- GCGTCG
3809
- GCGTGA
3810
- GCGTGT
3811
- GCGTGC
3812
- GCGTGG
3813
- GCGCAA
3814
- GCGCAT
3815
- GCGCAC
3816
- GCGCAG
3817
- GCGCTA
3818
- GCGCTT
3819
- GCGCTC
3820
- GCGCTG
3821
- GCGCCA
3822
- GCGCCT
3823
- GCGCCC
3824
- GCGCCG
3825
- GCGCGA
3826
- GCGCGT
3827
- GCGCGC
3828
- GCGCGG
3829
- GCGGAA
3830
- GCGGAT
3831
- GCGGAC
3832
- GCGGAG
3833
- GCGGTA
3834
- GCGGTT
3835
- GCGGTC
3836
- GCGGTG
3837
- GCGGCA
3838
- GCGGCT
3839
- GCGGCC
3840
- GCGGCG
3841
- GCGGGA
3842
- GCGGGT
3843
- GCGGGC
3844
- GCGGGG
3845
- GGAAAA
3846
- GGAAAT
3847
- GGAAAC
3848
- GGAAAG
3849
- GGAATA
3850
- GGAATT
3851
- GGAATC
3852
- GGAATG
3853
- GGAACA
3854
- GGAACT
3855
- GGAACC
3856
- GGAACG
3857
- GGAAGA
3858
- GGAAGT
3859
- GGAAGC
3860
- GGAAGG
3861
- GGATAA
3862
- GGATAT
3863
- GGATAC
3864
- GGATAG
3865
- GGATTA
3866
- GGATTT
3867
- GGATTC
3868
- GGATTG
3869
- GGATCA
3870
- GGATCT
3871
- GGATCC
3872
- GGATCG
3873
- GGATGA
3874
- GGATGT
3875
- GGATGC
3876
- GGATGG
3877
- GGACAA
3878
- GGACAT
3879
- GGACAC
3880
- GGACAG
3881
- GGACTA
3882
- GGACTT
3883
- GGACTC
3884
- GGACTG
3885
- GGACCA
3886
- GGACCT
3887
- GGACCC
3888
- GGACCG
3889
- GGACGA
3890
- GGACGT
3891
- GGACGC
3892
- GGACGG
3893
- GGAGAA
3894
- GGAGAT
3895
- GGAGAC
3896
- GGAGAG
3897
- GGAGTA
3898
- GGAGTT
3899
- GGAGTC
3900
- GGAGTG
3901
- GGAGCA
3902
- GGAGCT
3903
- GGAGCC
3904
- GGAGCG
3905
- GGAGGA
3906
- GGAGGT
3907
- GGAGGC
3908
- GGAGGG
3909
- GGTAAA
3910
- GGTAAT
3911
- GGTAAC
3912
- GGTAAG
3913
- GGTATA
3914
- GGTATT
3915
- GGTATC
3916
- GGTATG
3917
- GGTACA
3918
- GGTACT
3919
- GGTACC
3920
- GGTACG
3921
- GGTAGA
3922
- GGTAGT
3923
- GGTAGC
3924
- GGTAGG
3925
- GGTTAA
3926
- GGTTAT
3927
- GGTTAC
3928
- GGTTAG
3929
- GGTTTA
3930
- GGTTTT
3931
- GGTTTC
3932
- GGTTTG
3933
- GGTTCA
3934
- GGTTCT
3935
- GGTTCC
3936
- GGTTCG
3937
- GGTTGA
3938
- GGTTGT
3939
- GGTTGC
3940
- GGTTGG
3941
- GGTCAA
3942
- GGTCAT
3943
- GGTCAC
3944
- GGTCAG
3945
- GGTCTA
3946
- GGTCTT
3947
- GGTCTC
3948
- GGTCTG
3949
- GGTCCA
3950
- GGTCCT
3951
- GGTCCC
3952
- GGTCCG
3953
- GGTCGA
3954
- GGTCGT
3955
- GGTCGC
3956
- GGTCGG
3957
- GGTGAA
3958
- GGTGAT
3959
- GGTGAC
3960
- GGTGAG
3961
- GGTGTA
3962
- GGTGTT
3963
- GGTGTC
3964
- GGTGTG
3965
- GGTGCA
3966
- GGTGCT
3967
- GGTGCC
3968
- GGTGCG
3969
- GGTGGA
3970
- GGTGGT
3971
- GGTGGC
3972
- GGTGGG
3973
- GGCAAA
3974
- GGCAAT
3975
- GGCAAC
3976
- GGCAAG
3977
- GGCATA
3978
- GGCATT
3979
- GGCATC
3980
- GGCATG
3981
- GGCACA
3982
- GGCACT
3983
- GGCACC
3984
- GGCACG
3985
- GGCAGA
3986
- GGCAGT
3987
- GGCAGC
3988
- GGCAGG
3989
- GGCTAA
3990
- GGCTAT
3991
- GGCTAC
3992
- GGCTAG
3993
- GGCTTA
3994
- GGCTTT
3995
- GGCTTC
3996
- GGCTTG
3997
- GGCTCA
3998
- GGCTCT
3999
- GGCTCC
4000
- GGCTCG
4001
- GGCTGA
4002
- GGCTGT
4003
- GGCTGC
4004
- GGCTGG
4005
- GGCCAA
4006
- GGCCAT
4007
- GGCCAC
4008
- GGCCAG
4009
- GGCCTA
4010
- GGCCTT
4011
- GGCCTC
4012
- GGCCTG
4013
- GGCCCA
4014
- GGCCCT
4015
- GGCCCC
4016
- GGCCCG
4017
- GGCCGA
4018
- GGCCGT
4019
- GGCCGC
4020
- GGCCGG
4021
- GGCGAA
4022
- GGCGAT
4023
- GGCGAC
4024
- GGCGAG
4025
- GGCGTA
4026
- GGCGTT
4027
- GGCGTC
4028
- GGCGTG
4029
- GGCGCA
4030
- GGCGCT
4031
- GGCGCC
4032
- GGCGCG
4033
- GGCGGA
4034
- GGCGGT
4035
- GGCGGC
4036
- GGCGGG
4037
- GGGAAA
4038
- GGGAAT
4039
- GGGAAC
4040
- GGGAAG
4041
- GGGATA
4042
- GGGATT
4043
- GGGATC
4044
- GGGATG
4045
- GGGACA
4046
- GGGACT
4047
- GGGACC
4048
- GGGACG
4049
- GGGAGA
4050
- GGGAGT
4051
- GGGAGC
4052
- GGGAGG
4053
- GGGTAA
4054
- GGGTAT
4055
- GGGTAC
4056
- GGGTAG
4057
- GGGTTA
4058
- GGGTTT
4059
- GGGTTC
4060
- GGGTTG
4061
- GGGTCA
4062
- GGGTCT
4063
- GGGTCC
4064
- GGGTCG
4065
- GGGTGA
4066
- GGGTGT
4067
- GGGTGC
4068
- GGGTGG
4069
- GGGCAA
4070
- GGGCAT
4071
- GGGCAC
4072
- GGGCAG
4073
- GGGCTA
4074
- GGGCTT
4075
- GGGCTC
4076
- GGGCTG
4077
- GGGCCA
4078
- GGGCCT
4079
- GGGCCC
4080
- GGGCCG
4081
- GGGCGA
4082
- GGGCGT
4083
- GGGCGC
4084
- GGGCGG
4085
- GGGGAA
4086
- GGGGAT
4087
- GGGGAC
4088
- GGGGAG
4089
- GGGGTA
4090
- GGGGTT
4091
- GGGGTC
4092
- GGGGTG
4093
- GGGGCA
4094
- GGGGCT
4095
- GGGGCC
4096
- GGGGCG
4097
- GGGGGA
4098
- GGGGGT
4099
- GGGGGC
4100
- GGGGGG
4101
- A
4102
- T
4103
- C
4104
- G
4105
- N
4106
- <eos>
4107
- <bos>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
Instadeep_NT_500M_CPT/ablation_study_10_tests.png DELETED

Git LFS Details

  • SHA256: c5ee27b9d42bdaa6ab76f26225d7aa976e48be98876670258029b93b5c13d1a1
  • Pointer size: 131 Bytes
  • Size of remote file: 583 kB
Instadeep_NT_500M_CPT/shap_modality_comparison.png DELETED
Binary file (93.4 kB)
 
Instadeep_NT_500M_CPT/shap_tabular_beeswarm.png DELETED

Git LFS Details

  • SHA256: dc493a5dcf42823fa31fbe9aae21ada530588d56e095c0c83820e2d6fb0556a0
  • Pointer size: 131 Bytes
  • Size of remote file: 110 kB