LoocasGoose committed on
Commit
e223904
·
1 Parent(s): 287a5ea

update website with better UI

Browse files
Files changed (2) hide show
  1. data/desktop.ini +2 -0
  2. data/jcvi_csv_to_fasta.py +14 -0
data/desktop.ini ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ [LocalizedFileNames]
2
+ jcvi_syn30_unknown_gene_hits.csv=@jcvi_syn30_unknown_gene_hits.csv,0
data/jcvi_csv_to_fasta.py ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
"""Convert the JCVI unknown-gene CSV into a FASTA file of query sequences.

Run as a script: reads ``INPUT_CSV`` and writes one FASTA record per unique
(locus tag, sequence) pair to ``OUTPUT_FASTA``. Both paths are relative to
the current working directory.
"""
import pandas as pd

INPUT_CSV = "data/jcvi_full_unknown_gene.csv"
OUTPUT_FASTA = "jcvi_full_unknown_genes.fasta"

# Column headers as spelled in the CSV. Lookup tolerates differences in
# leading/trailing whitespace (see _resolve_column); inspect df.columns if
# the headers differ more than that.
query_id_col = "Locus tag (accession CP002027). "
seq_col = "Amino acid sequence. RNA's are labeled xrna."

# Per the sequence column's own header, RNA genes carry this placeholder
# instead of an amino-acid sequence, so such rows are not valid FASTA records.
NON_PROTEIN_LABELS = frozenset({"xrna"})


def _resolve_column(df, wanted):
    """Return the column of *df* matching *wanted*, ignoring outer whitespace.

    Raises:
        KeyError: if no column matches; the message lists the available
            columns so the caller can correct the expected header.
    """
    if wanted in df.columns:
        return wanted
    target = wanted.strip()
    for name in df.columns:
        if str(name).strip() == target:
            return name
    raise KeyError(
        f"column {wanted!r} not found; available columns: {list(df.columns)}"
    )


def extract_queries(df, id_col=query_id_col, sequence_col=seq_col):
    """Collect unique ``(query_id, sequence)`` pairs from *df*.

    Args:
        df: DataFrame holding at least the ID and sequence columns.
        id_col: header of the query-ID column.
        sequence_col: header of the sequence column.

    Returns:
        A list of ``(query_id, sequence)`` string tuples in first-seen order.
        Rows with a missing or blank ID/sequence, or whose sequence is one of
        ``NON_PROTEIN_LABELS``, are skipped. Whitespace is stripped from IDs
        and removed from sequences before de-duplication.

    Raises:
        KeyError: if either column cannot be found in *df*.
    """
    id_name = _resolve_column(df, id_col)
    seq_name = _resolve_column(df, sequence_col)

    # Drop NaN cells up front; otherwise they would be formatted as "nan".
    pairs = df[[id_name, seq_name]].dropna()

    records = []
    seen = set()
    for raw_id, raw_seq in pairs.itertuples(index=False, name=None):
        qid = str(raw_id).strip()
        seq = "".join(str(raw_seq).split())
        if not qid or not seq or seq.lower() in NON_PROTEIN_LABELS:
            continue
        key = (qid, seq)
        if key in seen:
            continue
        seen.add(key)
        records.append(key)
    return records


def write_fasta(records, path):
    """Write *records* (``(query_id, sequence)`` pairs) to *path* as FASTA."""
    with open(path, "w", encoding="utf-8") as handle:
        handle.writelines(f">{qid}\n{seq}\n" for qid, seq in records)


def main():
    """Read the input CSV and write the FASTA file."""
    df = pd.read_csv(INPUT_CSV)
    write_fasta(extract_queries(df), OUTPUT_FASTA)


if __name__ == "__main__":
    main()