Spaces:

Jayesh13
/

HI_SCBL

Runtime error

Jayesh13 committed on Oct 11, 2024

Commit

a361d73

verified ·

1 Parent(s): 9870495

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -54,27 +54,6 @@ def process_csv(file):
     return homorepeats, sequence_data
-import pandas as pd
-import streamlit as st
-from io import BytesIO
-import xlsxwriter
-# Function to process the Excel file
-def process_excel(excel_data):
-    # Custom logic to process each sheet within the Excel file
-    homorepeats = set()
-    sequence_data = []
-    for sheet_name in excel_data.sheet_names:
-        df = excel_data.parse(sheet_name)
-        for index, row in df.iterrows():
-            entry_id = row['Entry ID']
-            protein_name = row['Protein Name']
-            freq = {repeat: row[repeat] for repeat in df.columns[2:]}  # Assuming repeats start from 3rd column
-            sequence_data.append((entry_id, protein_name, freq))
-            homorepeats.update(freq.keys())
-    return homorepeats, sequence_data
 # Function to generate and download Excel workbook with separate sheets for each input file
 def create_excel(sequences_data, homorepeats, filenames):
@@ -109,6 +88,23 @@ def create_excel(sequences_data, homorepeats, filenames):
     output.seek(0)
     return output
 # Streamlit UI components
 st.title("Protein Homorepeat Analysis")

     return homorepeats, sequence_data
 # Function to generate and download Excel workbook with separate sheets for each input file
 def create_excel(sequences_data, homorepeats, filenames):
     output.seek(0)
     return output
+# Function to process the Excel file
+def process_excel(excel_data):
+    # Custom logic to process each sheet within the Excel file
+    homorepeats = set()
+    sequence_data = []
+    for sheet_name in excel_data.sheet_names:
+        df = excel_data.parse(sheet_name)
+        for index, row in df.iterrows():
+            entry_id = row['Entry ID']
+            protein_name = row['Protein Name']
+            freq = {repeat: row[repeat] for repeat in df.columns[2:]}  # Assuming repeats start from 3rd column
+            sequence_data.append((entry_id, protein_name, freq))
+            homorepeats.update(freq.keys())
+    return homorepeats, sequence_data
 # Streamlit UI components
 st.title("Protein Homorepeat Analysis")