Haseeb-001 committed on
Commit
26895e4
·
verified ·
1 Parent(s): a897338

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +48 -39
app.py CHANGED
@@ -80,45 +80,54 @@ def main():
80
  dataset_url = st.text_input("Paste the URL of the dataset")
81
 
82
  if uploaded_file or dataset_url:
83
- if dataset_url:
84
- st.info("Downloading dataset from URL...")
85
- uploaded_file = download_dataset(dataset_url)
86
-
87
- if uploaded_file:
88
- st.success("File uploaded successfully!")
89
- st.write("Processing the file...")
90
-
91
- # Load dataset
92
- df = pd.read_csv(uploaded_file)
93
- st.write("**Original Dataset**")
94
- st.dataframe(df)
95
-
96
- # Process data
97
- st.info("Cleaning and simplifying the dataset...")
98
- df_cleaned = process_data(df)
99
-
100
- # Display cleaned data
101
- st.write("**Cleaned Dataset**")
102
- st.dataframe(df_cleaned)
103
-
104
- # Chunk data
105
- st.info("Creating chunks for AI models...")
106
- processed_files = chunk_dataset(df_cleaned)
107
-
108
- # Allow download of processed chunks
109
- st.success(f"Processing complete! {len(processed_files)} chunk(s) created.")
110
- for file_name in processed_files:
111
- with open(file_name, 'rb') as file:
112
- st.download_button(
113
- label=f"Download {file_name}",
114
- data=file,
115
- file_name=file_name,
116
- mime="text/csv",
117
- )
118
-
119
- # Cleanup generated files
120
- for file_name in processed_files:
121
- os.remove(file_name)
 
 
 
 
 
 
 
 
 
122
 
123
  if __name__ == "__main__":
124
  main()
 
80
  dataset_url = st.text_input("Paste the URL of the dataset")
81
 
82
  if uploaded_file or dataset_url:
83
+ try:
84
+ if dataset_url:
85
+ st.info("Downloading dataset from URL...")
86
+ uploaded_file = download_dataset(dataset_url)
87
+
88
+ if uploaded_file:
89
+ st.success("File uploaded successfully!")
90
+ st.write("Processing the file...")
91
+
92
+ # Load dataset
93
+ if hasattr(uploaded_file, 'read'): # Streamlit file upload
94
+ df = pd.read_csv(uploaded_file)
95
+ else: # File from URL download or local path
96
+ with open(uploaded_file, 'r') as file:
97
+ df = pd.read_csv(file)
98
+
99
+ st.write("**Original Dataset**")
100
+ st.dataframe(df)
101
+
102
+ # Process data
103
+ st.info("Cleaning and simplifying the dataset...")
104
+ df_cleaned = process_data(df)
105
+
106
+ # Display cleaned data
107
+ st.write("**Cleaned Dataset**")
108
+ st.dataframe(df_cleaned)
109
+
110
+ # Chunk data
111
+ st.info("Creating chunks for AI models...")
112
+ processed_files = chunk_dataset(df_cleaned)
113
+
114
+ # Allow download of processed chunks
115
+ st.success(f"Processing complete! {len(processed_files)} chunk(s) created.")
116
+ for file_name in processed_files:
117
+ with open(file_name, 'rb') as file:
118
+ st.download_button(
119
+ label=f"Download {file_name}",
120
+ data=file,
121
+ file_name=file_name,
122
+ mime="text/csv",
123
+ )
124
+
125
+ # Cleanup generated files
126
+ for file_name in processed_files:
127
+ os.remove(file_name)
128
+
129
+ except Exception as e:
130
+ st.error(f"An error occurred: {e}")
131
 
132
  if __name__ == "__main__":
133
  main()