Spaces:

Vashishta-S-2141
/

LLM_Powered_Database_Chatbot

Sleeping

App Files Community

SVashishta1 committed on Mar 3

Commit

f35c7b5

1 Parent(s): 9c8c8b2

Error Fix

Browse files

Files changed (1) hide show

app.py +27 -23

app.py CHANGED Viewed

@@ -223,8 +223,11 @@ def process_file_upload(files):
                 # Create table name from filename
                 table_name = os.path.splitext(file_name)[0].replace(' ', '_').lower()
-                # Load CSV into SQLite
                 conn = sqlite3.connect(DB_PATH)
                 load_csv_to_sqlite(file_path, conn, table_name)
                 # Update current context
@@ -234,35 +237,26 @@ def process_file_upload(files):
                     "table_name": table_name
                 }
-                # Get column info
                 cursor = conn.cursor()
-                cursor.execute(f"PRAGMA table_info({table_name});")
-                columns = [f"{col[1]} ({col[2]})" for col in cursor.fetchall()]
-                # Get row count
                 cursor.execute(f"SELECT COUNT(*) FROM {table_name};")
                 row_count = cursor.fetchone()[0]
-                # Get sample of data
-                cursor.execute(f"SELECT * FROM {table_name} LIMIT 5;")
-                sample_rows = cursor.fetchall()
                 conn.close()
                 file_info.append("✅ CSV File Successfully Loaded")
                 file_info.append(f"📊 Table Name: {table_name}")
                 file_info.append(f"📈 Total Rows: {row_count:,}")
-                file_info.append(f"\n📋 Columns:")
-                for col in columns:
-                    file_info.append(f"  • {col}")
-                if sample_rows:
-                    file_info.append("\n🔍 Sample Data (first 5 rows):")
-                    sample_df = pd.DataFrame(sample_rows, columns=[col.split(' ')[0] for col in columns])
-                    file_info.append(f"```\n{sample_df.to_string()}\n```")
             except Exception as e:
                 file_info.append(f"❌ Error loading CSV {file_name}: {str(e)}")
         else:
             # Process PDF or other document types
@@ -322,9 +316,11 @@ def load_csv_to_sqlite(file_path, conn, table_name):
     conn.execute("PRAGMA journal_mode = MEMORY")
     conn.execute("PRAGMA temp_store = MEMORY")
     conn.execute("PRAGMA cache_size = 10000")
-    conn.execute("BEGIN TRANSACTION")
     try:
         # Read the CSV in chunks
         for i, chunk in enumerate(pd.read_csv(file_path, chunksize=chunksize)):
             # Optimize column types
@@ -343,13 +339,21 @@ def load_csv_to_sqlite(file_path, conn, table_name):
         # Create indices for common query columns
         for col in ['pickup_datetime', 'dropoff_datetime', 'tip_amount', 'fare_amount', 'total_amount']:
             try:
-                conn.execute(f"CREATE INDEX IF NOT EXISTS idx_{table_name}_{col} ON {table_name}({col})")
-            except:
-                pass
-        conn.execute("COMMIT")
     except Exception as e:
-        conn.execute("ROLLBACK")
         raise e
 def list_documents():

                 # Create table name from filename
                 table_name = os.path.splitext(file_name)[0].replace(' ', '_').lower()
+                # Create a new connection for each file
                 conn = sqlite3.connect(DB_PATH)
+                # Load CSV into SQLite
+                file_info.append(f"Loading CSV file: {file_name}...")
                 load_csv_to_sqlite(file_path, conn, table_name)
                 # Update current context
                     "table_name": table_name
                 }
+                # Get basic info about the table
                 cursor = conn.cursor()
                 cursor.execute(f"SELECT COUNT(*) FROM {table_name};")
                 row_count = cursor.fetchone()[0]
+                cursor.execute(f"PRAGMA table_info({table_name});")
+                columns = [col[1] for col in cursor.fetchall()]
                 conn.close()
                 file_info.append("✅ CSV File Successfully Loaded")
                 file_info.append(f"📊 Table Name: {table_name}")
                 file_info.append(f"📈 Total Rows: {row_count:,}")
+                file_info.append(f"📋 Columns: {len(columns)}")
             except Exception as e:
                 file_info.append(f"❌ Error loading CSV {file_name}: {str(e)}")
+                # Print the full error for debugging
+                import traceback
+                print(traceback.format_exc())
         else:
             # Process PDF or other document types
     conn.execute("PRAGMA journal_mode = MEMORY")
     conn.execute("PRAGMA temp_store = MEMORY")
     conn.execute("PRAGMA cache_size = 10000")
     try:
+        # Start transaction manually
+        conn.execute("BEGIN TRANSACTION")
         # Read the CSV in chunks
         for i, chunk in enumerate(pd.read_csv(file_path, chunksize=chunksize)):
             # Optimize column types
         # Create indices for common query columns
         for col in ['pickup_datetime', 'dropoff_datetime', 'tip_amount', 'fare_amount', 'total_amount']:
             try:
+                if col in chunk.columns:  # Only create index if column exists
+                    conn.execute(f"CREATE INDEX IF NOT EXISTS idx_{table_name}_{col} ON {table_name}({col})")
+            except Exception as idx_error:
+                print(f"Warning: Could not create index on {col}: {str(idx_error)}")
+        # Commit the transaction
+        conn.commit()
+        print(f"Successfully loaded {table_name} into database")
     except Exception as e:
+        # Only try to rollback if we're in a transaction
+        try:
+            conn.rollback()
+        except:
+            pass  # If rollback fails, just continue
         raise e
 def list_documents():