Spaces:

gk2410
/

NaturalDisasters

Sleeping

App Files Community

gk2410 committed on Jun 12, 2025

Commit

3131056

verified ·

1 Parent(s): 54fe94f

chromadb - v2

Browse files

Files changed (1) hide show

app.py +20 -12

app.py CHANGED Viewed

@@ -1,4 +1,4 @@
-import os
 import shutil
 import streamlit as st
 import chromadb
@@ -9,15 +9,19 @@ from weather import get_weather_summary
 from travel import get_travel_spots
 import spacy
-# Clean up previous DB state (important for Spaces or clean reboots)
 if os.path.exists("/tmp/chroma"):
     shutil.rmtree("/tmp/chroma")
-# Initialize ChromaDB with proper settings
-client = chromadb.Client(Settings(
     chroma_db_impl="duckdb+parquet",
     persist_directory="/tmp/chroma"
-))
 db = client.get_or_create_collection("disaster_news")
 # Load models
@@ -25,11 +29,11 @@ embed_model = SentenceTransformer("all-MiniLM-L6-v2")
 qa_pipeline = pipeline("text2text-generation", model="google/flan-t5-base")
 nlp = spacy.load("en_core_web_sm")
-# Keyword lists
 weather_keywords = ["weather", "forecast", "rain", "snow", "temperature", "wind", "climate", "humid", "cold", "hot"]
 travel_keywords = ["visit", "travel", "tourist", "see", "go", "spots", "places", "explore", "attractions"]
-# Extract location and intent
 def extract_location_and_intent(query):
     doc = nlp(query)
     locations = [ent.text for ent in doc.ents if ent.label_ in ("GPE", "LOC")]
@@ -38,7 +42,7 @@ def extract_location_and_intent(query):
     is_travel = any(word in query.lower() for word in travel_keywords)
     return location, is_weather, is_travel
-# Fallback RAG response
 def query_rag_system(query):
     query_emb = embed_model.encode(query).tolist()
     results = db.query(query_embeddings=[query_emb], n_results=5)
@@ -55,20 +59,16 @@ user_input = st.text_input("Ask anything (e.g. 'Rain forecast in Pune', 'Places
 if st.button("Submit") and user_input:
     location, is_weather, is_travel = extract_location_and_intent(user_input)
     response_parts = []
-    # Weather
     if is_weather and location:
         weather_summary = get_weather_summary(location)
         response_parts.append(weather_summary)
-    # Travel
     if is_travel and location:
         travel_suggestions = get_travel_spots(location)
         response_parts.append(travel_suggestions)
-    # RAG fallback
     if not is_weather and not is_travel:
         rag_response = query_rag_system(user_input)
         response_parts.append(rag_response)
@@ -79,3 +79,11 @@ if st.button("Submit") and user_input:
     st.markdown("### 🔎 Response:")
     for part in response_parts:
         st.write(part)

+from chromadb.config import Settings
+import os
 import shutil
 import streamlit as st
 import chromadb
 from travel import get_travel_spots
 import spacy
+# Force Chroma to use a valid persist directory
+os.environ["PERSIST_DIRECTORY"] = "/tmp/chroma"
+# Clean up any stale DB state (optional but avoids schema errors)
 if os.path.exists("/tmp/chroma"):
     shutil.rmtree("/tmp/chroma")
+# Initialize Chroma with valid settings
+settings = Settings(
     chroma_db_impl="duckdb+parquet",
     persist_directory="/tmp/chroma"
+)
+client = chromadb.Client(settings)
 db = client.get_or_create_collection("disaster_news")
 # Load models
 qa_pipeline = pipeline("text2text-generation", model="google/flan-t5-base")
 nlp = spacy.load("en_core_web_sm")
+# Define keyword lists
 weather_keywords = ["weather", "forecast", "rain", "snow", "temperature", "wind", "climate", "humid", "cold", "hot"]
 travel_keywords = ["visit", "travel", "tourist", "see", "go", "spots", "places", "explore", "attractions"]
+# Extract location and user intent
 def extract_location_and_intent(query):
     doc = nlp(query)
     locations = [ent.text for ent in doc.ents if ent.label_ in ("GPE", "LOC")]
     is_travel = any(word in query.lower() for word in travel_keywords)
     return location, is_weather, is_travel
+# Fallback: semantic search + QA
 def query_rag_system(query):
     query_emb = embed_model.encode(query).tolist()
     results = db.query(query_embeddings=[query_emb], n_results=5)
 if st.button("Submit") and user_input:
     location, is_weather, is_travel = extract_location_and_intent(user_input)
     response_parts = []
     if is_weather and location:
         weather_summary = get_weather_summary(location)
         response_parts.append(weather_summary)
     if is_travel and location:
         travel_suggestions = get_travel_spots(location)
         response_parts.append(travel_suggestions)
     if not is_weather and not is_travel:
         rag_response = query_rag_system(user_input)
         response_parts.append(rag_response)
     st.markdown("### 🔎 Response:")
     for part in response_parts:
         st.write(part)
+settings = Settings(
+    chroma_db_impl="duckdb+parquet",
+    persist_directory="/tmp/chroma"  # must not be None
+)
+client = chromadb.Client(settings)