Spaces:

polinapred
/

CapstoneProject

Sleeping

App Files Files Community

polinapred committed on May 4

Commit

28fff8f

verified ·

1 Parent(s): ab57d69

still having errors? fixed indentation

Browse files

Files changed (1) hide show

app.py +12 -14

app.py CHANGED Viewed

@@ -5,7 +5,7 @@ import json
 import numpy as np
 import faiss
 from sentence_transformers import SentenceTransformer
-from bs4 import BeautifulSoup #help clean up the HTML tags in my JSON data
 hf_token = os.getenv("HF_Token")
 client = InferenceClient("Qwen/Qwen2.5-7B-Instruct", token=hf_token)
@@ -19,12 +19,10 @@ def preprocess_text(text):
         chunks.extend(i.split(". "))
     cleaned_chunks = []
     for chunk in chunks:
         chunk = chunk.strip()
         if len(chunk) > 0:
             cleaned_chunks.append(chunk)
     return cleaned_chunks
 def prepare_docs():
@@ -35,17 +33,16 @@ def prepare_docs():
     for item in raw_data:
         soup = BeautifulSoup(item['popup'], 'html.parser')
         raw_html_text = soup.get_text(separator=" ")
-    chunks = preprocess_text(raw_html_text)
-    for chunk in chunks:
-            all_processed_chunks.append(chunk)
     return all_processed_chunks
 processed_data = prepare_docs()
 embeddings = embed_model.encode(processed_data)
 index = faiss.IndexFlatL2(embeddings.shape[1])
 index.add(np.array(embeddings).astype('float32'))
@@ -70,8 +67,9 @@ def respond(message, history):
     messages = [{"role": "system", "content": system_prompt}]
-    for msg in history:
-        messages.append(msg)
     messages.append({"role": "user", "content": message})
@@ -90,9 +88,9 @@ def respond(message, history):
 chatbot = gr.ChatInterface(
     respond,
-    type="messages",
     title="CityScout: Unique Spot Finder",
-    description="Tell me your city and interests to find a cool spot!"
 )
-chatbot.launch()

 import numpy as np
 import faiss
 from sentence_transformers import SentenceTransformer
+from bs4 import BeautifulSoup
 hf_token = os.getenv("HF_Token")
 client = InferenceClient("Qwen/Qwen2.5-7B-Instruct", token=hf_token)
         chunks.extend(i.split(". "))
     cleaned_chunks = []
     for chunk in chunks:
         chunk = chunk.strip()
         if len(chunk) > 0:
             cleaned_chunks.append(chunk)
     return cleaned_chunks
 def prepare_docs():
     for item in raw_data:
         soup = BeautifulSoup(item['popup'], 'html.parser')
+        name = soup.find(class_='infobox-title').get_text() if soup.find(class_='infobox-title') else "Unknown Spot"
         raw_html_text = soup.get_text(separator=" ")
+        chunks = preprocess_text(raw_html_text)
+        for chunk in chunks:
+            all_processed_chunks.append(f"[{name}]: {chunk}")
     return all_processed_chunks
 processed_data = prepare_docs()
 embeddings = embed_model.encode(processed_data)
 index = faiss.IndexFlatL2(embeddings.shape[1])
 index.add(np.array(embeddings).astype('float32'))
     messages = [{"role": "system", "content": system_prompt}]
+    for user_msg, assistant_msg in history:
+        if user_msg: messages.append({"role": "user", "content": user_msg})
+        if assistant_msg: messages.append({"role": "assistant", "content": assistant_msg})
     messages.append({"role": "user", "content": message})
 chatbot = gr.ChatInterface(
     respond,
     title="CityScout: Unique Spot Finder",
+    description="Tell me your city or interests (e.g. 'mummies' or 'New York')!"
 )
+if __name__ == "__main__":
+    chatbot.launch()