Spaces:

anikapro
/

capstone_project

Runtime error

App Files Files Community

anikapro committed on May 11, 2025

Commit

1db403f

verified ·

1 Parent(s): dd331e2

Add RAG using semantic search method and knowledge base

Browse files

Files changed (1) hide show

app.py +43 -1

app.py CHANGED Viewed

@@ -1,9 +1,51 @@
 import gradio as gr
 import random
 from huggingface_hub import InferenceClient
 client = InferenceClient("HuggingFaceH4/zephyr-7b-beta", provider='hf-inference')
 def respond(message, history):
     system_message = "You are a knowledgable and friendly chatbot that gives good information."
@@ -14,7 +56,7 @@ def respond(message, history):
     if history:
         messages.extend(history)
-    messages.append({"role": "user", "content": message})
     response = ""

 import gradio as gr
 import random
 from huggingface_hub import InferenceClient
+from sentence_transformers import SentenceTransformer
+import torch
 client = InferenceClient("HuggingFaceH4/zephyr-7b-beta", provider='hf-inference')
+# Read the whole knowledge base into memory once at start-up.
+with open("bookbans.txt", "r", encoding="utf-8") as file:
+  book_bans_text = file.read()
+# One chunk per line of the file; whitespace-only lines are discarded.
+cleaned_text = book_bans_text.strip()
+chunks = cleaned_text.split("\n")
+cleaned_chunks = [line.strip() for line in chunks if line.strip()]
+# Embed every cleaned chunk up front so each query only encodes the message.
+model = SentenceTransformer('all-MiniLM-L6-v2')
+chunk_embeddings = model.encode(cleaned_chunks, convert_to_tensor=True)
+# Return the chunk(s) most similar to the query, ranked by the cosine similarity of their embeddings.
+def get_top_chunk(message):
+  """Return the knowledge-base chunk(s) most similar to ``message``.
+
+  The message is embedded with the module-level ``model`` and compared
+  against the precomputed ``chunk_embeddings``.
+
+  Args:
+    message: The user's query text.
+
+  Returns:
+    A list holding the single best-matching entry of ``cleaned_chunks``.
+  """
+  query_embedding = model.encode(message, convert_to_tensor=True)
+  # Normalise both sides so the dot product below is cosine similarity.
+  query_embedding_normalized = query_embedding / query_embedding.norm()
+  chunk_embeddings_normalized = chunk_embeddings / chunk_embeddings.norm(dim=1, keepdim=True)
+  similarities = torch.matmul(chunk_embeddings_normalized, query_embedding_normalized)
+  top_indices = torch.topk(similarities, k=1).indices
+  # chunk_embeddings was built from cleaned_chunks, so the indices refer to
+  # that list; `chunks` still contains blank lines and would be misaligned.
+  return [cleaned_chunks[i] for i in top_indices.tolist()]
 def respond(message, history):
     system_message = "You are a knowledgable and friendly chatbot that gives good information."
     if history:
         messages.extend(history)
+    # A dict literal cannot hold a bare third element (the previous form was a
+    # syntax error), so the retrieved chunk(s) are folded into the text of the
+    # user message instead. get_top_chunk returns a list of strings.
+    retrieved_context = "\n".join(get_top_chunk(message))
+    messages.append({"role": "user", "content": f"Context:\n{retrieved_context}\n\nQuestion: {message}"})
     response = ""