jefalod committed on
Commit
0ce2499
·
verified ·
1 Parent(s): a9917b9

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +28 -58
app.py CHANGED
@@ -1,80 +1,50 @@
1
  import os
2
- from typing import List, Optional
3
-
4
  from langchain_community.document_loaders import TextLoader
5
- from langchain_community.embeddings import HuggingFaceEmbeddings
6
- from langchain_community.vectorstores import Chroma
7
  from langchain.text_splitter import RecursiveCharacterTextSplitter
 
 
8
  from langchain.chains import RetrievalQA
9
- from langchain.llms.base import LLM
10
- from groq import Groq
11
- import gradio as gr
12
-
13
# Make sure the sample document exists before the RAG pipeline tries to read it.
sample_content = (
    "# Sample Project\n\nThis project demonstrates an example of a LangChain-powered RAG pipeline. "
    "It uses FAISS for vector search and a GROQ-hosted LLaMA3 model for response generation.\n\n"
    "## Features\n- Document embedding\n- Vector similarity search\n- LLM-based QA over documents"
)
if not os.path.exists("sample_readme.txt"):
    with open("sample_readme.txt", "w") as f:
        f.write(sample_content)
21
 
22
# Read the source document from disk.
loader = TextLoader("sample_readme.txt")
documents = loader.load()

# Split into 500-character chunks with a 50-character overlap so retrieval
# snippets keep some surrounding context.
splitter_config = {"chunk_size": 500, "chunk_overlap": 50}
text_splitter = RecursiveCharacterTextSplitter(**splitter_config)
docs = text_splitter.split_documents(documents)

# Embed every chunk and persist the vectors in a local Chroma store.
embedding = HuggingFaceEmbeddings(model_name="all-MiniLM-L6-v2")
vectorstore = Chroma.from_documents(
    docs,
    embedding,
    persist_directory="rag_chroma_groq",
)
 
31
 
32
# Groq LLM
class GroqLLM(LLM):
    """Minimal LangChain ``LLM`` wrapper around the Groq chat-completions API."""

    model: str = "llama3-8b-8192"
    # Bug fix: the original read GROQ_API_KEY at class-definition time; when
    # the env var was unset the default was None and pydantic's ``str`` field
    # validation failed at import. Read it lazily in _call instead.
    api_key: Optional[str] = None
    temperature: float = 0.0

    def _call(self, prompt: str, stop: Optional[List[str]] = None) -> str:
        """Send ``prompt`` to Groq and return the assistant's reply text.

        Raises:
            RuntimeError: if no API key was supplied and GROQ_API_KEY is unset.
        """
        key = self.api_key or os.environ.get("GROQ_API_KEY")
        if not key:
            raise RuntimeError("GROQ_API_KEY is not set")
        client = Groq(api_key=key)
        messages = [
            {"role": "system", "content": "You are a helpful assistant."},
            {"role": "user", "content": prompt},
        ]
        response = client.chat.completions.create(
            model=self.model,
            messages=messages,
            temperature=self.temperature,
            # Bug fix: the original silently ignored ``stop``; forward it so
            # chains that rely on stop sequences behave correctly.
            stop=stop,
        )
        return response.choices[0].message.content

    @property
    def _llm_type(self) -> str:
        return "groq-llm"
54
 
55
# Wire the vector-store retriever and the Groq LLM into a RetrievalQA chain.
retriever = vectorstore.as_retriever()
groq_llm = GroqLLM()
qa_chain = RetrievalQA.from_chain_type(
    llm=groq_llm,
    retriever=retriever,
    return_source_documents=True,
)
63
 
 
 
 
 
 
64
# Gradio UI
def ask_question(query):
    """Answer ``query`` from the indexed README and list the source files."""
    response = qa_chain(query)
    source_names = [
        doc.metadata.get("source", "sample_readme.txt")
        for doc in response["source_documents"]
    ]
    answer = response["result"]
    sources = "\n".join(source_names)
    return f"### Answer:\n{answer}\n\n### Sources:\n{sources}"


demo = gr.Interface(
    fn=ask_question,
    inputs=gr.Textbox(label="Ask something about the README"),
    outputs=gr.Markdown(),
    title="📄 RAG Chatbot with Groq LLaMA3",
    description="Ask questions about a README file using a LangChain + Groq LLaMA3-powered chatbot.",
    theme="soft",
)
demo.launch()
 
1
  import os
2
+ import gradio as gr
 
3
  from langchain_community.document_loaders import TextLoader
 
 
4
  from langchain.text_splitter import RecursiveCharacterTextSplitter
5
+ from langchain_huggingface import HuggingFaceEmbeddings
6
+ from langchain_community.vectorstores import Chroma
7
  from langchain.chains import RetrievalQA
8
+ from langchain_groq import ChatGroq
 
 
 
 
 
 
 
 
 
 
 
9
 
10
# Load documents
# Bug fix: the previous revision created sample_readme.txt when missing; this
# revision dropped that guard, so TextLoader raised FileNotFoundError on a
# fresh deployment. Restore the guard before loading.
if not os.path.exists("sample_readme.txt"):
    with open("sample_readme.txt", "w") as f:
        f.write(
            "# Sample Project\n\nThis project demonstrates an example of a "
            "LangChain-powered RAG pipeline.\n\n## Features\n- Document embedding\n"
            "- Vector similarity search\n- LLM-based QA over documents"
        )

loader = TextLoader("sample_readme.txt")
documents = loader.load()

# Split into chunks (overlap keeps retrieval snippets contextual)
text_splitter = RecursiveCharacterTextSplitter(chunk_size=500, chunk_overlap=50)
docs = text_splitter.split_documents(documents)

# Create embeddings
embedding = HuggingFaceEmbeddings(model_name="all-MiniLM-L6-v2")

# Vector DB, persisted locally so repeated runs reuse the index
vectorstore = Chroma.from_documents(docs, embedding, persist_directory="rag_chroma_groq")
retriever = vectorstore.as_retriever()
24
 
25
# Groq LLM
# Robustness: fail fast with an actionable message when the key is missing,
# instead of a confusing authentication error on the first query.
_groq_api_key = os.getenv("GROQ_API_KEY")
if not _groq_api_key:
    raise RuntimeError("GROQ_API_KEY environment variable is not set")
groq_llm = ChatGroq(api_key=_groq_api_key, model_name="llama3-70b-8192")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
27
 
28
# RAG chain: retrieve relevant chunks, then let the Groq LLM answer over them.
qa_chain = RetrievalQA.from_chain_type(
    llm=groq_llm, retriever=retriever, return_source_documents=False
)
34
 
35
# Chat function
def chatbot_interface(user_query):
    """Run the RAG chain on ``user_query`` and return the answer text."""
    # ``Chain.__call__`` (qa_chain({...})) is deprecated since LangChain 0.1;
    # ``invoke`` is the supported entry point and returns the same dict.
    result = qa_chain.invoke({"query": user_query})
    return result["result"]
39
+
40
# Gradio UI
_ui_config = dict(
    fn=chatbot_interface,
    inputs=gr.Textbox(label="Ask a question about the document"),
    outputs=gr.Textbox(label="Answer"),
    title="RAG Chatbot with Groq + LangChain",
    description="Ask questions about sample_readme.txt using Groq LLM",
)
iface = gr.Interface(**_ui_config)

# Launch only when executed as a script, not when imported.
if __name__ == "__main__":
    iface.launch()