Hugging Face Space page capture (Space status: Runtime error).
Commit: "Upload app.py with huggingface_hub" — app.py ADDED (169 lines, @@ -0,0 +1,169 @@).
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
import gradio as gr
from langchain_community.document_loaders import PyPDFLoader
from langchain_text_splitters import RecursiveCharacterTextSplitter
from langchain_huggingface import HuggingFaceEmbeddings
from langchain_community.vectorstores import FAISS
from huggingface_hub import InferenceClient
import tempfile
import os

# Embedding model — small enough to run on the free-tier CPU.
embedding_model = HuggingFaceEmbeddings(
    model_name="sentence-transformers/all-MiniLM-L6-v2",
    model_kwargs={'device': 'cpu'},
)

# Text-generation client backed by the free HF Inference API.
client = InferenceClient(model="HuggingFaceH4/zephyr-7b-beta")

# Vector store built by process_pdf() and read by answer_question().
# NOTE(review): this is module-level state shared by every session of the
# Space — concurrent users would overwrite each other's document; confirm
# single-user usage is acceptable, or move to gr.State.
vectorstore = None
def process_pdf(pdf_file):
    """Load a PDF, split it into chunks, and build the FAISS vector store.

    Args:
        pdf_file: Value from the ``gr.File`` input — either a filepath
            string (Gradio >= 4 default, ``type="filepath"``) or a
            tempfile-like object with a ``.name`` attribute (older Gradio).

    Returns:
        A human-readable status string for the Status textbox.
    """
    global vectorstore

    if pdf_file is None:
        return "Please upload a PDF file."

    try:
        # BUG FIX: gr.File may hand us a plain path string, not an object
        # with a .name attribute; the original `pdf_file.name` raised
        # AttributeError on modern Gradio. Support both shapes.
        pdf_path = pdf_file if isinstance(pdf_file, str) else pdf_file.name

        # Load PDF pages as LangChain documents (one document per page).
        loader = PyPDFLoader(pdf_path)
        documents = loader.load()

        # Split into overlapping chunks so retrieval keeps local context.
        text_splitter = RecursiveCharacterTextSplitter(
            chunk_size=1000,
            chunk_overlap=200,
        )
        chunks = text_splitter.split_documents(documents)

        # Embed the chunks and index them in FAISS.
        vectorstore = FAISS.from_documents(
            documents=chunks,
            embedding=embedding_model,
        )

        return (
            f"✅ Successfully processed {len(documents)} pages into "
            f"{len(chunks)} chunks. You can now ask questions!"
        )

    except Exception as e:
        # Surface the failure in the Status box instead of crashing the UI.
        return f"❌ Error processing PDF: {str(e)}"
def answer_question(question):
    """Answer a question about the processed PDF via retrieval-augmented generation.

    Args:
        question: Free-text question from the UI textbox (may be None or empty).

    Returns:
        Tuple ``(answer_text, sources_text)`` for the Answer and Sources boxes.
    """
    global vectorstore

    if vectorstore is None:
        return "Please upload and process a PDF first.", ""

    # BUG FIX: guard against None as well as whitespace-only input; the
    # original `question.strip()` raised AttributeError when question was None.
    if not question or not question.strip():
        return "Please enter a question.", ""

    try:
        # Retrieve the 3 chunks most similar to the question.
        docs = vectorstore.similarity_search(question, k=3)

        # Concatenate the retrieved chunks into one context string.
        context = "\n\n".join(doc.page_content for doc in docs)

        # Zephyr chat template: system / user / assistant turns.
        prompt = f"""<|system|>
You are a helpful assistant that answers questions based on the provided context. Only use information from the context to answer. If the answer is not in the context, say "I cannot find this information in the document."
</s>
<|user|>
Context:
{context}

Question: {question}
</s>
<|assistant|>"""

        # Generate the answer with the hosted Inference API.
        response = client.text_generation(
            prompt,
            max_new_tokens=512,
            temperature=0.7,
        )

        # Build a one-line citation per retrieved chunk.
        sources = []
        for i, doc in enumerate(docs, 1):
            page = doc.metadata.get('page', 'N/A')
            if isinstance(page, int):
                # PyPDF page metadata is 0-indexed; show 1-indexed to the user.
                page += 1
            preview = doc.page_content[:150].replace('\n', ' ')
            sources.append(f"{i}. Page {page}: {preview}...")

        sources_text = "\n".join(sources)

        # Models commonly emit leading whitespace after the <|assistant|> tag;
        # strip it so the Answer box starts cleanly.
        return response.strip(), sources_text

    except Exception as e:
        return f"❌ Error: {str(e)}", ""
# Create Gradio interface: left column = upload/process, right column = Q&A.
# FIX: UI strings below had emoji characters garbled by a mis-encoded copy
# ("π", "β", "β οΈ"); reconstructed as plausible emoji — confirm against the
# original app if available.
with gr.Blocks(theme=gr.themes.Soft()) as demo:
    gr.Markdown("""
    # 📚 RAG Document Q&A System

    Upload a PDF document and ask questions about its content.

    **How it works:**
    1. Upload a PDF file
    2. Click "Process PDF" to analyze the document
    3. Ask questions about the document content
    """)

    with gr.Row():
        with gr.Column(scale=1):
            pdf_input = gr.File(label="Upload PDF", file_types=[".pdf"])
            process_btn = gr.Button("📄 Process PDF", variant="primary")
            status_output = gr.Textbox(label="Status", interactive=False)

        with gr.Column(scale=2):
            question_input = gr.Textbox(
                label="Your Question",
                placeholder="What is this document about?",
                lines=2,
            )
            ask_btn = gr.Button("🔍 Ask Question", variant="primary")
            answer_output = gr.Textbox(label="Answer", lines=6, interactive=False)
            sources_output = gr.Textbox(label="Sources", lines=4, interactive=False)

    gr.Markdown("""
    ---
    ### 🛠️ Technical Details

    | Component | Technology |
    |-----------|------------|
    | Embeddings | sentence-transformers/all-MiniLM-L6-v2 |
    | Vector Store | FAISS |
    | LLM | Zephyr-7B via Inference API |
    | Chunking | 1000 chars, 200 overlap |

    ### ⚠️ Development Challenges Documented

    This project encountered several technical challenges:
    - **LangChain API changes**: Package restructuring required updated imports
    - **PDF parsing issues**: Required proper HTTP headers for downloads
    - **LLM response quality**: FLAN-T5 produced short responses; switched to Zephyr-7B
    - **Memory management**: Required explicit GPU cleanup between model loads

    Built by [Nav772](https://huggingface.co/Nav772) as part of AI Engineering portfolio.
    """)

    # Connect buttons to their handler functions.
    process_btn.click(
        fn=process_pdf,
        inputs=[pdf_input],
        outputs=[status_output],
    )

    ask_btn.click(
        fn=answer_question,
        inputs=[question_input],
        outputs=[answer_output, sources_output],
    )

# Spaces convention: launch at module top level.
demo.launch()