Spaces:

ZunairaHawwar
/

IcodeGuru_Chatbot

Sleeping

App Files Community

ZunairaHawwar committed on Jul 27, 2025

Commit

50adcc7

verified ·

1 Parent(s): 6e9c490

Update app.py

Browse files

Files changed (1) hide show

app.py +329 -58

app.py CHANGED Viewed

@@ -92,15 +92,15 @@ class LangChainRAGSystem:
         Use the following context to answer the user's question comprehensively and accurately.
         Always provide relevant video links, website links, or resources when available in the context.
         If you don't know the answer based on the context, say so clearly.
         Context: {context}
         Chat History: {chat_history}
         Human: {question}
         Assistant: I'll help you with that based on the iCodeGuru knowledge base.
         """
         PROMPT = PromptTemplate(
@@ -108,7 +108,8 @@ class LangChainRAGSystem:
             input_variables=["context", "chat_history", "question"]
         )
-        if self.vectorstore and self.vectorstore._collection.count() > 0:
             # Create retriever
             retriever = self.vectorstore.as_retriever(
                 search_type="similarity",
@@ -124,8 +125,11 @@ class LangChainRAGSystem:
                 return_source_documents=True,
                 verbose=True
             )
-        else:
-            st.warning("⚠️ No documents in knowledge base. Please refresh the knowledge base first.")
     def load_and_process_documents(self) -> List[Document]:
         """Load and process JSON documents from the docs directory."""
@@ -230,15 +234,22 @@ class LangChainRAGSystem:
                 st.success(f"✅ Successfully ingested {len(chunks)} document chunks!")
-                # Recreate retrieval chain with new data
                 self.setup_retrieval_chain()
                 return True
             except Exception as e:
                 st.error(f"❌ Error during ingestion: {str(e)}")
                 return False
     def get_answer(self, question: str) -> dict:
         """Get answer for a user question."""
         if not self.retrieval_chain:
@@ -248,9 +259,28 @@ class LangChainRAGSystem:
             }
         try:
             # Get response from the chain
             response = self.retrieval_chain({"question": question})
             return response
         except Exception as e:
             return {
                 "answer": f"❌ Error getting answer: {str(e)}",
@@ -269,7 +299,7 @@ def get_rag_system():
     return LangChainRAGSystem()
 def main():
-    """Main Streamlit application."""
     st.set_page_config(
         page_title="EduBot for iCodeGuru",
         page_icon="🎓",
@@ -277,89 +307,317 @@ def main():
         initial_sidebar_state="expanded"
     )
-    # Header
-    st.title("🎓 EduBot for @icodeguru0")
-    st.markdown("**Powered by LangChain** | Ask anything based on pre-loaded iCodeGuru knowledge.")
     # Initialize RAG system
     rag_system = get_rag_system()
-    # Sidebar for admin functions
     with st.sidebar:
-        st.header("⚙️ Admin Panel")
-        if st.button("🔄 Refresh Knowledge Base", type="primary"):
-            success = rag_system.ingest_documents()
-            if success:
-                st.balloons()
-        if st.button("🗑️ Clear Conversation"):
-            rag_system.reset_conversation()
         st.markdown("---")
-        st.subheader("📊 System Info")
-        # Show vectorstore stats
         if rag_system.vectorstore:
             try:
                 doc_count = rag_system.vectorstore._collection.count()
-                st.metric("Documents in KB", doc_count)
             except:
-                st.metric("Documents in KB", "N/A")
         st.markdown("---")
-        st.caption("🧠 **ChromaDB** for vector storage")
-        st.caption("⚡ **Groq LLM** for answers")
-        st.caption("🔗 **LangChain** for orchestration")
-    # Main chat interface
-    st.markdown("---")
-    # Initialize session state for chat history
     if "messages" not in st.session_state:
         st.session_state.messages = []
-    # Display chat history
-    for message in st.session_state.messages:
-        with st.chat_message(message["role"]):
-            st.markdown(message["content"])
-            if "sources" in message and message["sources"]:
-                with st.expander("📚 Sources"):
-                    for i, source in enumerate(message["sources"], 1):
-                        st.markdown(f"**Source {i}:** {source}")
-    # User input
-    if prompt := st.chat_input("💬 Ask your question about iCodeGuru..."):
-        # Add user message to chat history
-        st.session_state.messages.append({"role": "user", "content": prompt})
         # Display user message
         with st.chat_message("user"):
-            st.markdown(prompt)
-        # Get assistant response
         with st.chat_message("assistant"):
-            with st.spinner("🤔 Thinking..."):
-                response = rag_system.get_answer(prompt)
-                answer = response.get("answer", "No answer available.")
                 source_docs = response.get("source_documents", [])
                 st.markdown(answer)
-                # Show sources if available
                 if source_docs:
                     sources = []
-                    for doc in source_docs[:3]:  # Show top 3 sources
-                        source = doc.metadata.get('source_file', 'Unknown source')
-                        content_preview = doc.page_content[:100] + "..." if len(doc.page_content) > 100 else doc.page_content
-                        sources.append(f"{source}: {content_preview}")
                     if sources:
-                        with st.expander("📚 Sources"):
                             for i, source in enumerate(sources, 1):
-                                st.markdown(f"**Source {i}:** {source}")
-                        # Add to session state with sources
                         st.session_state.messages.append({
                             "role": "assistant",
                             "content": answer,
@@ -369,6 +627,19 @@ def main():
                         st.session_state.messages.append({"role": "assistant", "content": answer})
                 else:
                     st.session_state.messages.append({"role": "assistant", "content": answer})
 if __name__ == "__main__":
     main()

         Use the following context to answer the user's question comprehensively and accurately.
         Always provide relevant video links, website links, or resources when available in the context.
         If you don't know the answer based on the context, say so clearly.
         Context: {context}
         Chat History: {chat_history}
         Human: {question}
         Assistant: I'll help you with that based on the iCodeGuru knowledge base.
         """
         PROMPT = PromptTemplate(
             input_variables=["context", "chat_history", "question"]
         )
+        # Always try to create retriever - let it handle empty collections gracefully
+        try:
             # Create retriever
             retriever = self.vectorstore.as_retriever(
                 search_type="similarity",
                 return_source_documents=True,
                 verbose=True
             )
+            st.success("✅ Retrieval chain setup successfully!")
+        except Exception as e:
+            st.warning(f"⚠️ Retrieval chain setup issue: {str(e)}")
+            self.retrieval_chain = None
     def load_and_process_documents(self) -> List[Document]:
         """Load and process JSON documents from the docs directory."""
                 st.success(f"✅ Successfully ingested {len(chunks)} document chunks!")
+                # Force recreate retrieval chain with new data
                 self.setup_retrieval_chain()
+                # Verify the setup worked
+                try:
+                    doc_count = self.vectorstore._collection.count()
+                    st.info(f"📊 Knowledge base now contains {doc_count} documents")
+                except:
+                    st.info("📊 Knowledge base updated successfully")
                 return True
             except Exception as e:
                 st.error(f"❌ Error during ingestion: {str(e)}")
                 return False
     def get_answer(self, question: str) -> dict:
         """Get answer for a user question."""
         if not self.retrieval_chain:
             }
         try:
+            # Check if vectorstore has documents before querying
+            doc_count = 0
+            try:
+                doc_count = self.vectorstore._collection.count()
+            except:
+                # If count fails, try a simple similarity search to test
+                try:
+                    test_results = self.vectorstore.similarity_search("test", k=1)
+                    doc_count = len(test_results) if test_results else 0
+                except:
+                    doc_count = 0
+            if doc_count == 0:
+                return {
+                    "answer": "⚠️ No documents found in knowledge base. Please refresh the knowledge base first.",
+                    "source_documents": []
+                }
             # Get response from the chain
             response = self.retrieval_chain({"question": question})
             return response
         except Exception as e:
             return {
                 "answer": f"❌ Error getting answer: {str(e)}",
     return LangChainRAGSystem()
 def main():
+    """Main Streamlit application with enhanced UI."""
     st.set_page_config(
         page_title="EduBot for iCodeGuru",
         page_icon="🎓",
         initial_sidebar_state="expanded"
     )
+    # Custom CSS for better styling
+    st.markdown("""
+    <style>
+    .main-header {
+        background: linear-gradient(90deg, #667eea 0%, #764ba2 100%);
+        padding: 2rem;
+        border-radius: 10px;
+        margin-bottom: 2rem;
+        text-align: center;
+    }
+    .main-header h1 {
+        color: white;
+        margin: 0;
+        font-size: 2.5rem;
+    }
+    .main-header p {
+        color: #f0f0f0;
+        margin: 0.5rem 0 0 0;
+        font-size: 1.1rem;
+    }
+    .metric-card {
+        background: #f8f9fa;
+        padding: 1rem;
+        border-radius: 10px;
+        border-left: 4px solid #667eea;
+        margin: 0.5rem 0;
+    }
+    .status-online {
+        color: #28a745;
+        font-weight: bold;
+    }
+    .status-offline {
+        color: #dc3545;
+        font-weight: bold;
+    }
+    .chat-input {
+        position: fixed;
+        bottom: 0;
+        background: white;
+        padding: 1rem;
+        border-top: 1px solid #e0e0e0;
+    }
+    .source-card {
+        background: #f8f9fa;
+        border: 1px solid #e9ecef;
+        border-radius: 8px;
+        padding: 0.8rem;
+        margin: 0.3rem 0;
+    }
+    .quick-action-btn {
+        background: linear-gradient(45deg, #667eea, #764ba2);
+        color: white;
+        border: none;
+        padding: 0.5rem 1rem;
+        border-radius: 20px;
+        margin: 0.2rem;
+    }
+    </style>
+    """, unsafe_allow_html=True)
+    # Enhanced Header
+    st.markdown("""
+    <div class="main-header">
+        <h1>🎓 EduBot for iCodeGuru</h1>
+        <p>Powered by LangChain | Your AI Programming Assistant</p>
+    </div>
+    """, unsafe_allow_html=True)
     # Initialize RAG system
     rag_system = get_rag_system()
+    # Enhanced Sidebar
     with st.sidebar:
+        st.markdown("### ⚙️ Control Panel")
+        # Status indicator
+        if rag_system.vectorstore:
+            try:
+                doc_count = rag_system.vectorstore._collection.count()
+                if doc_count > 0:
+                    st.markdown('<p class="status-online">🟢 System Online</p>', unsafe_allow_html=True)
+                else:
+                    st.markdown('<p class="status-offline">🔴 No Knowledge Base</p>', unsafe_allow_html=True)
+            except:
+                st.markdown('<p class="status-offline">🟡 System Loading</p>', unsafe_allow_html=True)
+        st.markdown("---")
+        # Admin Actions
+        col1, col2 = st.columns(2)
+        with col1:
+            if st.button("🔄 Refresh KB", type="primary", use_container_width=True):
+                with st.spinner("Loading documents..."):
+                    success = rag_system.ingest_documents()
+                    if success:
+                        st.balloons()
+                        st.success("Knowledge base updated!")
+                        st.rerun()
+        with col2:
+            if st.button("🗑️ Clear Chat", use_container_width=True):
+                rag_system.reset_conversation()
+                st.session_state.messages = []
+                st.rerun()
+        # Quick Actions
+        st.markdown("### ⚡ Quick Actions")
+        if st.button("📚 Show Available Topics", use_container_width=True):
+            st.session_state.show_topics = True
+        if st.button("💡 Get Random Tip", use_container_width=True):
+            random_questions = [
+                "What are the best programming practices?",
+                "How to optimize code performance?",
+                "What are common coding mistakes?",
+                "Explain object-oriented programming",
+                "What is the difference between frontend and backend?"
+            ]
+            import random
+            random_q = random.choice(random_questions)
+            st.session_state.messages.append({"role": "user", "content": f"🎲 {random_q}"})
+            st.rerun()
         st.markdown("---")
+        # Enhanced System Info
+        st.markdown("### 📊 System Statistics")
         if rag_system.vectorstore:
             try:
                 doc_count = rag_system.vectorstore._collection.count()
+                st.markdown(f"""
+                <div class="metric-card">
+                    <strong>📄 Documents:</strong><br>
+                    <span style="font-size: 1.5rem; color: #667eea;">{doc_count}</span>
+                </div>
+                """, unsafe_allow_html=True)
             except:
+                st.markdown("""
+                <div class="metric-card">
+                    <strong>📄 Documents:</strong><br>
+                    <span style="color: #dc3545;">N/A</span>
+                </div>
+                """, unsafe_allow_html=True)
+        # Conversation count
+        chat_count = len([msg for msg in st.session_state.get("messages", []) if msg["role"] == "user"])
+        st.markdown(f"""
+        <div class="metric-card">
+            <strong>💬 Questions Asked:</strong><br>
+            <span style="font-size: 1.5rem; color: #28a745;">{chat_count}</span>
+        </div>
+        """, unsafe_allow_html=True)
         st.markdown("---")
+        # Tech Stack
+        st.markdown("### 🛠️ Technology Stack")
+        tech_stack = {
+            "🧠": "ChromaDB",
+            "⚡": "Groq LLM",
+            "🔗": "LangChain",
+            "🎨": "Streamlit",
+            "🤗": "HuggingFace"
+        }
+        for icon, tech in tech_stack.items():
+            st.markdown(f"{icon} **{tech}**")
+        st.markdown("---")
+        st.markdown("*Built with ❤️ for iCodeGuru community*")
+    # Main Content Area
+    # Initialize session state
     if "messages" not in st.session_state:
         st.session_state.messages = []
+    if "show_topics" not in st.session_state:
+        st.session_state.show_topics = False
+    # Welcome message for new users
+    if len(st.session_state.messages) == 0:
+        st.markdown("""
+        ### 👋 Welcome to EduBot!
+        I'm your AI programming assistant, ready to help you with:
+        - **Programming concepts** and tutorials
+        - **Code examples** and best practices
+        - **Debugging** and troubleshooting
+        - **Learning resources** and recommendations
+        🚀 **Get started by asking me anything about programming!**
+        """)
+        # Sample questions
+        st.markdown("### 💡 Try these sample questions:")
+        sample_questions = [
+            "What is Python?",
+            "How to create a REST API?",
+            "Explain machine learning basics",
+            "Best practices for web development"
+        ]
+        cols = st.columns(2)
+        for i, question in enumerate(sample_questions):
+            with cols[i % 2]:
+                if st.button(f"❓ {question}", key=f"sample_{i}", use_container_width=True):
+                    st.session_state.messages.append({"role": "user", "content": question})
+                    st.rerun()
+    # Show topics if requested
+    if st.session_state.get("show_topics", False):
+        with st.expander("📚 Available Topics", expanded=True):
+            st.markdown("""
+            Based on your knowledge base, I can help with:
+            - Web Development (HTML, CSS, JavaScript)
+            - Python Programming
+            - Data Science & Machine Learning
+            - Database Management
+            - Software Engineering Practices
+            - API Development
+            - And much more!
+            *Ask me anything specific about these topics!*
+            """)
+            if st.button("Close Topics"):
+                st.session_state.show_topics = False
+                st.rerun()
+    # Chat History with Enhanced Styling
+    if st.session_state.messages:
+        st.markdown("### 💬 Conversation History")
+        for i, message in enumerate(st.session_state.messages):
+            with st.chat_message(message["role"]):
+                # Enhanced message display
+                if message["role"] == "user":
+                    st.markdown(f"**You:** {message['content']}")
+                else:
+                    st.markdown(message["content"])
+                    # Enhanced sources display
+                    if "sources" in message and message["sources"]:
+                        with st.expander(f"📚 Sources ({len(message['sources'])} found)", expanded=False):
+                            for j, source in enumerate(message["sources"], 1):
+                                st.markdown(f"""
+                                <div class="source-card">
+                                    <strong>Source {j}:</strong><br>
+                                    {source}
+                                </div>
+                                """, unsafe_allow_html=True)
+    # Enhanced User Input Area
+    st.markdown("---")
+    # Input with suggestions
+    col1, col2 = st.columns([4, 1])
+    with col1:
+        user_input = st.text_input(
+            "💬 Ask your question:",
+            placeholder="e.g., How do I create a Python function?",
+            key="user_input"
+        )
+    with col2:
+        send_button = st.button("Send 🚀", type="primary", use_container_width=True)
+    # Alternative chat input (modern style)
+    if prompt := st.chat_input("💬 Ask anything about programming..."):
+        user_input = prompt
+        send_button = True
+    # Process user input
+    if (send_button and user_input) or prompt:
+        question = user_input if send_button else prompt
+        # Add user message
+        st.session_state.messages.append({"role": "user", "content": question})
         # Display user message
         with st.chat_message("user"):
+            st.markdown(f"**You:** {question}")
+        # Get and display assistant response
         with st.chat_message("assistant"):
+            with st.spinner("🤔 Let me think about that..."):
+                response = rag_system.get_answer(question)
+                answer = response.get("answer", "I couldn't find an answer to that question.")
                 source_docs = response.get("source_documents", [])
                 st.markdown(answer)
+                # Enhanced sources display
                 if source_docs:
                     sources = []
+                    for doc in source_docs[:4]:  # Show top 4 sources
+                        source_file = doc.metadata.get('source_file', 'Unknown')
+                        content_preview = doc.page_content[:150] + "..." if len(doc.page_content) > 150 else doc.page_content
+                        sources.append(f"**{source_file}**\n{content_preview}")
                     if sources:
+                        with st.expander(f"📚 Sources ({len(sources)} found)", expanded=False):
                             for i, source in enumerate(sources, 1):
+                                st.markdown(f"""
+                                <div class="source-card">
+                                    <strong>📄 Source {i}:</strong><br>
+                                    {source}
+                                </div>
+                                """, unsafe_allow_html=True)
+                        # Add to session state
                         st.session_state.messages.append({
                             "role": "assistant",
                             "content": answer,
                         st.session_state.messages.append({"role": "assistant", "content": answer})
                 else:
                     st.session_state.messages.append({"role": "assistant", "content": answer})
+        # Clear input and rerun
+        if send_button:
+            st.rerun()
+    # Footer
+    st.markdown("---")
+    st.markdown("""
+    <div style="text-align: center; color: #666; padding: 1rem;">
+        <p>🎓 <strong>EduBot for iCodeGuru</strong> | Empowering developers worldwide</p>
+        <p>Made with ❤️ using Streamlit • LangChain • ChromaDB • Groq</p>
+    </div>
+    """, unsafe_allow_html=True)
 if __name__ == "__main__":
     main()