Spaces:

akryldigital
/

audit_assistant

Sleeping

App Files Files Community

Ara Yeroyan committed on Oct 31

Commit

02d7f4f

1 Parent(s): 7c8b783

refactor and add sample questions

Browse files

Files changed (2) hide show

app.py +428 -211
smart_chatbot.py +4 -3

app.py CHANGED Viewed

@@ -3,7 +3,29 @@ Intelligent Audit Report Chatbot UI
 """
 import os
-import sys
 # ===== CRITICAL: Fix OMP_NUM_THREADS FIRST, before ANY other imports =====
 # Some libraries load at import time and will fail if OMP_NUM_THREADS is invalid
@@ -29,42 +51,30 @@ except (ValueError, TypeError):
 # ===== Setup HuggingFace cache directories BEFORE any model imports =====
 # CRITICAL: Set these before any imports that might use HuggingFace (like sentence-transformers)
-# This ensures models downloaded during Docker build are found at runtime
-cache_dir = "/app/.cache/huggingface"
-os.environ["HF_HOME"] = cache_dir
-os.environ["TRANSFORMERS_CACHE"] = cache_dir
-os.environ["HF_DATASETS_CACHE"] = cache_dir
-os.environ["HF_HUB_CACHE"] = cache_dir
-os.environ["SENTENCE_TRANSFORMERS_HOME"] = cache_dir
-# Ensure cache directory exists (created in Dockerfile, but ensure it's there)
-try:
-    os.makedirs(cache_dir, mode=0o755, exist_ok=True)
-except (PermissionError, OSError) as e:
-    # If we can't create it, log but continue (might already exist from Dockerfile)
-    # HuggingFace will try to create subdirectories, but we need parent to exist
-    pass
-import time
-import json
-import uuid
-import logging
-from pathlib import Path
-import argparse
-import streamlit as st
-from langchain_core.messages import HumanMessage, AIMessage
-from multi_agent_chatbot import get_multi_agent_chatbot
-from smart_chatbot import get_chatbot as get_smart_chatbot
-from src.reporting.feedback_schema import create_feedback_from_dict
 # Configure logging
 logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
 logger = logging.getLogger(__name__)
 # Log environment setup for debugging
-logger.info(f"📁 HuggingFace cache directory: {os.environ.get('HF_HOME', 'NOT SET')}")
 logger.info(f"🔧 OMP_NUM_THREADS: {os.environ.get('OMP_NUM_THREADS', 'NOT SET')}")
@@ -94,6 +104,54 @@ st.markdown("""
         margin-bottom: 2rem;
     }
     .session-info {
         background-color: #f0f2f6;
         padding: 10px;
@@ -218,10 +276,11 @@ def serialize_documents(sources):
 @st.cache_data
 def load_filter_options():
     try:
-        with open("src/config/filter_options.json", "r") as f:
             return json.load(f)
     except FileNotFoundError:
-        st.info([x for x in os.listdir() if x.endswith('.json')])
         st.error("filter_options.json not found. Please run the metadata analysis script.")
         return {"sources": [], "years": [], "districts": [], 'filenames': []}
@@ -254,16 +313,8 @@ def main():
         st.session_state.reset_conversation = False
         st.rerun()
-    # Header with system indicator
-    col1, col2 = st.columns([3, 1])
-    with col1:
-        st.markdown('<h1 class="main-header">🤖 Intelligent Audit Report Chatbot</h1>', unsafe_allow_html=True)
-    with col2:
-        system_type = get_system_type()
-        if "Multi-Agent" in system_type:
-            st.success(f"🔧 {system_type}")
-        else:
-            st.info(f"🔧 {system_type}")
     st.markdown('<p class="subtitle">Ask questions about audit reports. Use the sidebar filters to narrow down your search!</p>', unsafe_allow_html=True)
     # Session info
@@ -375,12 +426,85 @@ def main():
             if 'input_counter' not in st.session_state:
                 st.session_state.input_counter = 0
             user_input = st.text_input(
                 "Type your message here...",
                 placeholder="Ask about budget allocations, expenditures, or audit findings...",
-                key=f"user_input_{st.session_state.input_counter}",
-                label_visibility="collapsed"
             )
         with col2:
             send_button = st.button("Send", key="send_button", use_container_width=True)
@@ -389,12 +513,11 @@ def main():
         if st.button("🗑️ Clear Chat", key="clear_chat_button"):
             st.session_state.reset_conversation = True
             # Clear all conversation files
-            import os
-            conversations_dir = "conversations"
-            if os.path.exists(conversations_dir):
-                for file in os.listdir(conversations_dir):
-                    if file.endswith('.json'):
-                        os.remove(os.path.join(conversations_dir, file))
             st.rerun()
         # Handle user input
@@ -487,11 +610,11 @@ def main():
                     filename = getattr(doc, 'metadata', {}).get('filename', 'Unknown')
                     unique_filenames.add(filename)
-                st.markdown(f"**Found {len(sources)} document chunks from {len(unique_filenames)} unique documents (showing top 10):**")
                 if len(unique_filenames) < len(sources):
                     st.info(f"💡 **Note**: Each document is split into multiple chunks. You're seeing {len(sources)} chunks from {len(unique_filenames)} documents.")
-                for i, doc in enumerate(sources[:10]):  # Show top 10
                     # Get relevance score and ID if available
                     metadata = getattr(doc, 'metadata', {})
                     score = metadata.get('reranked_score', metadata.get('original_score', None))
@@ -543,180 +666,187 @@ def main():
         if 'feedback_submitted' not in st.session_state:
             st.session_state.feedback_submitted = False
-        # Feedback form
-        with st.form("feedback_form", clear_on_submit=False):
-            col1, col2 = st.columns([1, 1])
-            with col1:
-                feedback_score = st.slider(
-                    "Rate this conversation (1-5)",
-                    min_value=1,
-                    max_value=5,
-                    help="How satisfied are you with the conversation?"
-                )
-            with col2:
-                is_feedback_about_last_retrieval = st.checkbox(
-                    "Feedback about last retrieval only",
-                    value=True,
-                    help="If checked, feedback applies to the most recent document retrieval"
-                )
-            open_ended_feedback = st.text_area(
-                "Your feedback (optional)",
-                placeholder="Tell us what went well or what could be improved...",
-                height=100
-            )
-            # Disable submit if no score selected
-            submit_disabled = feedback_score is None
-            submitted = st.form_submit_button(
-                "📤 Submit Feedback",
-                use_container_width=True,
-                disabled=submit_disabled
-            )
-            if submitted and not st.session_state.feedback_submitted:
-                # Log the feedback data being submitted
-                print("=" * 80)
-                print("🔄 FEEDBACK SUBMISSION: Starting...")
-                print("=" * 80)
-                st.write("🔍 **Debug: Feedback Data Being Submitted:**")
-                # Create feedback data dictionary
-                feedback_dict = {
-                    "open_ended_feedback": open_ended_feedback,
-                    "score": feedback_score,
-                    "is_feedback_about_last_retrieval": is_feedback_about_last_retrieval,
-                    "retrieved_data": st.session_state.rag_retrieval_history.copy() if st.session_state.rag_retrieval_history else [],
-                    "conversation_id": st.session_state.conversation_id,
-                    "timestamp": time.time(),
-                    "message_count": len(st.session_state.messages),
-                    "has_retrievals": has_retrievals,
-                    "retrieval_count": len(st.session_state.rag_retrieval_history)
-                }
-                print(f"📝 FEEDBACK SUBMISSION: Score={feedback_score}, Retrievals={len(st.session_state.rag_retrieval_history) if st.session_state.rag_retrieval_history else 0}")
-                # Create UserFeedback dataclass instance
-                feedback_obj = None  # Initialize outside try block
-                try:
-                    feedback_obj = create_feedback_from_dict(feedback_dict)
-                    print(f"✅ FEEDBACK SUBMISSION: Feedback object created - ID={feedback_obj.feedback_id}")
-                    st.write(f"✅ **Feedback Object Created**")
-                    st.write(f"- Feedback ID: {feedback_obj.feedback_id}")
-                    st.write(f"- Score: {feedback_obj.score}/5")
-                    st.write(f"- Has Retrievals: {feedback_obj.has_retrievals}")
-                    # Convert back to dict for JSON serialization
-                    feedback_data = feedback_obj.to_dict()
-                except Exception as e:
-                    print(f"❌ FEEDBACK SUBMISSION: Failed to create feedback object: {e}")
-                    st.error(f"Failed to create feedback object: {e}")
-                    feedback_data = feedback_dict
-                # Display the data being submitted
-                st.json(feedback_data)
-                # Save feedback to file - use absolute path in /app to ensure writability
-                feedback_dir = Path("/app/feedback")
-                try:
-                    # Ensure directory exists with write permissions (777 for compatibility)
-                    feedback_dir.mkdir(parents=True, mode=0o777, exist_ok=True)
-                except (PermissionError, OSError) as e:
-                    logger.warning(f"Could not create feedback directory at {feedback_dir}: {e}")
-                    # Fallback to relative path
-                    feedback_dir = Path("feedback")
-                    feedback_dir.mkdir(parents=True, mode=0o777, exist_ok=True)
-                feedback_file = feedback_dir / f"feedback_{st.session_state.conversation_id}_{int(time.time())}.json"
-                try:
-                    # Ensure parent directory exists before writing
-                    feedback_file.parent.mkdir(parents=True, mode=0o777, exist_ok=True)
-                    # Save to local file
-                    print(f"💾 FEEDBACK SAVE: Saving to local file: {feedback_file}")
-                    with open(feedback_file, 'w') as f:
-                        json.dump(feedback_data, f, indent=2, default=str)
-                    print(f"✅ FEEDBACK SAVE: Local file saved successfully")
-                    st.success("✅ Thank you for your feedback! It has been saved locally.")
-                    st.balloons()
-                    # Save to Snowflake if enabled and credentials available
-                    logger.info("🔄 FEEDBACK SAVE: Starting Snowflake save process...")
-                    logger.info(f"📊 FEEDBACK SAVE: feedback_obj={'exists' if feedback_obj else 'None'}")
                     try:
-                        import os
-                        snowflake_enabled = os.getenv("SNOWFLAKE_ENABLED", "false").lower() == "true"
-                        logger.info(f"🔍 SNOWFLAKE CHECK: enabled={snowflake_enabled}")
-                        if snowflake_enabled:
-                            if feedback_obj:
-                                try:
-                                    from src.reporting.snowflake_connector import save_to_snowflake
-                                    logger.info("📤 SNOWFLAKE UI: Attempting to save feedback to Snowflake...")
-                                    print("📤 SNOWFLAKE UI: Attempting to save feedback to Snowflake...")  # Also print to terminal
-                                    if save_to_snowflake(feedback_obj):
-                                        logger.info("✅ SNOWFLAKE UI: Successfully saved to Snowflake")
-                                        print("✅ SNOWFLAKE UI: Successfully saved to Snowflake")  # Also print to terminal
-                                        st.success("✅ Feedback also saved to Snowflake!")
-                                    else:
-                                        logger.warning("⚠️ SNOWFLAKE UI: Save failed")
-                                        print("⚠️ SNOWFLAKE UI: Save failed")  # Also print to terminal
-                                        st.warning("⚠️ Snowflake save failed, but local save succeeded")
-                                except Exception as e:
-                                    logger.error(f"❌ SNOWFLAKE UI ERROR: {e}")
-                                    print(f"❌ SNOWFLAKE UI ERROR: {e}")  # Also print to terminal
-                                    import traceback
-                                    traceback.print_exc()  # Print full traceback to terminal
-                                    st.warning(f"⚠️ Could not save to Snowflake: {e}")
-                            else:
-                                logger.warning("⚠️ SNOWFLAKE UI: Skipping (feedback object not created)")
-                                print("⚠️ SNOWFLAKE UI: Skipping (feedback object not created)")  # Also print to terminal
-                                st.warning("⚠️ Skipping Snowflake save (feedback object not created)")
-                        else:
-                            logger.info("💡 SNOWFLAKE UI: Integration disabled")
-                            print("💡 SNOWFLAKE UI: Integration disabled")  # Also print to terminal
-                            st.info("💡 Snowflake integration disabled (set SNOWFLAKE_ENABLED=true to enable)")
-                    except NameError as e:
-                        import traceback
-                        traceback.print_exc()
-                        logger.error(f"❌ NameError in Snowflake save: {e}")
-                        print(f"❌ NameError in Snowflake save: {e}")  # Also print to terminal
-                        st.warning(f"⚠️ Snowflake save error: {e}")
                     except Exception as e:
-                        logger.error(f"❌ Exception in Snowflake save: {type(e).__name__}: {e}")
-                        print(f"❌ Exception in Snowflake save: {type(e).__name__}: {e}")  # Also print to terminal
-                        st.warning(f"⚠️ Snowflake save error: {e}")
-                    # Mark feedback as submitted to prevent resubmission
-                    st.session_state.feedback_submitted = True
-                    print("=" * 80)
-                    print(f"✅ FEEDBACK SUBMISSION: Completed successfully")
-                    print("=" * 80)
-                    # Log file location
-                    st.info(f"📁 Feedback saved to: {feedback_file}")
-                except Exception as e:
-                    print(f"❌ FEEDBACK SUBMISSION: Error saving feedback: {e}")
-                    print(f"❌ FEEDBACK SUBMISSION: Error type: {type(e).__name__}")
-                    import traceback
-                    traceback.print_exc()
-                    st.error(f"❌ Error saving feedback: {e}")
-                    st.write(f"Debug error: {str(e)}")
-            elif st.session_state.feedback_submitted:
-                st.success("✅ Feedback already submitted for this conversation!")
-                if st.button("🔄 Submit New Feedback", key="new_feedback_button"):
-                    st.session_state.feedback_submitted = False
-                    st.rerun()
     # Display retrieval history stats
     if st.session_state.rag_retrieval_history:
@@ -738,6 +868,93 @@ def main():
                 })
                 st.markdown("---")
     # Auto-scroll to bottom
     st.markdown("""
     <script>

 """
 import os
+import time
+import json
+import uuid
+import logging
+import traceback
+from pathlib import Path
+import streamlit as st
+from langchain_core.messages import HumanMessage, AIMessage
+from multi_agent_chatbot import get_multi_agent_chatbot
+from smart_chatbot import get_chatbot as get_smart_chatbot
+from src.reporting.feedback_schema import create_feedback_from_dict
+from src.reporting.snowflake_connector import save_to_snowflake
+from src.config.paths import (
+    IS_DEPLOYED,
+    PROJECT_DIR,
+    HF_CACHE_DIR,
+    FEEDBACK_DIR,
+    CONVERSATIONS_DIR,
+)
 # ===== CRITICAL: Fix OMP_NUM_THREADS FIRST, before ANY other imports =====
 # Some libraries load at import time and will fail if OMP_NUM_THREADS is invalid
 # ===== Setup HuggingFace cache directories BEFORE any model imports =====
 # CRITICAL: Set these before any imports that might use HuggingFace (like sentence-transformers)
+# Only override cache directories in deployed environment (local uses defaults)
+if IS_DEPLOYED and HF_CACHE_DIR:
+    cache_dir = str(HF_CACHE_DIR)
+    os.environ["HF_HOME"] = cache_dir
+    os.environ["TRANSFORMERS_CACHE"] = cache_dir
+    os.environ["HF_DATASETS_CACHE"] = cache_dir
+    os.environ["HF_HUB_CACHE"] = cache_dir
+    os.environ["SENTENCE_TRANSFORMERS_HOME"] = cache_dir
+    # Ensure cache directory exists (created in Dockerfile, but ensure it's there)
+    try:
+        os.makedirs(cache_dir, mode=0o755, exist_ok=True)
+    except (PermissionError, OSError):
+        # If we can't create it, continue silently (it might already exist from the Dockerfile)
+        pass
 # Configure logging
 logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
 logger = logging.getLogger(__name__)
 # Log environment setup for debugging
+logger.info(f"🌍 Environment: {'DEPLOYED' if IS_DEPLOYED else 'LOCAL'}")
+logger.info(f"📁 PROJECT_DIR: {PROJECT_DIR}")
+logger.info(f"📁 HuggingFace cache: {os.environ.get('HF_HOME', 'DEFAULT (not overridden)')}")
 logger.info(f"🔧 OMP_NUM_THREADS: {os.environ.get('OMP_NUM_THREADS', 'NOT SET')}")
         margin-bottom: 2rem;
     }
+    .example-questions-header {
+        text-align: center;
+        margin-bottom: 1rem;
+    }
+    .example-questions-description {
+        text-align: center;
+        color: #666;
+        margin-bottom: 2rem;
+    }
+    /* Hide ALL default Streamlit text input help messages about Enter key */
+    /* This is the key one - hides "Press Enter to apply" message inside input field */
+    div[data-testid="InputInstructions"],
+    span[data-testid="InputInstructions"],
+    *[data-testid="InputInstructions"] {
+        display: none !important;
+        visibility: hidden !important;
+        opacity: 0 !important;
+        height: 0 !important;
+        width: 0 !important;
+        overflow: hidden !important;
+        position: absolute !important;
+        left: -9999px !important;
+    }
+    /* Also hide other potential locations */
+    div[data-testid="stTextInput"] + div > small,
+    div[data-testid="stTextInput"] ~ div > small,
+    div[data-testid="stTextInputContainer"] + div > small,
+    div[data-testid="stTextInputContainer"] ~ div > small,
+    div[data-baseweb="input"] + div > small,
+    div[data-baseweb="input"] ~ div > small {
+        display: none !important;
+        visibility: hidden !important;
+        opacity: 0 !important;
+        height: 0 !important;
+        overflow: hidden !important;
+    }
+    /* Custom help text for input */
+    .input-help-text {
+        font-size: 0.85rem;
+        color: #666;
+        margin-top: 0.25rem;
+        text-align: left;
+    }
     .session-info {
         background-color: #f0f2f6;
         padding: 10px;
 @st.cache_data
 def load_filter_options():
     try:
+        filter_options_path = PROJECT_DIR / "src" / "config" / "filter_options.json"
+        with open(filter_options_path, "r") as f:
             return json.load(f)
     except FileNotFoundError:
+        st.info(f"Looking for filter_options.json in: {PROJECT_DIR / 'src' / 'config'}")
         st.error("filter_options.json not found. Please run the metadata analysis script.")
         return {"sources": [], "years": [], "districts": [], 'filenames': []}
         st.session_state.reset_conversation = False
         st.rerun()
+    # Header - centered
+    st.markdown('<h1 class="main-header">🤖 Intelligent Audit Report Chatbot</h1>', unsafe_allow_html=True)
     st.markdown('<p class="subtitle">Ask questions about audit reports. Use the sidebar filters to narrow down your search!</p>', unsafe_allow_html=True)
     # Session info
             if 'input_counter' not in st.session_state:
                 st.session_state.input_counter = 0
+            # Handle pending question from example questions section
+            if 'pending_question' in st.session_state and st.session_state.pending_question:
+                default_value = st.session_state.pending_question
+                # Increment counter to force new input widget
+                st.session_state.input_counter = (st.session_state.get('input_counter', 0) + 1) % 1000
+                del st.session_state.pending_question
+                key_suffix = st.session_state.input_counter
+            else:
+                default_value = ""
+                key_suffix = st.session_state.input_counter
             user_input = st.text_input(
                 "Type your message here...",
                 placeholder="Ask about budget allocations, expenditures, or audit findings...",
+                key=f"user_input_{key_suffix}",
+                label_visibility="collapsed",
+                value=default_value if default_value else None
             )
+            # Use JavaScript to specifically target and hide "Press Enter to apply" message
+            st.markdown("""
+            <script>
+                (function() {
+                    // Hide InputInstructions element (contains "Press Enter to apply")
+                    function hideInputInstructions() {
+                        // Target the specific Streamlit element
+                        const instructions = document.querySelector('[data-testid="InputInstructions"]');
+                        if (instructions) {
+                            instructions.style.display = 'none';
+                            instructions.style.visibility = 'hidden';
+                            instructions.style.opacity = '0';
+                            instructions.style.height = '0';
+                            instructions.style.width = '0';
+                            instructions.style.overflow = 'hidden';
+                            instructions.style.position = 'absolute';
+                            instructions.style.left = '-9999px';
+                        }
+                        // Also search for any text containing "Press Enter" or "apply" inside input containers
+                        const allElements = document.querySelectorAll('*');
+                        allElements.forEach(el => {
+                            const text = el.textContent || el.innerText || '';
+                            if ((text.toLowerCase().includes('press enter') ||
+                                 text.toLowerCase().includes('enter to') ||
+                                 text.toLowerCase().includes('to apply')) &&
+                                (el.tagName === 'SPAN' || el.tagName === 'DIV' || el.tagName === 'SMALL')) {
+                                const style = window.getComputedStyle(el);
+                                const fontSize = parseFloat(style.fontSize);
+                                // Hide if it's small text (likely help text)
+                                if (fontSize < 14 || el.hasAttribute('data-testid')) {
+                                    el.style.display = 'none';
+                                    el.style.visibility = 'hidden';
+                                    el.style.height = '0';
+                                    el.style.overflow = 'hidden';
+                                }
+                            }
+                        });
+                    }
+                    // Run immediately and after delays to catch dynamic elements
+                    hideInputInstructions();
+                    setTimeout(hideInputInstructions, 50);
+                    setTimeout(hideInputInstructions, 100);
+                    setTimeout(hideInputInstructions, 500);
+                    // Observe for new elements added by Streamlit
+                    const observer = new MutationObserver(function(mutations) {
+                        hideInputInstructions();
+                    });
+                    observer.observe(document.body, { childList: true, subtree: true, attributes: true });
+                })();
+            </script>
+            """, unsafe_allow_html=True)
+            # # Show custom help text below input - this replaces the default "Press Enter" message
+            # st.markdown(
+            #     "<div class='input-help-text'>💡 Press the <strong>Send</strong> button to submit your question</div>",
+            #     unsafe_allow_html=True
+            # )
         with col2:
             send_button = st.button("Send", key="send_button", use_container_width=True)
         if st.button("🗑️ Clear Chat", key="clear_chat_button"):
             st.session_state.reset_conversation = True
             # Clear all conversation files
+            conversations_path = CONVERSATIONS_DIR
+            if conversations_path.exists():
+                for file in conversations_path.iterdir():
+                    if file.suffix == '.json':
+                        file.unlink()
             st.rerun()
         # Handle user input
                     filename = getattr(doc, 'metadata', {}).get('filename', 'Unknown')
                     unique_filenames.add(filename)
+                st.markdown(f"**Found {len(sources)} document chunks from {len(unique_filenames)} unique documents (showing top 20):**")
                 if len(unique_filenames) < len(sources):
                     st.info(f"💡 **Note**: Each document is split into multiple chunks. You're seeing {len(sources)} chunks from {len(unique_filenames)} documents.")
+                for i, doc in enumerate(sources):  # Show every retrieved chunk (no slice applied)
                     # Get relevance score and ID if available
                     metadata = getattr(doc, 'metadata', {})
                     score = metadata.get('reranked_score', metadata.get('original_score', None))
         if 'feedback_submitted' not in st.session_state:
             st.session_state.feedback_submitted = False
+        # Feedback form - only show if feedback not already submitted
+        if not st.session_state.feedback_submitted:
+            with st.form("feedback_form", clear_on_submit=False):
+                col1, col2 = st.columns([1, 1])
+                with col1:
+                    feedback_score = st.slider(
+                        "Rate this conversation (1-5)",
+                        min_value=1,
+                        max_value=5,
+                        help="How satisfied are you with the conversation?"
+                    )
+                with col2:
+                    is_feedback_about_last_retrieval = st.checkbox(
+                        "Feedback about last retrieval only",
+                        value=True,
+                        help="If checked, feedback applies to the most recent document retrieval"
+                    )
+                open_ended_feedback = st.text_area(
+                    "Your feedback (optional)",
+                    placeholder="Tell us what went well or what could be improved...",
+                    height=100
+                )
+                # Disable submit if no score selected
+                submit_disabled = feedback_score is None
+                submitted = st.form_submit_button(
+                    "📤 Submit Feedback",
+                    use_container_width=True,
+                    disabled=submit_disabled
+                )
+                if submitted:
+                    # Log the feedback data being submitted
+                    print("=" * 80)
+                    print("🔄 FEEDBACK SUBMISSION: Starting...")
+                    print("=" * 80)
+                    st.write("🔍 **Debug: Feedback Data Being Submitted:**")
+                    # Create feedback data dictionary
+                    feedback_dict = {
+                        "open_ended_feedback": open_ended_feedback,
+                        "score": feedback_score,
+                        "is_feedback_about_last_retrieval": is_feedback_about_last_retrieval,
+                        "retrieved_data": st.session_state.rag_retrieval_history.copy() if st.session_state.rag_retrieval_history else [],
+                        "conversation_id": st.session_state.conversation_id,
+                        "timestamp": time.time(),
+                        "message_count": len(st.session_state.messages),
+                        "has_retrievals": has_retrievals,
+                        "retrieval_count": len(st.session_state.rag_retrieval_history)
+                    }
+                    print(f"📝 FEEDBACK SUBMISSION: Score={feedback_score}, Retrievals={len(st.session_state.rag_retrieval_history) if st.session_state.rag_retrieval_history else 0}")
+                    # Create UserFeedback dataclass instance
+                    feedback_obj = None  # Initialize outside try block
                     try:
+                        feedback_obj = create_feedback_from_dict(feedback_dict)
+                        print(f"✅ FEEDBACK SUBMISSION: Feedback object created - ID={feedback_obj.feedback_id}")
+                        st.write(f"✅ **Feedback Object Created**")
+                        st.write(f"- Feedback ID: {feedback_obj.feedback_id}")
+                        st.write(f"- Score: {feedback_obj.score}/5")
+                        st.write(f"- Has Retrievals: {feedback_obj.has_retrievals}")
+                        # Convert back to dict for JSON serialization
+                        feedback_data = feedback_obj.to_dict()
                     except Exception as e:
+                        print(f"❌ FEEDBACK SUBMISSION: Failed to create feedback object: {e}")
+                        st.error(f"Failed to create feedback object: {e}")
+                        feedback_data = feedback_dict
+                    # Display the data being submitted
+                    st.json(feedback_data)
+                    # Save feedback to file - use PROJECT_DIR to ensure writability
+                    feedback_dir = FEEDBACK_DIR
+                    try:
+                        # Ensure directory exists with write permissions (777 for compatibility)
+                        feedback_dir.mkdir(parents=True, mode=0o777, exist_ok=True)
+                    except (PermissionError, OSError) as e:
+                        logger.warning(f"Could not create feedback directory at {feedback_dir}: {e}")
+                        # Fallback to relative path
+                        feedback_dir = Path("feedback")
+                        feedback_dir.mkdir(parents=True, mode=0o777, exist_ok=True)
+                    feedback_file = feedback_dir / f"feedback_{st.session_state.conversation_id}_{int(time.time())}.json"
+                    try:
+                        # Ensure parent directory exists before writing
+                        feedback_file.parent.mkdir(parents=True, mode=0o777, exist_ok=True)
+                        # Save to local file
+                        print(f"💾 FEEDBACK SAVE: Saving to local file: {feedback_file}")
+                        with open(feedback_file, 'w') as f:
+                            json.dump(feedback_data, f, indent=2, default=str)
+                        print(f"✅ FEEDBACK SAVE: Local file saved successfully")
+                        st.success("✅ Thank you for your feedback! It has been saved locally.")
+                        st.balloons()
+                        # Save to Snowflake if enabled and credentials available
+                        logger.info("🔄 FEEDBACK SAVE: Starting Snowflake save process...")
+                        logger.info(f"📊 FEEDBACK SAVE: feedback_obj={'exists' if feedback_obj else 'None'}")
+                        try:
+                            snowflake_enabled = os.getenv("SNOWFLAKE_ENABLED", "false").lower() == "true"
+                            logger.info(f"🔍 SNOWFLAKE CHECK: enabled={snowflake_enabled}")
+                            if snowflake_enabled:
+                                if feedback_obj:
+                                    try:
+                                        logger.info("📤 SNOWFLAKE UI: Attempting to save feedback to Snowflake...")
+                                        print("📤 SNOWFLAKE UI: Attempting to save feedback to Snowflake...")
+                                        if save_to_snowflake(feedback_obj):
+                                            logger.info("✅ SNOWFLAKE UI: Successfully saved to Snowflake")
+                                            print("✅ SNOWFLAKE UI: Successfully saved to Snowflake")
+                                            st.success("✅ Feedback also saved to Snowflake!")
+                                        else:
+                                            logger.warning("⚠️ SNOWFLAKE UI: Save failed")
+                                            print("⚠️ SNOWFLAKE UI: Save failed")
+                                            st.warning("⚠️ Snowflake save failed, but local save succeeded")
+                                    except Exception as e:
+                                        logger.error(f"❌ SNOWFLAKE UI ERROR: {e}")
+                                        print(f"❌ SNOWFLAKE UI ERROR: {e}")
+                                        traceback.print_exc()
+                                        st.warning(f"⚠️ Could not save to Snowflake: {e}")
+                                else:
+                                    logger.warning("⚠️ SNOWFLAKE UI: Skipping (feedback object not created)")
+                                    print("⚠️ SNOWFLAKE UI: Skipping (feedback object not created)")
+                                    st.warning("⚠️ Skipping Snowflake save (feedback object not created)")
+                            else:
+                                logger.info("💡 SNOWFLAKE UI: Integration disabled")
+                                print("💡 SNOWFLAKE UI: Integration disabled")
+                                st.info("💡 Snowflake integration disabled (set SNOWFLAKE_ENABLED=true to enable)")
+                        except NameError as e:
+                            traceback.print_exc()
+                            logger.error(f"❌ NameError in Snowflake save: {e}")
+                            print(f"❌ NameError in Snowflake save: {e}")
+                            st.warning(f"⚠️ Snowflake save error: {e}")
+                        except Exception as e:
+                            logger.error(f"❌ Exception in Snowflake save: {type(e).__name__}: {e}")
+                            print(f"❌ Exception in Snowflake save: {type(e).__name__}: {e}")
+                            st.warning(f"⚠️ Snowflake save error: {e}")
+                        # Mark feedback as submitted to prevent resubmission
+                        st.session_state.feedback_submitted = True
+                        print("=" * 80)
+                        print(f"✅ FEEDBACK SUBMISSION: Completed successfully")
+                        print("=" * 80)
+                        # Show the saved file's location in the UI
+                        st.info(f"📁 Feedback saved to: {feedback_file}")
+                    except Exception as e:
+                        print(f"❌ FEEDBACK SUBMISSION: Error saving feedback: {e}")
+                        print(f"❌ FEEDBACK SUBMISSION: Error type: {type(e).__name__}")
+                        traceback.print_exc()
+                        st.error(f"❌ Error saving feedback: {e}")
+                        st.write(f"Debug error: {str(e)}")
+        else:
+            # Feedback already submitted - show success message and reset option
+            st.success("✅ Feedback already submitted for this conversation!")
+            col1, col2 = st.columns([1, 1])
+            with col1:
+                if st.button("🔄 Submit New Feedback", key="new_feedback_button", use_container_width=True):
+                    try:
+                        st.session_state.feedback_submitted = False
+                        st.rerun()
+                    except Exception as e:
+                        # Handle any Streamlit API exceptions gracefully
+                        logger.error(f"Error resetting feedback state: {e}")
+                        st.error(f"Error resetting feedback. Please refresh the page.")
+            with col2:
+                if st.button("📋 View Conversation", key="view_conversation_button", use_container_width=True):
+                    # Intentional no-op: scrolling to the conversation is left to the auto-scroll script at the bottom of the page
+                    pass
     # Display retrieval history stats
     if st.session_state.rag_retrieval_history:
                 })
                 st.markdown("---")
+    # Example Questions Section
+    st.markdown("---")
+    st.markdown(
+        "<h3 class='example-questions-header'>💡 Example Questions</h3>",
+        unsafe_allow_html=True
+    )
+    st.markdown(
+        "<p class='example-questions-description'>Click on any question below to use it, or modify the editable examples:</p>",
+        unsafe_allow_html=True
+    )
+    # Initialize example question state
+    if 'custom_question_1' not in st.session_state:
+        st.session_state.custom_question_1 = "How were administrative costs managed in the PDM implementation, and what issues arose with budget execution regarding staff salaries?"
+    if 'custom_question_2' not in st.session_state:
+        st.session_state.custom_question_2 = "What did the National Coordinator say about the release of funds for PDM administrative costs in the letter dated 29th September 2022 and how did the funding received affect the activities of the PDCs and PDM SACCOs in the FY 2022/23?"
+    # Question 1: Filename insights (fixed, clickable)
+    st.markdown("#### 📄 Question 1: List insights from a specific file")
+    col1, col2 = st.columns([3, 1])
+    with col1:
+        example_q1 = "List couple of insights from the filename."
+        st.markdown(f"**Example:** `{example_q1}`")
+        st.info("💡 **Filter to apply:** Select a Filename from the sidebar panel before asking this question.")
+    with col2:
+        if st.button("📋 Use This Question", key="use_example_1", use_container_width=True):
+            st.session_state.pending_question = example_q1
+            st.session_state.input_counter = (st.session_state.get('input_counter', 0) + 1) % 1000
+            st.rerun()
+    st.markdown("---")
+    # Questions 2 & 3: Editable examples
+    st.markdown("#### ✏️ Customizable Questions (Edit and use)")
+    # Question 2
+    # st.markdown("**Question 2:**")
+    custom_q1 = st.text_area(
+        "Edit question 2:",
+        value=st.session_state.custom_question_1,
+        height=80,
+        key="edit_question_2",
+        help="Modify this question to fit your needs, then click 'Use This Question'"
+    )
+    col1, col2 = st.columns([1, 4])
+    with col1:
+        if st.button("📋 Use Question 2", key="use_custom_1", use_container_width=True):
+            if custom_q1.strip():
+                st.session_state.pending_question = custom_q1.strip()
+                st.session_state.custom_question_1 = custom_q1.strip()
+                st.session_state.input_counter = (st.session_state.get('input_counter', 0) + 1) % 1000
+                st.rerun()
+            else:
+                st.warning("Please enter a question first!")
+    with col2:
+        st.caption("💡 Tip: Add specific details like dates, names, or amounts to get more precise answers")
+    st.info("💡 **Filter to apply:** Select District(s) and Year(s) sidebar panel before asking this question.")
+    st.markdown("---")
+    # Question 3
+    # st.markdown("**Question 3:**")
+    custom_q2 = st.text_area(
+        "Edit question 3:",
+        value=st.session_state.custom_question_2,
+        height=80,
+        key="edit_question_3",
+        help="Modify this question to fit your needs, then click 'Use This Question'"
+    )
+    col1, col2 = st.columns([1, 4])
+    with col1:
+        if st.button("📋 Use Question 3", key="use_custom_2", use_container_width=True):
+            if custom_q2.strip():
+                st.session_state.pending_question = custom_q2.strip()
+                st.session_state.custom_question_2 = custom_q2.strip()
+                st.session_state.input_counter = (st.session_state.get('input_counter', 0) + 1) % 1000
+                st.rerun()
+            else:
+                st.warning("Please enter a question first!")
+    with col2:
+        st.caption("💡 Tip: Use specific terms from the documents (e.g., 'PDM', 'SACCOs', 'FY 2022/23')")
+    # Each "Use ..." button above stores the chosen text in st.session_state.pending_question,
+    # bumps input_counter and reruns; the input section rendered earlier is expected to pick it up on the next run
     # Auto-scroll to bottom
     st.markdown("""
     <script>

smart_chatbot.py CHANGED Viewed

@@ -26,6 +26,7 @@ from langchain_core.messages import HumanMessage, AIMessage, SystemMessage
 from src.pipeline import PipelineManager
 from src.config.loader import load_config
 @dataclass
@@ -161,7 +162,7 @@ class IntelligentRAGChatbot:
         # Try to load district whitelist from filter_options.json
         try:
-            fo = Path("filter_options.json")
             if fo.exists():
                 with open(fo) as f:
                     data = json.load(f)
@@ -174,7 +175,7 @@ class IntelligentRAGChatbot:
         except Exception:
             self.district_whitelist = self.available_metadata['districts']
-        # Enrich whitelist from add_district_metadata.py if available
         try:
             from add_district_metadata import DistrictMetadataProcessor
             proc = DistrictMetadataProcessor()
@@ -195,7 +196,7 @@ class IntelligentRAGChatbot:
         # Get dynamic year list from filter_options.json
         try:
-            fo = Path("filter_options.json")
             if fo.exists():
                 with open(fo) as f:
                     data = json.load(f)

 from src.pipeline import PipelineManager
 from src.config.loader import load_config
+from src.config.paths import PROJECT_DIR
 @dataclass
         # Try to load district whitelist from filter_options.json
         try:
+            fo = PROJECT_DIR / "src" / "config" / "filter_options.json"
             if fo.exists():
                 with open(fo) as f:
                     data = json.load(f)
         except Exception:
             self.district_whitelist = self.available_metadata['districts']
+        # Enrich whitelist from add_district_metadata.py if available (optional module)
         try:
             from add_district_metadata import DistrictMetadataProcessor
             proc = DistrictMetadataProcessor()
         # Get dynamic year list from filter_options.json
         try:
+            fo = PROJECT_DIR / "src" / "config" / "filter_options.json"
             if fo.exists():
                 with open(fo) as f:
                     data = json.load(f)