Spaces:

Ryanfafa
/

docmind-ai

Running

App Files Files Community

Ryanfafa commited on Feb 18

Commit

cd4a662

verified ·

1 Parent(s): 260a555

Update app.py

Browse files

Files changed (1) hide show

app.py +207 -95

app.py CHANGED Viewed

@@ -16,6 +16,8 @@ st.set_page_config(
 config.set_option("server.enableCORS", False)
 config.set_option("server.enableXsrfProtection", False)
 # ─── CSS ──────────────────────────────────────────────────────────────────────
 st.markdown("""
 <style>
@@ -63,6 +65,10 @@ html, body, [class*="css"] { font-family: 'DM Sans', sans-serif; }
 .ft-excel { background: #064e3b; color: #6ee7b7; }
 .ft-docx  { background: #1e3a5f; color: #7dd3fc; }
 .ft-text  { background: #1c1917; color: #d6d3d1; }
 [data-testid="stFileUploader"] { background: #1c1c26 !important; border: 2px dashed #2a2a3a !important; border-radius: 12px !important; }
 .stButton > button {
     background: linear-gradient(135deg, #7c3aed, #4f46e5) !important;
@@ -76,6 +82,7 @@ html, body, [class*="css"] { font-family: 'DM Sans', sans-serif; }
 }
 .badge-ready   { background:#14532d; color:#86efac; padding:3px 10px; border-radius:20px; font-size:0.75rem; }
 .badge-empty   { background:#1c1917; color:#a8a29e; padding:3px 10px; border-radius:20px; font-size:0.75rem; }
 hr { border-color: #2a2a3a !important; }
 ::-webkit-scrollbar { width: 6px; }
 ::-webkit-scrollbar-track { background: #0f0f13; }
@@ -91,17 +98,14 @@ def load_rag_engine():
 # ─── Session state ────────────────────────────────────────────────────────────
 defaults = {
-    "messages":       [],
-    "doc_loaded":     False,
-    "doc_name":       "",
-    "doc_type":       "",
-    "chunk_count":    0,
-    "processed_hash": "",
 }
 for k, v in defaults.items():
     if k not in st.session_state:
         st.session_state[k] = v
 def file_type_badge(suffix: str) -> str:
     m = {
         ".pdf":  ("pdf",   "PDF"),
@@ -119,42 +123,106 @@ def file_type_badge(suffix: str) -> str:
     cls, label = m.get(suffix, ("text", suffix.upper()))
     return f'<span class="filetype-badge ft-{cls}">{label}</span>'
 # ─── Sidebar ──────────────────────────────────────────────────────────────────
 with st.sidebar:
     st.markdown('<p style="font-family:Syne,sans-serif;font-size:1.3rem;font-weight:700;color:#a78bfa;">🧠 DocMind AI</p>', unsafe_allow_html=True)
-    st.markdown('<p style="color:#6b6b8a;font-size:0.8rem;">Multimodal RAG · Conversation Memory</p>', unsafe_allow_html=True)
     st.markdown("---")
-    # Doc status
-    if st.session_state.doc_loaded:
-        rag = load_rag_engine()
         mem_count = rag.get_memory_count()
-        st.markdown(f'<span class="badge-ready">✓ Ready</span>', unsafe_allow_html=True)
-        suffix = Path(st.session_state.doc_name).suffix.lower()
         st.markdown(
-            f'<p style="color:#e8e8f0;font-size:0.85rem;margin-top:0.5rem;">'
-            f'{file_type_badge(suffix)} <b>{st.session_state.doc_name}</b></p>',
-            unsafe_allow_html=True
         )
-        st.markdown(f'<p style="color:#6b6b8a;font-size:0.78rem;">{st.session_state.chunk_count} chunks · {mem_count} exchanges in memory</p>', unsafe_allow_html=True)
     else:
-        st.markdown('<span class="badge-empty">○ No document loaded</span>', unsafe_allow_html=True)
     st.markdown("---")
-    st.markdown('<p style="color:#6b6b8a;font-size:0.78rem;font-weight:600;text-transform:uppercase;letter-spacing:0.08em;">Upload Document</p>', unsafe_allow_html=True)
-    st.markdown('<p style="color:#6b6b8a;font-size:0.72rem;">PDF · TXT · DOCX · CSV · XLSX · JPG · PNG</p>', unsafe_allow_html=True)
-    uploaded_file = st.file_uploader(
-        "Upload",
-        type=["pdf", "txt", "docx", "doc", "csv", "xlsx", "xls", "jpg", "jpeg", "png", "webp"],
-        label_visibility="collapsed"
     )
     if uploaded_file:
         file_hash = hashlib.md5(uploaded_file.read()).hexdigest()
         uploaded_file.seek(0)
-        if file_hash != st.session_state.processed_hash:
             suffix = Path(uploaded_file.name).suffix.lower()
             type_msg = {
                 ".pdf":  "Reading PDF...",
@@ -163,59 +231,60 @@ with st.sidebar:
                 ".csv":  "Parsing CSV...",
                 ".xlsx": "Parsing Excel...",
                 ".xls":  "Parsing Excel...",
-                ".jpg":  "🖼️ Captioning image with AI...",
-                ".jpeg": "🖼️ Captioning image with AI...",
-                ".png":  "🖼️ Captioning image with AI...",
-                ".webp": "🖼️ Captioning image with AI...",
             }.get(suffix, "Processing...")
             with st.spinner(type_msg):
-                rag    = load_rag_engine()
-                chunks = rag.ingest_file(uploaded_file)
-                st.session_state.doc_loaded     = True
-                st.session_state.doc_name       = uploaded_file.name
-                st.session_state.doc_type       = suffix
-                st.session_state.chunk_count    = chunks
-                st.session_state.processed_hash = file_hash
-                st.session_state.messages       = []
-            st.success(f"✓ Indexed {chunks} chunks!")
-            st.rerun()
     st.markdown("---")
-    # Sample doc
-    st.markdown('<p style="color:#6b6b8a;font-size:0.78rem;font-weight:600;text-transform:uppercase;letter-spacing:0.08em;">Or try a sample</p>', unsafe_allow_html=True)
     if st.button("📥 Load Sample: AI Report", use_container_width=True):
-        with st.spinner("Downloading sample..."):
-            from data_downloader import download_sample_doc
-            path, name = download_sample_doc()
-            rag    = load_rag_engine()
-            chunks = rag.ingest_path(path, name)
-            st.session_state.doc_loaded     = True
-            st.session_state.doc_name       = name
-            st.session_state.doc_type       = Path(name).suffix.lower()
-            st.session_state.chunk_count    = chunks
-            st.session_state.processed_hash = "sample"
-            st.session_state.messages       = []
-        st.success(f"✓ {chunks} chunks loaded!")
-        st.rerun()
     st.markdown("---")
     col_a, col_b = st.columns(2)
     with col_a:
         if st.button("🗑️ Clear Chat", use_container_width=True):
             st.session_state.messages = []
-            load_rag_engine().clear_memory()
             st.rerun()
     with col_b:
-        if st.button("🔄 New Doc", use_container_width=True):
-            st.session_state.update(defaults)
             st.session_state.messages = []
-            global_rag = load_rag_engine()
-            global_rag.clear_memory()
-            global_rag._vectorstore = None
-            global_rag._doc_name = ""
             st.rerun()
     st.markdown("---")
@@ -225,51 +294,85 @@ with st.sidebar:
     🔗 LangChain · ChromaDB<br>
     🤗 MiniLM Embeddings<br>
     🦙 Llama-3 / Mistral-7B<br>
-    🖼️ BLIP Image Captioning<br>
     💬 Conversation Memory<br>
     🌊 Streamlit + FastAPI
     </p>
     """, unsafe_allow_html=True)
-# ─── Main ─────────────────────────────────────────────────────────────────────
 st.markdown('<h1 class="hero-title">DocMind AI</h1>', unsafe_allow_html=True)
-st.markdown('<p class="hero-sub">PDF · Word · CSV · Excel · Images — Ask anything. Remembers your conversation.</p>', unsafe_allow_html=True)
-# Stats
-rag = load_rag_engine()
 c1, c2, c3, c4 = st.columns(4)
 with c1:
-    st.markdown(f'<div class="stat-card"><div class="stat-number">{st.session_state.chunk_count or "—"}</div><div class="stat-label">Chunks Indexed</div></div>', unsafe_allow_html=True)
 with c2:
-    st.markdown(f'<div class="stat-card"><div class="stat-number">{len(st.session_state.messages)//2}</div><div class="stat-label">Questions Asked</div></div>', unsafe_allow_html=True)
 with c3:
-    st.markdown(f'<div class="stat-card"><div class="stat-number">{rag.get_memory_count()}</div><div class="stat-label">Memory Window</div></div>', unsafe_allow_html=True)
 with c4:
-    supported_count = "7"
-    st.markdown(f'<div class="stat-card"><div class="stat-number">{supported_count}</div><div class="stat-label">File Types</div></div>', unsafe_allow_html=True)
 st.markdown("<br>", unsafe_allow_html=True)
 # ─── Chat history ─────────────────────────────────────────────────────────────
 if not st.session_state.messages:
-    if st.session_state.doc_loaded:
-        suffix = st.session_state.doc_type
-        type_emoji = {"pdf": "📄", "image": "🖼️", "csv": "📊", "excel": "📊", "docx": "📝", "text": "📄"}.get(suffix.strip("."), "📄")
         st.markdown(f"""
         <div style="text-align:center;padding:3rem;color:#6b6b8a;">
-            <div style="font-size:2.5rem;margin-bottom:1rem;">{type_emoji}</div>
-            <p style="font-size:1rem;color:#a78bfa;">Document ready!</p>
-            <p style="font-size:0.85rem;">Ask anything about <b style="color:#e8e8f0;">{st.session_state.doc_name}</b></p>
-            <p style="font-size:0.78rem;margin-top:0.5rem;">I'll remember your conversation — ask follow-up questions naturally.</p>
         </div>""", unsafe_allow_html=True)
     else:
         st.markdown("""
         <div style="text-align:center;padding:4rem 2rem;color:#6b6b8a;">
             <div style="font-size:3rem;margin-bottom:1rem;">🧠</div>
-            <p style="font-size:1.1rem;color:#a78bfa;font-family:'Syne',sans-serif;font-weight:600;">Multimodal RAG — Upload anything</p>
             <p style="font-size:0.85rem;margin-top:0.5rem;">
                 📄 PDF &nbsp;·&nbsp; 📝 Word &nbsp;·&nbsp; 📊 CSV/Excel &nbsp;·&nbsp; 🖼️ Images<br><br>
-                Upload in the sidebar or load the sample AI report to get started.
             </p>
         </div>""", unsafe_allow_html=True)
 else:
@@ -294,29 +397,38 @@ else:
                 {sources_html}
             </div>""", unsafe_allow_html=True)
-# ─── Input ────────────────────────────────────────────────────────────────────
 st.markdown("<br>", unsafe_allow_html=True)
-if not st.session_state.doc_loaded:
     st.chat_input("Upload a document first...", disabled=True)
 else:
-    placeholder = {
-        ".pdf":  "Ask anything about this PDF...",
-        ".txt":  "Ask anything about this text...",
-        ".docx": "Ask anything about this document...",
-        ".csv":  "Ask about the data, columns, or statistics...",
-        ".xlsx": "Ask about the spreadsheet data...",
-        ".xls":  "Ask about the spreadsheet data...",
-        ".jpg":  "Ask me what I see in this image...",
-        ".jpeg": "Ask me what I see in this image...",
-        ".png":  "Ask me what I see in this image...",
-        ".webp": "Ask me what I see in this image...",
-    }.get(st.session_state.doc_type, "Ask anything about your document...")
     if prompt := st.chat_input(placeholder):
         st.session_state.messages.append({"role": "user", "content": prompt})
         with st.spinner("🔍 Retrieving & generating..."):
-            rag            = load_rag_engine()
             answer, sources = rag.query(prompt)
             mem_count       = rag.get_memory_count()
         st.session_state.messages.append({
@@ -325,4 +437,4 @@ else:
             "sources":      sources,
             "memory_count": mem_count,
         })
-        st.rerun()

 config.set_option("server.enableCORS", False)
 config.set_option("server.enableXsrfProtection", False)
+MAX_FILES = 5
 # ─── CSS ──────────────────────────────────────────────────────────────────────
 st.markdown("""
 <style>
 .ft-excel { background: #064e3b; color: #6ee7b7; }
 .ft-docx  { background: #1e3a5f; color: #7dd3fc; }
 .ft-text  { background: #1c1917; color: #d6d3d1; }
+.doc-item {
+    background: #1c1c26; border: 1px solid #2a2a3a; border-radius: 10px;
+    padding: 0.6rem 0.8rem; margin-bottom: 0.4rem;
+}
 [data-testid="stFileUploader"] { background: #1c1c26 !important; border: 2px dashed #2a2a3a !important; border-radius: 12px !important; }
 .stButton > button {
     background: linear-gradient(135deg, #7c3aed, #4f46e5) !important;
 }
 .badge-ready   { background:#14532d; color:#86efac; padding:3px 10px; border-radius:20px; font-size:0.75rem; }
 .badge-empty   { background:#1c1917; color:#a8a29e; padding:3px 10px; border-radius:20px; font-size:0.75rem; }
+.badge-count   { background:#312e81; color:#a5b4fc; padding:3px 10px; border-radius:20px; font-size:0.75rem; }
 hr { border-color: #2a2a3a !important; }
 ::-webkit-scrollbar { width: 6px; }
 ::-webkit-scrollbar-track { background: #0f0f13; }
 # ─── Session state ────────────────────────────────────────────────────────────
 defaults = {
+    "messages":        [],
+    "processed_files": {},   # {filename: md5_hash}
 }
 for k, v in defaults.items():
     if k not in st.session_state:
         st.session_state[k] = v
 def file_type_badge(suffix: str) -> str:
     m = {
         ".pdf":  ("pdf",   "PDF"),
     cls, label = m.get(suffix, ("text", suffix.upper()))
     return f'<span class="filetype-badge ft-{cls}">{label}</span>'
+def type_emoji(suffix: str) -> str:
+    m = {
+        ".pdf": "📄", ".txt": "📄",
+        ".docx": "📝", ".doc": "📝",
+        ".csv": "📊", ".xlsx": "📊", ".xls": "📊",
+        ".jpg": "🖼️", ".jpeg": "🖼️", ".png": "🖼️", ".webp": "🖼️",
+    }
+    return m.get(suffix, "📄")
+# ─── Load RAG engine & get document state ─────────────────────────────────────
+rag        = load_rag_engine()
+documents  = rag.get_documents()     # [{name, type, chunk_count}]
+doc_loaded = len(documents) > 0
+total_chunks = rag.get_total_chunks()
+file_count   = rag.get_file_count()
 # ─── Sidebar ──────────────────────────────────────────────────────────────────
 with st.sidebar:
     st.markdown('<p style="font-family:Syne,sans-serif;font-size:1.3rem;font-weight:700;color:#a78bfa;">🧠 DocMind AI</p>', unsafe_allow_html=True)
+    st.markdown('<p style="color:#6b6b8a;font-size:0.8rem;">Multimodal RAG · Multi-File · Memory</p>', unsafe_allow_html=True)
     st.markdown("---")
+    # ── Document List ─────────────────────────────────────────────────────────
+    if documents:
         mem_count = rag.get_memory_count()
         st.markdown(
+            f'<span class="badge-ready">✓ Ready</span> '
+            f'<span class="badge-count">{file_count}/{MAX_FILES} files</span>',
+            unsafe_allow_html=True,
+        )
+        st.markdown(
+            f'<p style="color:#6b6b8a;font-size:0.78rem;margin-top:0.3rem;">'
+            f'{total_chunks} total chunks · {mem_count} exchanges in memory</p>',
+            unsafe_allow_html=True,
         )
+        st.markdown("")
+        # Show each document with a remove button
+        for doc in documents:
+            col_doc, col_rm = st.columns([5, 1])
+            with col_doc:
+                badge = file_type_badge(doc["type"])
+                emoji = type_emoji(doc["type"])
+                st.markdown(
+                    f'<div class="doc-item">'
+                    f'{badge} <b style="color:#e8e8f0;font-size:0.82rem;">{doc["name"]}</b>'
+                    f'<br><span style="color:#6b6b8a;font-size:0.72rem;">'
+                    f'{emoji} {doc["chunk_count"]} chunks</span>'
+                    f'</div>',
+                    unsafe_allow_html=True,
+                )
+            with col_rm:
+                st.markdown('<div style="padding-top:0.6rem;"></div>', unsafe_allow_html=True)
+                if st.button("❌", key=f"rm_{doc['name']}", help=f"Remove {doc['name']}"):
+                    rag.remove_file(doc["name"])
+                    # Remove from processed_files tracking
+                    st.session_state.processed_files = {
+                        k: v for k, v in st.session_state.processed_files.items()
+                        if k != doc["name"]
+                    }
+                    st.rerun()
     else:
+        st.markdown('<span class="badge-empty">○ No documents loaded</span>', unsafe_allow_html=True)
     st.markdown("---")
+    # ── Upload Area ───────────────────────────────────────────────────────────
+    st.markdown(
+        '<p style="color:#6b6b8a;font-size:0.78rem;font-weight:600;text-transform:uppercase;letter-spacing:0.08em;">'
+        'Upload Document</p>',
+        unsafe_allow_html=True,
     )
+    st.markdown(
+        '<p style="color:#6b6b8a;font-size:0.72rem;">'
+        'PDF · TXT · DOCX · CSV · XLSX · JPG · PNG</p>',
+        unsafe_allow_html=True,
+    )
+    if file_count >= MAX_FILES:
+        st.warning(f"Maximum {MAX_FILES} files reached. Remove a file to upload more.")
+        uploaded_file = None
+    else:
+        uploaded_file = st.file_uploader(
+            "Upload",
+            type=["pdf", "txt", "docx", "doc", "csv", "xlsx", "xls",
+                  "jpg", "jpeg", "png", "webp"],
+            label_visibility="collapsed",
+        )
     if uploaded_file:
         file_hash = hashlib.md5(uploaded_file.read()).hexdigest()
         uploaded_file.seek(0)
+        # Check if this exact file (by hash) was already processed
+        already_processed = file_hash in st.session_state.processed_files.values()
+        if not already_processed:
             suffix = Path(uploaded_file.name).suffix.lower()
             type_msg = {
                 ".pdf":  "Reading PDF...",
                 ".csv":  "Parsing CSV...",
                 ".xlsx": "Parsing Excel...",
                 ".xls":  "Parsing Excel...",
+                ".jpg":  "🖼️ Processing image (OCR + captioning)...",
+                ".jpeg": "🖼️ Processing image (OCR + captioning)...",
+                ".png":  "🖼️ Processing image (OCR + captioning)...",
+                ".webp": "🖼️ Processing image (OCR + captioning)...",
             }.get(suffix, "Processing...")
             with st.spinner(type_msg):
+                try:
+                    chunks = rag.ingest_file(uploaded_file)
+                    st.session_state.processed_files[uploaded_file.name] = file_hash
+                    st.success(f"✓ Indexed {chunks} chunks from {uploaded_file.name}!")
+                    st.rerun()
+                except ValueError as e:
+                    st.error(str(e))
+                except Exception as e:
+                    st.error(f"Failed to process file: {e}")
     st.markdown("---")
+    # ── Sample doc ────────────────────────────────────────────────────────────
+    st.markdown(
+        '<p style="color:#6b6b8a;font-size:0.78rem;font-weight:600;text-transform:uppercase;letter-spacing:0.08em;">'
+        'Or try a sample</p>',
+        unsafe_allow_html=True,
+    )
     if st.button("📥 Load Sample: AI Report", use_container_width=True):
+        if file_count >= MAX_FILES:
+            st.error(f"Maximum {MAX_FILES} files reached. Remove a file first.")
+        else:
+            with st.spinner("Downloading sample..."):
+                from data_downloader import download_sample_doc
+                path, name = download_sample_doc()
+                try:
+                    chunks = rag.ingest_path(path, name)
+                    st.session_state.processed_files[name] = "sample"
+                    st.success(f"✓ {chunks} chunks loaded!")
+                    st.rerun()
+                except ValueError as e:
+                    st.error(str(e))
     st.markdown("---")
+    # ── Action buttons ────────────────────────────────────────────────────────
     col_a, col_b = st.columns(2)
     with col_a:
         if st.button("🗑️ Clear Chat", use_container_width=True):
             st.session_state.messages = []
+            rag.clear_memory()
             st.rerun()
     with col_b:
+        if st.button("🔄 Reset All", use_container_width=True):
+            rag.reset()
             st.session_state.messages = []
+            st.session_state.processed_files = {}
             st.rerun()
     st.markdown("---")
     🔗 LangChain · ChromaDB<br>
     🤗 MiniLM Embeddings<br>
     🦙 Llama-3 / Mistral-7B<br>
+    🖼️ BLIP + VLM Captioning<br>
     💬 Conversation Memory<br>
+    📁 Up to 5 files simultaneously<br>
     🌊 Streamlit + FastAPI
     </p>
     """, unsafe_allow_html=True)
+# ─── Main Area ────────────────────────────────────────────────────────────────
 st.markdown('<h1 class="hero-title">DocMind AI</h1>', unsafe_allow_html=True)
+st.markdown(
+    '<p class="hero-sub">'
+    'PDF · Word · CSV · Excel · Images — Upload up to 5 files. Ask anything. Remembers your conversation.'
+    '</p>',
+    unsafe_allow_html=True,
+)
+# ── Stats ─────────────────────────────────────────────────────────────────────
 c1, c2, c3, c4 = st.columns(4)
 with c1:
+    st.markdown(
+        f'<div class="stat-card">'
+        f'<div class="stat-number">{total_chunks or "—"}</div>'
+        f'<div class="stat-label">Chunks Indexed</div></div>',
+        unsafe_allow_html=True,
+    )
 with c2:
+    st.markdown(
+        f'<div class="stat-card">'
+        f'<div class="stat-number">{file_count}/{MAX_FILES}</div>'
+        f'<div class="stat-label">Files Loaded</div></div>',
+        unsafe_allow_html=True,
+    )
 with c3:
+    st.markdown(
+        f'<div class="stat-card">'
+        f'<div class="stat-number">{len(st.session_state.messages) // 2}</div>'
+        f'<div class="stat-label">Questions Asked</div></div>',
+        unsafe_allow_html=True,
+    )
 with c4:
+    st.markdown(
+        f'<div class="stat-card">'
+        f'<div class="stat-number">{rag.get_memory_count()}</div>'
+        f'<div class="stat-label">Memory Window</div></div>',
+        unsafe_allow_html=True,
+    )
 st.markdown("<br>", unsafe_allow_html=True)
 # ─── Chat history ─────────────────────────────────────────────────────────────
 if not st.session_state.messages:
+    if doc_loaded:
+        # Show loaded files summary
+        file_names = ", ".join(f"<b style='color:#e8e8f0;'>{d['name']}</b>" for d in documents)
+        emojis = " ".join(set(type_emoji(d["type"]) for d in documents))
         st.markdown(f"""
         <div style="text-align:center;padding:3rem;color:#6b6b8a;">
+            <div style="font-size:2.5rem;margin-bottom:1rem;">{emojis}</div>
+            <p style="font-size:1rem;color:#a78bfa;">
+                {file_count} document{'s' if file_count > 1 else ''} ready!
+            </p>
+            <p style="font-size:0.85rem;">Ask anything about {file_names}</p>
+            <p style="font-size:0.78rem;margin-top:0.5rem;">
+                I'll remember your conversation — ask follow-up questions naturally.
+                {'You can also upload more files (up to 5).' if file_count < MAX_FILES else ''}
+            </p>
         </div>""", unsafe_allow_html=True)
     else:
         st.markdown("""
         <div style="text-align:center;padding:4rem 2rem;color:#6b6b8a;">
             <div style="font-size:3rem;margin-bottom:1rem;">🧠</div>
+            <p style="font-size:1.1rem;color:#a78bfa;font-family:'Syne',sans-serif;font-weight:600;">
+                Multimodal RAG — Upload up to 5 files
+            </p>
             <p style="font-size:0.85rem;margin-top:0.5rem;">
                 📄 PDF &nbsp;·&nbsp; 📝 Word &nbsp;·&nbsp; 📊 CSV/Excel &nbsp;·&nbsp; 🖼️ Images<br><br>
+                Upload in the sidebar or load the sample AI report to get started.<br>
+                You can upload multiple files and ask questions across all of them.
             </p>
         </div>""", unsafe_allow_html=True)
 else:
                 {sources_html}
             </div>""", unsafe_allow_html=True)
+# ─── Chat Input ───────────────────────────────────────────────────────────────
 st.markdown("<br>", unsafe_allow_html=True)
+if not doc_loaded:
     st.chat_input("Upload a document first...", disabled=True)
 else:
+    # Build a placeholder based on loaded file types
+    loaded_types = set(d["type"] for d in documents)
+    image_exts  = {".jpg", ".jpeg", ".png", ".webp"}
+    table_exts  = {".csv", ".xlsx", ".xls"}
+    if file_count == 1:
+        doc_type = documents[0]["type"]
+        placeholder = {
+            ".pdf":  "Ask anything about this PDF...",
+            ".txt":  "Ask anything about this text...",
+            ".docx": "Ask anything about this document...",
+            ".doc":  "Ask anything about this document...",
+            ".csv":  "Ask about the data, columns, or statistics...",
+            ".xlsx": "Ask about the spreadsheet data...",
+            ".xls":  "Ask about the spreadsheet data...",
+            ".jpg":  "Ask me what I see in this image...",
+            ".jpeg": "Ask me what I see in this image...",
+            ".png":  "Ask me what I see in this image...",
+            ".webp": "Ask me what I see in this image...",
+        }.get(doc_type, "Ask anything about your document...")
+    else:
+        placeholder = f"Ask anything about your {file_count} documents..."
     if prompt := st.chat_input(placeholder):
         st.session_state.messages.append({"role": "user", "content": prompt})
         with st.spinner("🔍 Retrieving & generating..."):
             answer, sources = rag.query(prompt)
             mem_count       = rag.get_memory_count()
         st.session_state.messages.append({
             "sources":      sources,
             "memory_count": mem_count,
         })
+        st.rerun()