Spaces:

NavyDevilDoc
/

Semantic_Search

Sleeping

App Files Community

NavyDevilDoc committed on Dec 29, 2025

Commit

a14f7cc

verified ·

1 Parent(s): 7558bd2

Update app.py

Browse files

Files changed (1) hide show

app.py +32 -20

app.py CHANGED Viewed

@@ -88,9 +88,7 @@ with st.sidebar:
             # --- DUPLICATION CHECK ---
             if f.name in existing_files:
                 st.toast(f"♻️ Updating existing file: {f.name}")
-                # Remove the old version first (Cleans SQL and FAISS)
                 st.session_state.db.delete_document(f.name)
-            # -------------------------
             # A. Parse File
             text, filename, method = process_file(f)
@@ -102,14 +100,28 @@ with st.sidebar:
             # B. Chunk & ID
             chunks, doc_id = chunk_text(text, filename)
-            # C. Save to SQLite
-            st.session_state.db.add_document(doc_id, filename, text)
             # D. Add to Vector Index
             st.session_state.search_engine.add_features(chunks)
-            progress_bar.progress((i + 1) / len(uploaded_files))
         status.text("Syncing to Cloud...")
         SyncManager.push_data()
@@ -226,38 +238,38 @@ if query:
                     with st.expander("🔍 View Source Data used for this summary"):
                         st.text(full_doc_text[:2000] + "...")
-        # --- SEARCH RESULTS SECTION (Updated) ---
-        # We wrap the results in an expander to keep the UI clean
-        with st.expander("📚 Reference Documents (Click to view)", expanded=False):
             if not results:
                 st.info("No matching documents found.")
             for res in results:
                 score = res['score']
-                # Dynamic color coding based on relevance
                 color = "#09ab3b" if score > 2 else "#ffbd45" if score > 0 else "#ff4b4b"
-                # CSS FIX:
-                # 1. We kept 'background-color: #f0f2f6' (Light Gray)
-                # 2. We ADDED 'color: #1f1f1f' (Dark Gray) to force readability
-                #    regardless of whether the user is in Dark Mode or Light Mode.
                 st.markdown(f"""
                 <div style="
                     border-left: 5px solid {color};
                     padding: 15px;
                     background-color: #f0f2f6;
-                    margin-bottom: 10px;
                     border-radius: 5px;
                     color: #1f1f1f;
                 ">
-                    <div style="display: flex; justify-content: space-between; align-items: center;">
                         <h4 style="margin:0; color: #0e1117;">📄 {res['source']}</h4>
-                        <span style="font-size: 0.8em; color: #555; background: #ddd; padding: 2px 6px; border-radius: 4px;">Score: {score:.2f}</span>
                     </div>
-                    <p style="margin: 8px 0; font-style: italic; font-size: 0.95em; color: #333; line-height: 1.5;">
-                        "...{res['snippet']}..."
                     </p>
                 </div>
                 """, unsafe_allow_html=True)

             # --- DUPLICATION CHECK ---
             if f.name in existing_files:
                 st.toast(f"♻️ Updating existing file: {f.name}")
                 st.session_state.db.delete_document(f.name)
             # A. Parse File
             text, filename, method = process_file(f)
             # B. Chunk & ID
             chunks, doc_id = chunk_text(text, filename)
+            # --- NEW STEP: Generate Abstract ---
+            # We skip this for tiny files (500 characters or fewer) to save time
+            abstract = "No summary generated."
+            if len(text) > 500:
+                with st.spinner(f"Writing abstract for {filename}..."):
+                    # We utilize our flexible LLM client
+                    # Note: We send only the first 30k chars to keep it fast
+                    abstract = ask_llm(
+                        query="Generate Abstract",
+                        context=text[:30000],
+                        mode="Abstract Generator",
+                        model_provider="Gemini"
+                    )
+            # -----------------------------------
+            # C. Save to SQLite (Now includes Abstract)
+            st.session_state.db.add_document(doc_id, filename, text, abstract=abstract)
             # D. Add to Vector Index
             st.session_state.search_engine.add_features(chunks)
+            progress_bar.progress((i + 1) / len(uploaded_files))
         status.text("Syncing to Cloud...")
         SyncManager.push_data()
                     with st.expander("🔍 View Source Data used for this summary"):
                         st.text(full_doc_text[:2000] + "...")
+        # --- SEARCH RESULTS SECTION (Rich View) ---
+        with st.expander("📚 Reference Documents (Click to view)", expanded=True):
             if not results:
                 st.info("No matching documents found.")
             for res in results:
                 score = res['score']
                 color = "#09ab3b" if score > 2 else "#ffbd45" if score > 0 else "#ff4b4b"
+                # RETRIEVE THE ABSTRACT FROM DB
+                doc_abstract = st.session_state.db.get_doc_abstract(res['doc_id'])
                 st.markdown(f"""
                 <div style="
                     border-left: 5px solid {color};
                     padding: 15px;
                     background-color: #f0f2f6;
+                    margin-bottom: 15px;
                     border-radius: 5px;
                     color: #1f1f1f;
                 ">
+                    <div style="display: flex; justify-content: space-between; align-items: center; margin-bottom: 10px;">
                         <h4 style="margin:0; color: #0e1117;">📄 {res['source']}</h4>
+                        <span style="font-size: 0.8em; color: #555; background: #ddd; padding: 2px 8px; border-radius: 4px;">Relevance: {score:.2f}</span>
                     </div>
+                    <div style="background: #e3e6ea; padding: 10px; border-radius: 5px; margin-bottom: 10px;">
+                        <p style="margin: 0; font-size: 0.9em; color: #333;"><strong>🤖 Abstract:</strong> {doc_abstract}</p>
+                    </div>
+                    <p style="margin: 0; font-style: italic; font-size: 0.85em; color: #555;">
+                        "Matching Chunk: ...{res['snippet']}..."
                     </p>
                 </div>
                 """, unsafe_allow_html=True)