Spaces:

Ronochieng
/

DocMindAI

Build error

App Files Community

Ronochieng committed on Apr 26, 2025

Commit

f0d60d1

verified ·

1 Parent(s): 9e3c676

Update app.py

Browse files

Files changed (1) hide show

app.py +23 -24

app.py CHANGED Viewed

@@ -15,7 +15,7 @@ from langchain.prompts.prompt import PromptTemplate
 from langchain.chains import ConversationalRetrievalChain
 from langchain.chains import LLMChain
 from langchain.memory import ConversationBufferMemory
-from langchain.vectorstores import Chroma
 from pydantic import BaseModel, Field
 from Ingestion.ingest import process_document, get_processor_for_file
@@ -166,40 +166,39 @@ def clean_llm_response(response):
     return content
-# Initialize LLM and Model Cache
-@st.cache_resource(experimental_allow_widgets=True)
 def load_model():
-    with st.spinner("Loading model..."):
-        try:
-            llm = Llama.from_pretrained(
-                repo_id="stduhpf/google-gemma-3-1b-it-qat-q4_0-gguf-small",
-                filename="gemma-3-1b-it-q4_0_s.gguf",
-            )
-            return llm
-        except Exception as e:
-            st.error(f"Error loading model: {str(e)}")
-            return None
-# Initialize embeddings - but only when needed to avoid torch inspection issues
-@st.cache_resource(experimental_allow_widgets=True)
 def load_embeddings():
     from langchain_community.embeddings import HuggingFaceEmbeddings
-    with st.spinner("Loading embeddings..."):
-        embeddings = HuggingFaceEmbeddings(
-            model_name="sentence-transformers/all-MiniLM-L6-v2",
-            model_kwargs={'device': 'cpu'}
-        )
-        return embeddings
 # Sidebar Configuration with improved styling
 st.sidebar.markdown("<div style='text-align: center;'><h1>🧠 DocMind AI</h1></div>", unsafe_allow_html=True)
 st.sidebar.markdown("<div style='text-align: center;'>AI-Powered Document Analysis</div>", unsafe_allow_html=True)
 st.sidebar.markdown("---")
-# Load LLM
 with st.sidebar:
-    llm = load_model()
     if llm is not None:
         st.markdown("<div class='status-success'>✅ Model loaded successfully!</div>", unsafe_allow_html=True)
     else:
@@ -539,7 +538,7 @@ def run_analysis():
             # Only create embeddings if we have chunks
             if all_chunks and len(all_chunks) > 0:
-                # Load embeddings
                 embeddings = load_embeddings()
                 # Using 'None' as namespace to avoid unique ID issues with Chroma

 from langchain.chains import ConversationalRetrievalChain
 from langchain.chains import LLMChain
 from langchain.memory import ConversationBufferMemory
+from langchain_community.vectorstores import Chroma  # Fixed import
 from pydantic import BaseModel, Field
 from Ingestion.ingest import process_document, get_processor_for_file
     return content
+# Initialize LLM without widgets in the cached function
+@st.cache_resource
 def load_model():
+    try:
+        llm = Llama.from_pretrained(
+            repo_id="stduhpf/google-gemma-3-1b-it-qat-q4_0-gguf-small",
+            filename="gemma-3-1b-it-q4_0_s.gguf",
+        )
+        return llm
+    except Exception as e:
+        return None
+# Initialize embeddings without widgets in the cached function
+@st.cache_resource
 def load_embeddings():
     from langchain_community.embeddings import HuggingFaceEmbeddings
+    embeddings = HuggingFaceEmbeddings(
+        model_name="sentence-transformers/all-MiniLM-L6-v2",
+        model_kwargs={'device': 'cpu'}
+    )
+    return embeddings
 # Sidebar Configuration with improved styling
 st.sidebar.markdown("<div style='text-align: center;'><h1>🧠 DocMind AI</h1></div>", unsafe_allow_html=True)
 st.sidebar.markdown("<div style='text-align: center;'>AI-Powered Document Analysis</div>", unsafe_allow_html=True)
 st.sidebar.markdown("---")
+# Load LLM - Move spinner outside the cached function
 with st.sidebar:
+    with st.spinner("Loading model..."):
+        llm = load_model()
     if llm is not None:
         st.markdown("<div class='status-success'>✅ Model loaded successfully!</div>", unsafe_allow_html=True)
     else:
             # Only create embeddings if we have chunks
             if all_chunks and len(all_chunks) > 0:
+                # Load embeddings - moving spinner outside
                 embeddings = load_embeddings()
                 # Using 'None' as namespace to avoid unique ID issues with Chroma