Spaces:

jonghhhh
/

press_ethics

Runtime error

jonghhhh committed on Jan 19

Commit

4e6f326

1 Parent(s): cf8d80a

Fix: Update Dockerfile, requirements.txt, and pre-download models to resolve timeout issue

Files changed (3) hide show

Dockerfile CHANGED Viewed

@@ -1,20 +1,35 @@
-FROM python:3.13.5-slim
 WORKDIR /app
 RUN apt-get update && apt-get install -y \
     build-essential \
     curl \
     git \
     && rm -rf /var/lib/apt/lists/*
-COPY requirements.txt ./
-COPY src/ ./src/
-RUN pip3 install -r requirements.txt
-EXPOSE 8501
-HEALTHCHECK CMD curl --fail http://localhost:8501/_stcore/health
-ENTRYPOINT ["streamlit", "run", "src/streamlit_app.py", "--server.port=8501", "--server.address=0.0.0.0"]

+FROM python:3.11-slim
+# Set environment variables
+ENV PYTHONUNBUFFERED=1 \
+    PYTHONDONTWRITEBYTECODE=1 \
+    STREAMLIT_SERVER_PORT=7860 \
+    STREAMLIT_SERVER_ADDRESS=0.0.0.0
 WORKDIR /app
+# Install system dependencies
 RUN apt-get update && apt-get install -y \
     build-essential \
     curl \
     git \
     && rm -rf /var/lib/apt/lists/*
+# Copy requirements first for better caching
+COPY requirements.txt .
+RUN pip3 install --no-cache-dir -r requirements.txt
+# Copy the rest of the application
+COPY . .
+# Pre-download models to speed up startup and avoid runtime download issues
+RUN python3 download_models.py
+# Hugging Face Spaces use port 7860 by default
+EXPOSE 7860
+# Health check to ensure the container is running correctly
+HEALTHCHECK CMD curl --fail http://localhost:7860/_stcore/health
+# Run the application
+ENTRYPOINT ["streamlit", "run", "multimodal_rag_langgraph_gemini_st.py"]

download_models.py CHANGED Viewed

@@ -3,7 +3,13 @@
 """
 from sentence_transformers import SentenceTransformer
 import os
 print("Downloading embedding model...")
 model = SentenceTransformer("intfloat/multilingual-e5-large-instruct", device="cpu")
-print("✅ Model downloaded successfully!")

 """
 from sentence_transformers import SentenceTransformer
 import os
+import nltk
 print("Downloading embedding model...")
 model = SentenceTransformer("intfloat/multilingual-e5-large-instruct", device="cpu")
+print("✅ Embedding model downloaded successfully!")
+print("Downloading nltk punkt...")
+nltk.download('punkt')
+nltk.download('punkt_tab')
+print("✅ NLTK data downloaded successfully!")

requirements.txt CHANGED Viewed

@@ -22,6 +22,10 @@ Pillow>=11.0.0
 requests==2.32.5
 beautifulsoup4==4.14.2
 lxml==6.0.2
 # Data Processing
 pandas>=2.0.0

 requests==2.32.5
 beautifulsoup4==4.14.2
 lxml==6.0.2
+trafilatura==1.12.2
+newspaper3k==0.2.8
+fake-useragent==2.0.3
+extruct==0.17.0
 # Data Processing
 pandas>=2.0.0