Sai809701 committed on
Commit
ee1d54c
·
2 Parent(s): 7b3d05b d9d9f74

Merge branch 'main' of https://huggingface.co/spaces/Sp2503/Muril-Model

Browse files
Files changed (2) hide show
  1. Dockerfile +28 -26
  2. requirements.txt +5 -1
Dockerfile CHANGED
@@ -1,36 +1,38 @@
1
- # Use official Python image
2
  FROM python:3.10-slim
3
 
 
 
 
 
 
4
  # Set working directory
5
  WORKDIR /app
6
 
7
- # Copy requirements and install dependencies
8
  COPY requirements.txt .
9
 
10
- # Upgrade pip and install pinned dependencies
11
- RUN pip install --no-cache-dir --upgrade pip \
12
- && pip install --no-cache-dir -r requirements.txt
 
13
 
14
- # Copy all code and model files
15
  COPY . .
16
 
17
- # Set Transformers cache to a writable folder
18
- ENV TRANSFORMERS_CACHE=/tmp/hf_cache
19
-
20
- # Expose FastAPI port
21
- EXPOSE 7860
22
-
23
- # Precompute embeddings at build time (optional: adjust if dataset is large)
24
- RUN python -c "\
25
- import os, torch, pandas as pd;\
26
- from sentence_transformers import SentenceTransformer;\
27
- model = SentenceTransformer('./muril_combined_multilingual_model');\
28
- df = pd.read_csv('./muril_multilingual_dataset.csv').dropna(subset=['question','answer']);\
29
- answers = df['answer'].tolist();\
30
- embeddings = model.encode(answers, convert_to_tensor=True);\
31
- torch.save(embeddings, './answer_embeddings.pt');\
32
- print('✅ Precomputed embeddings saved');\
33
- "
34
-
35
- # Run FastAPI with uvicorn
36
- CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "7860"]
 
1
# syntax=docker/dockerfile:1

# Use a lightweight Python base image
FROM python:3.10-slim

# CPU-only deployment: disable CUDA and point every Hugging Face cache
# (transformers + hub) at a single writable directory inside /app.
# TRANSFORMERS_CACHE is kept alongside HF_HOME for the pinned
# transformers==4.33.2, which still reads it.
ENV TORCH_DISABLE_CUDA=1 \
    TRANSFORMERS_CACHE=/app/hf_cache \
    HF_HOME=/app/hf_cache

# Set working directory (created automatically if missing)
WORKDIR /app

# Copy the dependency list first so the install layer below stays cached
# until requirements.txt itself changes
COPY requirements.txt .

# Install OS + Python dependencies in one layer; git is kept in case pip
# must resolve any VCS-pinned requirement. --no-install-recommends keeps
# the image lean, and the apt lists are removed in the SAME layer so they
# never persist in the image.
RUN apt-get update && \
    apt-get install -y --no-install-recommends git && \
    pip install --no-cache-dir -r requirements.txt && \
    rm -rf /var/lib/apt/lists/*

# Copy application code and model files
COPY . .

# Run as an unprivileged user. Instead of a world-writable chmod 777,
# create the cache dir and hand /app to that user — least privilege,
# same runtime writability for the HF cache.
RUN useradd --system --create-home --uid 10001 appuser && \
    mkdir -p /app/hf_cache && \
    chown -R appuser:appuser /app
USER appuser

# Documentation of the service port (EXPOSE does not publish by itself);
# 8080 > 1024, so binding works for the non-root user.
EXPOSE 8080

# Embedding precomputation was intentionally dropped from build time to
# speed up Cloud Build — main.py computes/loads embeddings at runtime.
# Previous build-time step, kept for reference:
# RUN python -c "import torch, pandas as pd; from sentence_transformers import SentenceTransformer; \
#   model = SentenceTransformer('./muril_combined_multilingual_model'); \
#   df = pd.read_csv('./muril_multilingual_dataset.csv').dropna(subset=['question','answer']); \
#   embeddings = model.encode(df['answer'].tolist(), convert_to_tensor=True); \
#   torch.save(embeddings, './answer_embeddings.pt'); print('✅ Precomputed embeddings saved');"

# Exec-form CMD so uvicorn runs as PID 1 and receives SIGTERM on stop
CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "8080"]
 
 
 
 
requirements.txt CHANGED
@@ -1,6 +1,9 @@
 
1
  fastapi==0.118.0
2
  uvicorn==0.37.0
3
- torch==2.1.0
 
 
4
  sentence-transformers==2.2.2
5
  transformers==4.33.2
6
  huggingface-hub==0.16.4
@@ -10,3 +13,4 @@ langdetect==1.0.9
10
  requests==2.31.0
11
  tqdm==4.65.0
12
  PyMuPDF==1.23.0
 
 
1
+ --extra-index-url https://download.pytorch.org/whl/cpu
2
  fastapi==0.118.0
3
  uvicorn==0.37.0
4
+ torch==2.1.0+cpu
5
+ torchvision==0.16.0+cpu
6
+ torchaudio==2.1.0+cpu
7
  sentence-transformers==2.2.2
8
  transformers==4.33.2
9
  huggingface-hub==0.16.4
 
13
  requests==2.31.0
14
  tqdm==4.65.0
15
  PyMuPDF==1.23.0
16
+