# Hugging Face Space (status: paused)
# File size: 1,500 bytes
# CUDA 12.1 + cuDNN 8 runtime on Ubuntu 22.04 as the base image.
FROM nvidia/cuda:12.1.1-cudnn8-runtime-ubuntu22.04

# Build-time only: keeps apt/dpkg from prompting during `RUN` steps without
# leaking DEBIAN_FRONTEND into the environment of the running container.
ARG DEBIAN_FRONTEND=noninteractive

# All following relative paths (COPY targets, CMD) resolve against this directory.
WORKDIR /home/user/app
# --- Process / library behaviour -------------------------------------------
ENV OMP_NUM_THREADS=1 \
    TOKENIZERS_PARALLELISM=false \
    PYTHONUNBUFFERED=1

# --- Hugging Face cache locations (all under /home/user/.cache) -------------
ENV HF_HOME=/home/user/.cache/huggingface \
    TRANSFORMERS_CACHE=/home/user/.cache/huggingface/transformers \
    HF_DATASETS_CACHE=/home/user/.cache/huggingface/datasets

# --- Application settings ---------------------------------------------------
# These names are presumably read by app.py (not visible here); the two
# directory variables are also used by the later `mkdir -p` build step.
ENV OFFLOAD_DIR=/home/user/app/offload \
    MERGED_MODEL_DIR=/home/user/app/merged-model \
    QUANTIZE=4bit \
    USE_ADAPTER_INFERENCE=1 \
    FORCE_REMERGE=0 \
    ALLOW_RUNTIME_MERGE=0

# --- NVIDIA container runtime -----------------------------------------------
ENV NVIDIA_VISIBLE_DEVICES=all \
    NVIDIA_DRIVER_CAPABILITIES=compute,utility
# OS packages: Python toolchain plus git / git-lfs. The apt lists are removed
# in the same layer so they never reach the image.
# `git lfs install --system` writes the LFS filters to the system-wide git
# config, so they apply to whichever user the container runs as, not only to
# the user that executed the build step.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        ca-certificates \
        git \
        git-lfs \
        python3 \
        python3-pip \
    && rm -rf /var/lib/apt/lists/* \
    && git lfs install --system
# Bring pip itself up to date before resolving the pinned packages below.
RUN python3 -m pip install --no-cache-dir --upgrade pip

# PyTorch stack, resolved from the CUDA 12.1 wheel index.
# NOTE(review): confirm that this index actually publishes wheels for the
# pinned torch/torchvision/torchaudio versions.
RUN python3 -m pip install --no-cache-dir \
        --index-url https://download.pytorch.org/whl/cu121 \
        torch==2.0.1 \
        torchaudio==2.0.2 \
        torchvision==0.15.2

# GPU build of FAISS.
RUN python3 -m pip install --no-cache-dir faiss-gpu==1.7.2

# The version specifier is quoted on purpose: unquoted, the shell treats
# `>=0.14.1` as an output redirection (creating a file named `=0.14.1`) and
# pip only sees the bare package name, silently dropping the constraint.
RUN python3 -m pip install --no-cache-dir \
        "huggingface_hub>=0.14.1" \
        sentence-transformers==2.2.2
# Copy only the dependency manifest first so this layer stays cached until
# requirements.txt itself changes.
COPY requirements.txt ./
RUN python3 -m pip install --no-cache-dir --requirement requirements.txt

# Pin peft after everything else has been installed.
# NOTE(review): the eager upgrade strategy also upgrades peft's dependencies,
# which may replace versions pinned in earlier steps — confirm this is intended.
RUN python3 -m pip install --no-cache-dir \
        --upgrade \
        --upgrade-strategy eager \
        peft==0.12.0
# Dedicated unprivileged account. /home/user already exists (created by
# WORKDIR), so no home directory is created here.
RUN useradd --uid 1000 --home-dir /home/user --no-create-home \
        --shell /usr/sbin/nologin user

# Application source, owned by the runtime user.
COPY --chown=user:user . .

# Create the work/cache directories and hand them (and the home directory
# itself) to the runtime user so the app can write to them when not root.
RUN mkdir -p /home/user/.cache \
        "$OFFLOAD_DIR" "$MERGED_MODEL_DIR" "$HF_HOME" "$TRANSFORMERS_CACHE" \
    && chown user:user /home/user /home/user/app \
    && chown -R user:user /home/user/.cache \
        "$OFFLOAD_DIR" "$MERGED_MODEL_DIR" "$HF_HOME" "$TRANSFORMERS_CACHE"

# Drop root for everything that runs in the container.
USER user

# Documents the port the app is expected to listen on (does not publish it).
EXPOSE 7860

# Exec form: python3 runs as PID 1 and receives stop signals directly.
CMD ["python3", "app.py"]