Finish-him committed on
Commit
9edd46d
verified
1 Parent(s): 92ff09a

Update Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +10 -10
Dockerfile CHANGED
@@ -5,25 +5,25 @@ FROM python:3.9-slim-bookworm
5
  WORKDIR /app
6
 
7
  # --- ETAPA 1: INSTALAR O GIT E CLONAR O SEU DATASET COMPLETO ---
8
- # Instala o git-lfs para lidar com ficheiros grandes
9
  RUN apt-get update && apt-get install -y git git-lfs && git-lfs install
10
-
11
- # Clona o repositório deste próprio Space para uma pasta chamada /app/dados
12
  RUN git clone https://huggingface.co/spaces/Finish-him/prometheus-embedding-generator ./dados && cd dados && git lfs pull
13
 
14
- # --- ETAPA 2: CONFIGURAR O AMBIENTE PYTHON ---
15
- # Copia o ficheiro de requerimentos e instala as dependências
16
  COPY requirements.txt .
17
  RUN pip install --no-cache-dir --upgrade -r requirements.txt
18
 
19
- # Copia o script de treinamento
20
- COPY train.py .
21
-
22
- # Define o caminho da cache para evitar erros de permissão
23
  ENV HF_HOME=/app/cache/huggingface
24
  ENV SENTENCE_TRANSFORMERS_HOME=/app/cache/torch
25
  RUN mkdir -p $HF_HOME && mkdir -p $SENTENCE_TRANSFORMERS_HOME && chown -R 1000:1000 /app/cache
26
 
27
- # --- ETAPA 3: EXECUTAR O SCRIPT E MANTER O CONTÊINER VIVO ---
 
 
 
 
 
 
 
28
  # Executa o script e, após o término, mantém o contêiner a correr.
29
  CMD ["sh", "-c", "python train.py && sleep infinity"]
 
5
  WORKDIR /app
6
 
7
  # --- ETAPA 1: INSTALAR O GIT E CLONAR O SEU DATASET COMPLETO ---
 
8
  RUN apt-get update && apt-get install -y git git-lfs && git-lfs install
 
 
9
  RUN git clone https://huggingface.co/spaces/Finish-him/prometheus-embedding-generator ./dados && cd dados && git lfs pull
10
 
11
+ # --- ETAPA 2: CONFIGURAR O AMBIENTE PYTHON E PRÉ-AQUECER O CACHE ---
 
12
  COPY requirements.txt .
13
  RUN pip install --no-cache-dir --upgrade -r requirements.txt
14
 
15
+ # Define o caminho da cache
 
 
 
16
  ENV HF_HOME=/app/cache/huggingface
17
  ENV SENTENCE_TRANSFORMERS_HOME=/app/cache/torch
18
  RUN mkdir -p $HF_HOME && mkdir -p $SENTENCE_TRANSFORMERS_HOME && chown -R 1000:1000 /app/cache
19
 
20
+ # --- CORREÇÃO PRINCIPAL: PRÉ-AQUECIMENTO DO CACHE ---
21
+ # Força o download do modelo durante a fase de build, que tem um timeout maior.
22
+ # The one-liner must import os itself: cache_folder is read from os.environ, and without the import the build fails with NameError.
+ RUN python -c "import os; from sentence_transformers import SentenceTransformer; SentenceTransformer('intfloat/e5-mistral-7b-instruct', cache_folder=os.environ.get('SENTENCE_TRANSFORMERS_HOME', '/app/cache/torch'), trust_remote_code=True)"
23
+
24
+ # --- ETAPA 3: EXECUTAR O SCRIPT ---
25
+ # Copia o script de treinamento
26
+ COPY train.py .
27
+
28
  # Executa o script e, após o término, mantém o contêiner a correr.
29
  CMD ["sh", "-c", "python train.py && sleep infinity"]