Rayugacodes committed on
Commit
7f52093
·
verified ·
1 Parent(s): 278a0ec

Skip GRPO: merge warm-start and push to HF

Browse files
Files changed (1) hide show
  1. Dockerfile +1 -8
Dockerfile CHANGED
@@ -10,8 +10,6 @@ ENV XDG_CACHE_HOME=/tmp/cache
10
  ENV HOME=/tmp/home
11
  ENV USER=user
12
  ENV PYTHONUNBUFFERED=1
13
- ENV NVIDIA_VISIBLE_DEVICES=all
14
- ENV NVIDIA_DRIVER_CAPABILITIES=compute,utility
15
 
16
  RUN mkdir -p /tmp/hf_cache /tmp/torch_cache /tmp/cache /tmp/home && \
17
  chmod -R 777 /tmp/hf_cache /tmp/torch_cache /tmp/cache /tmp/home
@@ -27,13 +25,8 @@ RUN pip install --no-cache-dir \
27
  "accelerate>=0.34,<0.36" \
28
  huggingface_hub
29
 
30
- # Verify all imports work at build time
31
- RUN python3 -c "from trl import SFTTrainer, SFTConfig, GRPOConfig, GRPOTrainer; print('TRL OK')"
32
- RUN python3 -c "from peft import LoraConfig; print('PEFT OK')"
33
- RUN python3 -c "import torch; print('CUDA:', torch.cuda.is_available())"
34
-
35
  COPY train_on_hf.py .
36
  RUN chmod -R 777 /app
37
 
38
  EXPOSE 7860
39
- CMD ["sh", "-c", "python3 train_on_hf.py --hf-token $HF_TOKEN --skip-world-model"]
 
10
  ENV HOME=/tmp/home
11
  ENV USER=user
12
  ENV PYTHONUNBUFFERED=1
 
 
13
 
14
  RUN mkdir -p /tmp/hf_cache /tmp/torch_cache /tmp/cache /tmp/home && \
15
  chmod -R 777 /tmp/hf_cache /tmp/torch_cache /tmp/cache /tmp/home
 
25
  "accelerate>=0.34,<0.36" \
26
  huggingface_hub
27
 
 
 
 
 
 
28
  COPY train_on_hf.py .
29
  RUN chmod -R 777 /app
30
 
31
  EXPOSE 7860
32
+ CMD ["sh", "-c", "python3 train_on_hf.py --hf-token $HF_TOKEN --skip-world-model --skip-strategist"]