origami_env / training /Dockerfile.train
praveen287's picture
Add GRPO training notebook + Dockerfile for cloud training (#1)
610ba6d
FROM python:3.11-slim
RUN apt-get update && apt-get install -y git && rm -rf /var/lib/apt/lists/*
WORKDIR /app
# Install PyTorch with CUDA support + training stack
RUN pip install --no-cache-dir \
torch --index-url https://download.pytorch.org/whl/cu124 && \
pip install --no-cache-dir \
"trl>=0.7" \
"datasets>=2.14" \
"transformers>=4.40" \
"accelerate>=0.30" \
"peft>=0.10" \
"bitsandbytes>=0.43" \
numpy scipy pydantic
# Copy the full repo
COPY . /app
# Default: run training script
# Override TASK, MODEL, MAX_STEPS etc. via env vars on Northflank
ENV TASK="triangle"
ENV MODEL="Qwen/Qwen2.5-3B-Instruct"
ENV MAX_STEPS="600"
ENV NUM_GENERATIONS="4"
ENV LR="2e-4"
CMD ["sh", "-c", "python -m training.train_grpo --task $TASK --model $MODEL --max_steps $MAX_STEPS --num_generations $NUM_GENERATIONS --lr $LR"]
="triangle"
ENV MODEL="Qwen/Qwen2.5-3B-Instruct"
ENV MAX_STEPS="600"
ENV NUM_GENERATIONS="4"
ENV LR="2e-4"
CMD ["sh", "-c", "python -m training.train_grpo --task $TASK --model $MODEL --max_steps $MAX_STEPS --num_generations $NUM_GENERATIONS --lr $LR"]