File size: 4,280 Bytes
2073b3f
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
0f8f2c1
2073b3f
0f8f2c1
2073b3f
 
 
 
0f8f2c1
2073b3f
0f8f2c1
2073b3f
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
e56d042
2073b3f
 
 
 
 
 
456f5a3
2073b3f
 
 
 
 
 
 
e56d042
 
456f5a3
 
 
2073b3f
 
a01a8f1
0f8f2c1
 
 
2073b3f
e56d042
 
 
456f5a3
 
 
e56d042
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
# Copyright (c) Meta Platforms, Inc. and affiliates.
# All rights reserved.
#
# This source code is licensed under the BSD-style license found in the
# LICENSE file in the root directory of this source tree.

# Multi-stage build using openenv-base
# This Dockerfile is flexible and works for both:
# - In-repo environments (with local OpenEnv sources)
# - Standalone environments (with openenv from PyPI/Git)
# The build script (openenv build) handles context detection and sets appropriate build args.

# Base image is overridable at build time; declared before FROM so it can be
# used in the FROM lines of this file.
ARG BASE_IMAGE=ghcr.io/meta-pytorch/openenv-base:latest
FROM ${BASE_IMAGE} AS builder

WORKDIR /app

# git must be present so dependencies referenced by VCS URL can be installed.
# Index refresh, install and list cleanup share one layer so the apt lists
# never persist in the image.
RUN apt-get update \
    && apt-get install -y --no-install-recommends git \
    && rm -rf /var/lib/apt/lists/*

# Build arguments describing the build: the mode (standalone vs in-repo) and
# the environment name. Neither is referenced by an instruction visible in
# this file — presumably they are supplied by the build tooling.
ARG ENV_NAME=aws_rl_env
ARG BUILD_MODE=in-repo

# The environment code always sits at the root of the build context; place it
# under /app/env and continue working from there.
# For in-repo builds, openenv is already vendored in the build context.
# For standalone builds, openenv will be installed via pyproject.toml.
WORKDIR /app/env
COPY . .

# Bootstrap uv only when the base image does not already provide it (e.g.
# local builds on a different base). The installer drops its binaries in
# /root/.local/bin; they are moved to /usr/local/bin.
RUN command -v uv >/dev/null 2>&1 || { \
        curl -LsSf https://astral.sh/uv/install.sh | sh && \
        for tool in uv uvx; do \
            mv "/root/.local/bin/${tool}" "/usr/local/bin/${tool}" || exit 1; \
        done; \
    }

# Install dependencies with uv sync in two passes, both including the "dev"
# extra and both non-editable:
#   1. dependencies only (--no-install-project)
#   2. a second sync without --no-install-project
# When a uv.lock is present it is honoured strictly via --frozen; otherwise
# uv resolves on the fly. The uv download cache lives in a BuildKit cache
# mount, so it is reused across builds without ending up in the image.
RUN --mount=type=cache,target=/root/.cache/uv \
    lock_flag=""; \
    if [ -f uv.lock ]; then lock_flag="--frozen"; fi; \
    uv sync ${lock_flag} --extra dev --no-install-project --no-editable

RUN --mount=type=cache,target=/root/.cache/uv \
    lock_flag=""; \
    if [ -f uv.lock ]; then lock_flag="--frozen"; fi; \
    uv sync ${lock_flag} --extra dev --no-editable

# Final runtime stage
FROM ${BASE_IMAGE}

WORKDIR /app

# Install AWS CLI.
# This and the static AWS configuration below come BEFORE the
# COPY --from=builder steps on purpose: they do not depend on the environment
# code, so keeping them ahead of the frequently-changing copies lets their
# layers stay cached instead of re-running apt on every source change.
RUN apt-get update && \
    apt-get install -y --no-install-recommends awscli && \
    rm -rf /var/lib/apt/lists/*

# Configure AWS CLI to point to MiniStack (vendored at aws_infra/) and use dummy credentials
RUN mkdir -p /root/.aws && \
    printf '[default]\nregion = us-east-1\noutput = json\n' > /root/.aws/config && \
    printf '[default]\naws_access_key_id = test\naws_secret_access_key = test\n' > /root/.aws/credentials
ENV AWS_ENDPOINT_URL=http://localhost:4566

# Copy the uv-managed Python interpreter from builder
COPY --from=builder /root/.local/share/uv/python /root/.local/share/uv/python

# Copy the virtual environment from builder
COPY --from=builder /app/env/.venv /app/.venv

# Copy the environment code
COPY --from=builder /app/env /app/env

# Enable the web interface for OpenEnv (if applicable)
ENV ENABLE_WEB_INTERFACE=true

# Set PATH to use the virtual environment
ENV PATH="/app/.venv/bin:$PATH"

# Set PYTHONPATH so imports work correctly.
# The ':' separator is only appended when the base image already defines
# PYTHONPATH; otherwise the value would end in a bare ':' and Python would
# treat that empty entry as "current working directory".
ENV PYTHONPATH="/app/env${PYTHONPATH:+:$PYTHONPATH}"

# MiniStack pool: number of instances and the first port they listen on.
ENV AWS_RL_ENV_POOL_SIZE=8
ENV AWS_RL_ENV_MINISTACK_BASE_PORT=4566
# Dedicated port for the web playground's lazily-spawned MiniStack.
# Kept outside the pool's range so a WebSocket session can never claim it.
ENV AWS_RL_ENV_WEB_MINISTACK_PORT=4565

# DEV_MODE=1 enables live reload via --reload flag
ENV DEV_MODE=0

# Default model endpoint and model name; plain ENV values, so they can be
# overridden at `docker run` time.
ENV API_BASE_URL=https://router.huggingface.co/v1
ENV MODEL_NAME=Qwen/Qwen2.5-72B-Instruct

# Entrypoint: start the MiniStack pool, then run the FastAPI server.
# - One `ministack -d` is launched per pool slot. The slot count comes from
#   AWS_RL_ENV_POOL_SIZE (this image sets 8 via ENV; the script falls back to
#   1 only if the variable is unset or empty at runtime).
# - Slot i is given GATEWAY_PORT = AWS_RL_ENV_MINISTACK_BASE_PORT + i
#   (fallback 4566), so each instance gets a distinct port.
# - A fixed 3-second pause follows, presumably to let the instances come up
#   before the server starts.
# - The web playground's MiniStack on AWS_RL_ENV_WEB_MINISTACK_PORT is NOT
#   started here — the FastAPI server spawns it lazily on the first /web/*
#   request so training-only deployments pay zero cost.
# - uvicorn is started with `exec` so it replaces the wrapper shell and
#   receives `docker stop`'s SIGTERM directly, instead of relying on the
#   shell's implementation-specific handling of the last command.
# - DEV_MODE=1 appends `--reload --reload-dir /app/env`.
# cloudflared tunnel --url localhost:8000
CMD ["sh", "-c", "\
  POOL_SIZE=\"${AWS_RL_ENV_POOL_SIZE:-1}\"; \
  BASE_PORT=\"${AWS_RL_ENV_MINISTACK_BASE_PORT:-4566}\"; \
  i=0; while [ \"$i\" -lt \"$POOL_SIZE\" ]; do \
    GATEWAY_PORT=$((BASE_PORT + i)) ministack -d; \
    i=$((i + 1)); \
  done; \
  sleep 3; \
  exec uvicorn server.app:app --host 0.0.0.0 --port 8000 $([ \"$DEV_MODE\" = '1' ] && echo '--reload --reload-dir /app/env') \
"]