Spaces:
Sleeping
Sleeping
File size: 1,154 Bytes
# Copy this file to .env and fill in the values. Never commit real secrets.
# --- inference.py (OpenAI-compatible HTTP API) ---
API_BASE_URL=https://api.openai.com/v1
MODEL_NAME=gpt-4o-mini
# Used as the API key by inference.py (alternatively, set OPENAI_API_KEY instead)
HF_TOKEN=hf_xxx
# --- CommitmentOS HTTP environment (inference + LLM eval) ---
ENV_BASE_URL=https://jayant2304-commitment-os.hf.space
# --- evaluation/evaluate_llm_checkpoints.py (local Transformers + PEFT) ---
# Base model on Hugging Face (must match what you trained on)
BASELINE_MODEL_NAME=Qwen/Qwen2.5-1.5B-Instruct
# REQUIRED: absolute or relative path to a folder containing adapter_config.json
# (e.g. ./training_output after train_grpo.py, or a downloaded adapter dir)
TRAINED_MODEL_PATH=./training_output
# Optional eval protocol (defaults shown)
EVAL_SEED=42
EVAL_MAX_STEPS=12
EVAL_TEMPERATURE=0.0
EVAL_TOP_P=1.0
EVAL_MAX_NEW_TOKENS=256
EVAL_SUCCESS_THRESHOLD=0.6
# --- training/train_grpo.py --push_to_hub only ---
# Hub repo id when using: python training/train_grpo.py ... --push_to_hub --hub_model_id your/repo
# Note: TRAINED_MODEL_NAME is not read by evaluate_llm_checkpoints.py; set TRAINED_MODEL_PATH for evaluation instead.
|