# Copy to .env and fill in. Never commit real secrets.
# Format: one KEY=value per line, no spaces around "=", comments on their own line.

# --- inference.py (OpenAI-compatible HTTP API) ---
API_BASE_URL=https://api.openai.com/v1
MODEL_NAME=gpt-4o-mini
# Used as API key by inference.py (or set OPENAI_API_KEY instead)
HF_TOKEN=hf_xxx

# --- CommitmentOS HTTP environment (inference + LLM eval) ---
ENV_BASE_URL=https://jayant2304-commitment-os.hf.space

# --- evaluation/evaluate_llm_checkpoints.py (local Transformers + PEFT) ---
# Base model on Hugging Face (must match what you trained on)
BASELINE_MODEL_NAME=Qwen/Qwen2.5-1.5B-Instruct
# REQUIRED: absolute or relative path to a folder containing adapter_config.json
# (e.g. ./training_output after train_grpo.py, or a downloaded adapter dir)
TRAINED_MODEL_PATH=./training_output

# Optional eval protocol (defaults shown)
EVAL_SEED=42
EVAL_MAX_STEPS=12
EVAL_TEMPERATURE=0.0
EVAL_TOP_P=1.0
EVAL_MAX_NEW_TOKENS=256
EVAL_SUCCESS_THRESHOLD=0.6

# --- training/train_grpo.py --push_to_hub only ---
# Hub repo id when using:
#   python training/train_grpo.py ... --push_to_hub --hub_model_id your/repo
# TRAINED_MODEL_NAME is not read by evaluate_llm_checkpoints.py; use TRAINED_MODEL_PATH.