Spaces:
Sleeping
Sleeping
| # Copy this file to .env and fill in the values below. Never commit real secrets. | |
| # --- inference.py (OpenAI-compatible HTTP API) --- | |
| API_BASE_URL=https://api.openai.com/v1 | |
| MODEL_NAME=gpt-4o-mini | |
| # HF_TOKEN is used as the API key by inference.py (alternatively, set OPENAI_API_KEY instead). Replace the hf_xxx placeholder with your real key. | |
| HF_TOKEN=hf_xxx | |
| # --- CommitmentOS HTTP environment (inference + LLM eval) --- | |
| ENV_BASE_URL=https://jayant2304-commitment-os.hf.space | |
| # --- evaluation/evaluate_llm_checkpoints.py (local Transformers + PEFT) --- | |
| # Base model on Hugging Face (must match what you trained on) | |
| BASELINE_MODEL_NAME=Qwen/Qwen2.5-1.5B-Instruct | |
| # REQUIRED: absolute or relative path to a folder containing adapter_config.json | |
| # (e.g. ./training_output after train_grpo.py, or a downloaded adapter dir) | |
| TRAINED_MODEL_PATH=./training_output | |
| # Optional evaluation protocol settings (the values shown are the defaults) | |
| EVAL_SEED=42 | |
| EVAL_MAX_STEPS=12 | |
| EVAL_TEMPERATURE=0.0 | |
| EVAL_TOP_P=1.0 | |
| EVAL_MAX_NEW_TOKENS=256 | |
| EVAL_SUCCESS_THRESHOLD=0.6 | |
| # --- training/train_grpo.py --push_to_hub only --- | |
| # Hub repo id when using: python training/train_grpo.py ... --push_to_hub --hub_model_id your/repo | |
| # Note: evaluate_llm_checkpoints.py does not read TRAINED_MODEL_NAME; set TRAINED_MODEL_PATH for evaluation instead. | |