# Model identifiers, each written as "<owner>/<model-name>".
# NOTE(review): these look like Hugging Face Hub repo ids — confirm against the consumer.
# Element order is kept exactly as originally written, in case the consumer depends on it.
MODEL_IDS = [
    "sachiniyer/Qwen2.5-0.5B-GRPO-LLMJudge-Schwinn",
    "sachiniyer/Qwen2.5-0.5B-DPO-Schwinn",
    "sachiniyer/Qwen2.5-0.5B-PPO-Schwinn",
    "Qwen/Qwen2.5-0.5B",
    "sachiniyer/SmolLM2-DPO-Schwinn-SmolLM2-Base",
    "sachiniyer/SmolLM2-DPO-Schwinn-gpt-5-mini-base",
    "sachiniyer/SmolLM2-FT-SFT-Learning",
    "sachiniyer/DeepSeek-R1-LoRA-Finetuned",
    "sachiniyer/DeepSeek-R1-QLoRA-Finetuned",
]