File size: 815 Bytes
5850885
 
 
 
 
 
 
bbf206f
 
5850885
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
"""TRL/Unsloth GRPO training harness — P12/P13.

Public surface:

* :class:`training.config.GRPOConfig` / :class:`training.config.CurriculumConfig`
* ``training.config.ALL_SCENARIOS``
* :func:`training.prompt.render_system_prompt`
* ``training.prompt.render_prompt_from_observation``
* :class:`training.random_agent.RandomAgent`
* :func:`training.grpo_train.train` — not re-exported from this module; import
  it from ``training.grpo_train`` directly (requires GPU + ``[train]`` extra
  plus the CUDA-specific Unsloth stack installed by ``utilities/run_training_job.py``)
"""

from __future__ import annotations

from training.config import ALL_SCENARIOS, CurriculumConfig, GRPOConfig
from training.prompt import (
    render_prompt_from_observation,
    render_system_prompt,
)
from training.random_agent import RandomAgent

# Names exported by a star-import of this module. Every entry is bound by one
# of the ``from training.<module> import ...`` statements above; entries are
# listed in sorted order rather than grouped by origin.
__all__ = [
    "ALL_SCENARIOS",  # from training.config
    "CurriculumConfig",  # from training.config
    "GRPOConfig",  # from training.config
    "RandomAgent",  # from training.random_agent
    "render_prompt_from_observation",  # from training.prompt
    "render_system_prompt",  # from training.prompt
]