File size: 670 Bytes
c5c527c 2153d46 c5c527c | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 | # train.py
from trade_env.env.coach_env import CoachEnv
from trade_env.schemas.action import Action, ActionType
from trade_env.agent.ppo_agent import PPOAgent
env = CoachEnv()
agent = PPOAgent(state_dim=6, action_dim=5)
for episode in range(2000):
state = env.reset()
done = False
while not done:
action_idx = agent.select_action(state)
action = Action(action=ActionType(action_idx))
next_state, reward, done, info = env.step(action)
agent.store_outcome(reward, done)
state = next_state
agent.update()
print(f"Ep {episode} | PnL: {info['pnl']:.2f} | Action: {action_idx} | Trader: {info['trader_action']}") |