tether007 committed on
Commit ·
8ff5feb
1
Parent(s): 91e580b
graders added
Browse files
trade_env/env/coach_env.py
CHANGED
|
@@ -106,7 +106,7 @@ class CoachEnv:
|
|
| 106 |
self.loss_streak = 0
|
| 107 |
|
| 108 |
raw_reward = step_pnl - (0.1 * intr) - (0.5 * self.loss_streak if step_pnl < 0 else 0)
|
| 109 |
-
reward = max(-1.0, min(1.0, raw_reward /
|
| 110 |
self.t += 1
|
| 111 |
done = False
|
| 112 |
|
|
|
|
| 106 |
self.loss_streak = 0
|
| 107 |
|
| 108 |
raw_reward = step_pnl - (0.1 * intr) - (0.5 * self.loss_streak if step_pnl < 0 else 0)
|
| 109 |
+
reward = max(-1.0, min(1.0, raw_reward / 5.0))
|
| 110 |
self.t += 1
|
| 111 |
done = False
|
| 112 |
|