File size: 421 Bytes
308e4ba
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
[
  {
    "train_loss": -0.15511070310068362,
    "train_policy_loss": 0.0,
    "train_kl_loss": -3.102214025259018,
    "train_reward": 0.30753333568573,
    "baseline": 0.3100000023841858,
    "epoch": 1
  },
  {
    "train_loss": -0.24350257394835353,
    "train_policy_loss": 0.0,
    "train_kl_loss": -5.263461359739304,
    "train_reward": 0.300500001758337,
    "baseline": 0.3100000023841858,
    "epoch": 2
  }
]