File size: 1,867 Bytes
844074c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
[
  {
    "step": 200,
    "policy_loss": 6.2601,
    "value_loss": 0.3127,
    "lr": 2.82e-05,
    "gnorm": 9.03
  },
  {
    "step": 400,
    "policy_loss": 4.3384,
    "value_loss": 0.2786,
    "lr": 5.64e-05,
    "gnorm": 6.71
  },
  {
    "step": 600,
    "policy_loss": 3.9855,
    "value_loss": 0.2473,
    "lr": 8.46e-05,
    "gnorm": 4.17
  },
  {
    "step": 800,
    "policy_loss": 3.7476,
    "value_loss": 0.231,
    "lr": 0.000113,
    "gnorm": 2.66
  },
  {
    "step": 1000,
    "policy_loss": 3.5844,
    "value_loss": 0.224,
    "lr": 0.000141,
    "gnorm": 2.37
  },
  {
    "step": 1200,
    "policy_loss": 3.4408,
    "value_loss": 0.2213,
    "lr": 0.000169,
    "gnorm": 1.9
  },
  {
    "step": 1400,
    "policy_loss": 3.3147,
    "value_loss": 0.2153,
    "lr": 0.000197,
    "gnorm": 1.73
  },
  {
    "step": 1600,
    "policy_loss": 3.1981,
    "value_loss": 0.2103,
    "lr": 0.0002,
    "gnorm": 1.48
  },
  {
    "step": 1800,
    "policy_loss": 3.0781,
    "value_loss": 0.2041,
    "lr": 0.0002,
    "gnorm": 1.52
  },
  {
    "step": 2000,
    "policy_loss": 2.9918,
    "value_loss": 0.2015,
    "lr": 0.0002,
    "gnorm": 1.26
  },
  {
    "step": 2200,
    "policy_loss": 2.9199,
    "value_loss": 0.1948,
    "lr": 0.0002,
    "gnorm": 1.24
  },
  {
    "step": 2400,
    "policy_loss": 2.8578,
    "value_loss": 0.1895,
    "lr": 0.0002,
    "gnorm": 1.14
  },
  {
    "step": 2600,
    "policy_loss": 2.8174,
    "value_loss": 0.1862,
    "lr": 0.0002,
    "gnorm": 1.1
  },
  {
    "step": 2800,
    "policy_loss": 2.7771,
    "value_loss": 0.1822,
    "lr": 0.0002,
    "gnorm": 1.24
  },
  {
    "step": 3000,
    "policy_loss": 2.7415,
    "value_loss": 0.1807,
    "lr": 0.000199,
    "gnorm": 1.14
  },
  {
    "step": 3200,
    "policy_loss": 2.6978,
    "value_loss": 0.1727,
    "lr": 0.000199,
    "gnorm": 1.1
  }
]