mahithakur committed on
Commit
754af78
·
1 Parent(s): c22ceaa

Add pre-training baseline results and graphs

Browse files
pre_training_results/baseline_comparison.svg ADDED
pre_training_results/pre_training_bar_chart.png ADDED
pre_training_results/pre_training_smoke_test.txt ADDED
File without changes
pre_training_results/pre_training_summary.json ADDED
@@ -0,0 +1,209 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "phase": "before_training",
3
+ "total_tasks": 40,
4
+ "avg_reward": 0.104,
5
+ "min_reward": -0.48,
6
+ "max_reward": 1.0,
7
+ "per_task": [
8
+ {
9
+ "task_id": 0,
10
+ "difficulty": "ultra-easy",
11
+ "reward": -0.03
12
+ },
13
+ {
14
+ "task_id": 0,
15
+ "difficulty": "ultra-easy",
16
+ "reward": 0.02
17
+ },
18
+ {
19
+ "task_id": 0,
20
+ "difficulty": "ultra-easy",
21
+ "reward": 0.787
22
+ },
23
+ {
24
+ "task_id": 0,
25
+ "difficulty": "ultra-easy",
26
+ "reward": -0.23
27
+ },
28
+ {
29
+ "task_id": 1,
30
+ "difficulty": "easy",
31
+ "reward": -0.03
32
+ },
33
+ {
34
+ "task_id": 1,
35
+ "difficulty": "easy",
36
+ "reward": 0.02
37
+ },
38
+ {
39
+ "task_id": 1,
40
+ "difficulty": "easy",
41
+ "reward": 0.8
42
+ },
43
+ {
44
+ "task_id": 1,
45
+ "difficulty": "easy",
46
+ "reward": -0.13
47
+ },
48
+ {
49
+ "task_id": 2,
50
+ "difficulty": "medium",
51
+ "reward": -0.03
52
+ },
53
+ {
54
+ "task_id": 2,
55
+ "difficulty": "medium",
56
+ "reward": 0.02
57
+ },
58
+ {
59
+ "task_id": 2,
60
+ "difficulty": "medium",
61
+ "reward": 0.795
62
+ },
63
+ {
64
+ "task_id": 2,
65
+ "difficulty": "medium",
66
+ "reward": -0.38
67
+ },
68
+ {
69
+ "task_id": 3,
70
+ "difficulty": "hard",
71
+ "reward": -0.03
72
+ },
73
+ {
74
+ "task_id": 3,
75
+ "difficulty": "hard",
76
+ "reward": 0.02
77
+ },
78
+ {
79
+ "task_id": 3,
80
+ "difficulty": "hard",
81
+ "reward": 0.0
82
+ },
83
+ {
84
+ "task_id": 3,
85
+ "difficulty": "hard",
86
+ "reward": -0.48
87
+ },
88
+ {
89
+ "task_id": 4,
90
+ "difficulty": "medium",
91
+ "reward": -0.03
92
+ },
93
+ {
94
+ "task_id": 4,
95
+ "difficulty": "medium",
96
+ "reward": 0.02
97
+ },
98
+ {
99
+ "task_id": 4,
100
+ "difficulty": "medium",
101
+ "reward": 0.795
102
+ },
103
+ {
104
+ "task_id": 4,
105
+ "difficulty": "medium",
106
+ "reward": -0.38
107
+ },
108
+ {
109
+ "task_id": 5,
110
+ "difficulty": "hard",
111
+ "reward": -0.03
112
+ },
113
+ {
114
+ "task_id": 5,
115
+ "difficulty": "hard",
116
+ "reward": 0.02
117
+ },
118
+ {
119
+ "task_id": 5,
120
+ "difficulty": "hard",
121
+ "reward": 0.8
122
+ },
123
+ {
124
+ "task_id": 5,
125
+ "difficulty": "hard",
126
+ "reward": -0.28
127
+ },
128
+ {
129
+ "task_id": 6,
130
+ "difficulty": "hard",
131
+ "reward": -0.03
132
+ },
133
+ {
134
+ "task_id": 6,
135
+ "difficulty": "hard",
136
+ "reward": 0.02
137
+ },
138
+ {
139
+ "task_id": 6,
140
+ "difficulty": "hard",
141
+ "reward": 0.803
142
+ },
143
+ {
144
+ "task_id": 6,
145
+ "difficulty": "hard",
146
+ "reward": -0.28
147
+ },
148
+ {
149
+ "task_id": 7,
150
+ "difficulty": "adversarial",
151
+ "reward": -0.18
152
+ },
153
+ {
154
+ "task_id": 7,
155
+ "difficulty": "adversarial",
156
+ "reward": -0.13
157
+ },
158
+ {
159
+ "task_id": 7,
160
+ "difficulty": "adversarial",
161
+ "reward": 1.0
162
+ },
163
+ {
164
+ "task_id": 7,
165
+ "difficulty": "adversarial",
166
+ "reward": -0.08
167
+ },
168
+ {
169
+ "task_id": 8,
170
+ "difficulty": "adversarial",
171
+ "reward": -0.18
172
+ },
173
+ {
174
+ "task_id": 8,
175
+ "difficulty": "adversarial",
176
+ "reward": -0.13
177
+ },
178
+ {
179
+ "task_id": 8,
180
+ "difficulty": "adversarial",
181
+ "reward": 1.0
182
+ },
183
+ {
184
+ "task_id": 8,
185
+ "difficulty": "adversarial",
186
+ "reward": -0.08
187
+ },
188
+ {
189
+ "task_id": 9,
190
+ "difficulty": "adversarial",
191
+ "reward": -0.18
192
+ },
193
+ {
194
+ "task_id": 9,
195
+ "difficulty": "adversarial",
196
+ "reward": -0.13
197
+ },
198
+ {
199
+ "task_id": 9,
200
+ "difficulty": "adversarial",
201
+ "reward": 1.0
202
+ },
203
+ {
204
+ "task_id": 9,
205
+ "difficulty": "adversarial",
206
+ "reward": -0.28
207
+ }
208
+ ]
209
+ }
pre_training_results/reward_breakdown.svg ADDED