ATISHAY005 committed on
Commit
6b7f681
·
1 Parent(s): 93a3442

Final OpenEnv submission fix

Browse files
Files changed (2) hide show
  1. evaluation/grader.py +8 -20
  2. openenv.yaml +8 -3
evaluation/grader.py CHANGED
@@ -1,24 +1,12 @@
1
- def grade_easy(episode_rewards):
2
- # maximize engagement
3
- return min(1.0, sum(episode_rewards) / max(1, len(episode_rewards)))
4
 
5
 
6
- def grade_medium(episode_rewards):
7
- # engagement + diversity (simulated)
8
- score = sum(episode_rewards) / max(1, len(episode_rewards))
9
- diversity_bonus = 0.1
10
- return min(1.0, score + diversity_bonus)
11
 
12
 
13
- def grade_hard(episode_rewards):
14
- # engagement + alignment + penalties
15
- score = sum(episode_rewards) / max(1, len(episode_rewards))
16
- penalty = 0.2
17
- return max(0.0, min(1.0, score - penalty))
18
-
19
-
20
- TASK_GRADERS = {
21
- "easy": grade_easy,
22
- "medium": grade_medium,
23
- "hard": grade_hard,
24
- }
 
1
+ def grade_easy(rewards):
2
+ return min(1.0, sum(rewards) / max(1, len(rewards)))
 
3
 
4
 
5
+ def grade_medium(rewards):
6
+ score = sum(rewards) / max(1, len(rewards))
7
+ return min(1.0, score + 0.1)
 
 
8
 
9
 
10
+ def grade_hard(rewards):
11
+ score = sum(rewards) / max(1, len(rewards))
12
+ return max(0.0, min(1.0, score - 0.2))
 
 
 
 
 
 
 
 
 
openenv.yaml CHANGED
@@ -1,9 +1,14 @@
1
  name: value-aware-feed-ranking
2
 
3
  tasks:
4
- - easy
5
- - medium
6
- - hard
 
 
 
 
 
7
 
8
  observation_space:
9
  type: UserState
 
1
  name: value-aware-feed-ranking
2
 
3
  tasks:
4
+ - name: easy
5
+ grader: evaluation.grader:grade_easy
6
+
7
+ - name: medium
8
+ grader: evaluation.grader:grade_medium
9
+
10
+ - name: hard
11
+ grader: evaluation.grader:grade_hard
12
 
13
  observation_space:
14
  type: UserState