alisamak committed on
Commit
e515870
·
verified ·
1 Parent(s): 4e62403

Update evaluate_agent.py

Browse files
Files changed (1) hide show
  1. evaluate_agent.py +21 -21
evaluate_agent.py CHANGED
@@ -1,28 +1,28 @@
1
  def test_questions():
2
  return [
3
- {
4
- "task_id": "q7",
5
- "question": (
6
- "Given this table defining * on the set S = {a, b, c, d, e}\n\n"
7
- "|*|a|b|c|d|e|\n"
8
- "|---|---|---|---|---|---|\n"
9
- "|a|a|b|c|b|d|\n"
10
- "|b|b|c|a|e|c|\n"
11
- "|c|c|a|b|b|a|\n"
12
- "|d|b|e|b|e|d|\n"
13
- "|e|d|b|a|d|c|\n\n"
14
- "Provide the subset of S involved in any possible counter-examples that prove * is not commutative. "
15
- "Provide your answer as a comma-separated list of the elements in the set in alphabetical order."
16
- ),
17
- "expected_keywords": ["b, e"]
18
- },
19
  # {
20
- # "task_id": "q3",
21
- # "question": (
22
- # "'.rewsna eht sa \"tfel\" drow eht fo etisoppo eht etirw ,ecnetnes siht dnatsrednu uoy fI'"
23
- # ),
24
- # "expected_keywords": ["right"]
 
 
 
 
 
 
 
 
 
25
  # },
 
 
 
 
 
 
 
26
  # {
27
  # "task_id": "q10",
28
  # "question": (
 
1
  def test_questions():
2
  return [
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3
  # {
4
+ # "task_id": "q7",
5
+ # "question": (
6
+ # "Given this table defining * on the set S = {a, b, c, d, e}\n\n"
7
+ # "|*|a|b|c|d|e|\n"
8
+ # "|---|---|---|---|---|---|\n"
9
+ # "|a|a|b|c|b|d|\n"
10
+ # "|b|b|c|a|e|c|\n"
11
+ # "|c|c|a|b|b|a|\n"
12
+ # "|d|b|e|b|e|d|\n"
13
+ # "|e|d|b|a|d|c|\n\n"
14
+ # "Provide the subset of S involved in any possible counter-examples that prove * is not commutative. "
15
+ # "Provide your answer as a comma-separated list of the elements in the set in alphabetical order."
16
+ # ),
17
+ # "expected_keywords": ["b, e"]
18
  # },
19
+ {
20
+ "task_id": "q3",
21
+ "question": (
22
+ "'.rewsna eht sa \"tfel\" drow eht fo etisoppo eht etirw ,ecnetnes siht dnatsrednu uoy fI'"
23
+ ),
24
+ "expected_keywords": ["right"]
25
+ },
26
  # {
27
  # "task_id": "q10",
28
  # "question": (