teja944 committed on
Commit
474a72a
·
verified ·
1 Parent(s): 0d04fc6

Update env.py

Browse files
Files changed (1) hide show
  1. env.py +2 -1
env.py CHANGED
@@ -71,7 +71,8 @@ class CustomerSupportEnv(es.Environment):
71
  # Penalize infinite loops / max steps
72
  if self.step_count >= self.max_steps:
73
  self.done = True
74
- return self._get_obs(reward=-0.5, feedback="Max steps reached")
 
75
 
76
  if action.action_type == "ASK_INFO":
77
  asked = action.argument.lower()
 
71
  # Penalize infinite loops / max steps
72
  if self.step_count >= self.max_steps:
73
  self.done = True
74
+ final_score = grader(task, self.state_data)
75
+ return self._get_obs(reward=float(final_score), feedback="Max steps reached")
76
 
77
  if action.action_type == "ASK_INFO":
78
  asked = action.argument.lower()