Spaces:

seatyyy
/

skillforge

Sleeping

seatyyy committed 2 days ago

Commit

697e014

verified ·

1 Parent(s): 8c7f5b4

Upload folder using huggingface_hub

Files changed (1) hide show

server/environment.py CHANGED Viewed

@@ -59,6 +59,7 @@ class SkillForgeEnvironment(Environment):
     def step(self, action: SkillForgeAction) -> SkillForgeObservation:
         self._state.step_count += 1
         task = TASKS[self.task_idx]
         # --- create_skill: store template, stay on current task ---
         if action.action_type == "create_skill":
@@ -102,9 +103,12 @@ class SkillForgeEnvironment(Environment):
         result_correct, result_output = self._evaluate(exec_code, task["dataframe"], task["expected_output"])
         if result_correct:
-            reward = 2.0
-            reward -= 0.001 * token_cost
             if action.action_type == "use_skill":
                 reward += 0.5
             self.tasks_solved += 1

     def step(self, action: SkillForgeAction) -> SkillForgeObservation:
         self._state.step_count += 1
         task = TASKS[self.task_idx]
+        reward = 0.0
         # --- create_skill: store template, stay on current task ---
         if action.action_type == "create_skill":
         result_correct, result_output = self._evaluate(exec_code, task["dataframe"], task["expected_output"])
+        if action.action_type == "create_skill":
+            result_correct = True
         if result_correct:
+            reward += 2.0
+            reward -= 0.001 * token_cost
             if action.action_type == "use_skill":
                 reward += 0.5
             self.tasks_solved += 1