| from grader import grade_agent |
| from tasks import get_task |
|
|
def run_test():
    """Grade a fixed action sequence for task 1 and print a short report.

    The hard-coded sequence is passed to ``grade_agent`` with ``task_id=1``.
    The task name (looked up through ``get_task``) and selected fields of the
    grader's result are printed, followed by a pass/fail line chosen by
    ``result['is_success']``. Nothing is returned.
    """
    print("--- Starting WarehouseMaster Task 1 Test ---")

    # Run-length description of the action list: (action code, repetitions).
    # Expands to [3]*5 + [0]*5 + [4] + [2]*5 + [1]*5 + [5].
    action_runs = ((3, 5), (0, 5), (4, 1), (2, 5), (1, 5), (5, 1))
    sequence = [code for code, repeats in action_runs for _ in range(repeats)]

    result = grade_agent(task_id=1, actions=sequence)

    # The task lookup happens after grading and before any result field is
    # read, so the order of calls and printed lines is unchanged.
    task_name = get_task(1)['name']
    print(f"Task Name: {task_name}")
    print(f"Status: {result['status']}")
    print(f"Items: {result['items_collected']}/{result['target_count']}")
    print(f"Steps: {result['steps_taken']}")
    print(f"Final Score: {result['final_score']}/100")

    verdict = (
        "\n✅ Verification Successful: Environment and Grader are fully functional!"
        if result['is_success']
        else "\n❌ Verification Failed: Logic error detected."
    )
    print(verdict)
|
|
if __name__ == "__main__":
    # Run the check only when this file is executed as a script, so that
    # importing the module has no side effects.
    run_test()
|
|