OPENSPEC_Hackhathon / test_run.py
SushCodex's picture
Upload 14 files
85768b6 verified
raw
history blame contribute delete
911 Bytes
from grader import grade_agent
from tasks import get_task
def run_test():
    """Replay a fixed action list for task 1 through the grader and print a report.

    Builds a hard-coded sequence of integer action codes, submits it to
    ``grade_agent`` with ``task_id=1``, and prints the task name (looked up
    via ``get_task(1)``) followed by the status, item count, step count and
    final score taken from the grader's result mapping. A success or failure
    banner is printed last, chosen by ``result['is_success']``.

    Returns nothing; all output goes to stdout.
    """
    print("--- Starting WarehouseMaster Task 1 Test ---")

    # Intended route per the author's note: [0,0] -> [5,5] -> [0,0], i.e.
    # 5x Right (3), 5x Up (0), Pick (4), 5x Left (2), 5x Down (1), Drop (5).
    # NOTE(review): the meaning of each action code is defined by the
    # environment, not in this file -- confirm against the env's action table.
    legs = ([3] * 5, [0] * 5, [4], [2] * 5, [1] * 5, [5])
    sequence = [action for leg in legs for action in leg]

    # Hand the whole action list to the automated grader in one call.
    result = grade_agent(task_id=1, actions=sequence)

    task_name = get_task(1)['name']
    print(f"Task Name: {task_name}")
    print(f"Status: {result['status']}")
    print(f"Items: {result['items_collected']}/{result['target_count']}")
    print(f"Steps: {result['steps_taken']}")
    print(f"Final Score: {result['final_score']}/100")

    verdict = (
        "\n✅ Verification Successful: Environment and Grader are fully functional!"
        if result['is_success']
        else "\n❌ Verification Failed: Logic error detected."
    )
    print(verdict)
# Script entry point: run the smoke test only when this file is executed
# directly, so importing the module has no side effects.
if __name__ == "__main__":
    run_test()