Spaces:
Running
Running
| { | |
| "model": "Qwen/Qwen2.5-7B-Instruct", | |
| "api_base": "https://api-inference.huggingface.co/v1", | |
| "episodes_per_task": 1, | |
| "seed_base": 1000, | |
| "fast_mode": true, | |
| "llm_every": 8, | |
| "max_steps": null, | |
| "task_averages": { | |
| "1": 0.4942, | |
| "2": 0.4707, | |
| "3": 0.7478, | |
| "4": 0.4779 | |
| }, | |
| "overall_average": 0.54765, | |
| "all_results": [ | |
| { | |
| "task_id": 1, | |
| "seed": 1100, | |
| "total_reward": 251.84571448658104, | |
| "total_steps": 96, | |
| "elapsed_sec": 1.227782964706421, | |
| "score": 0.4942, | |
| "sub_scores": {}, | |
| "exploit_detected": false | |
| }, | |
| { | |
| "task_id": 2, | |
| "seed": 1200, | |
| "total_reward": 245.38403598363988, | |
| "total_steps": 96, | |
| "elapsed_sec": 0.8327796459197998, | |
| "score": 0.4707, | |
| "sub_scores": {}, | |
| "exploit_detected": false | |
| }, | |
| { | |
| "task_id": 3, | |
| "seed": 1300, | |
| "total_reward": 242.06080137356216, | |
| "total_steps": 96, | |
| "elapsed_sec": 0.6833479404449463, | |
| "score": 0.7478, | |
| "sub_scores": {}, | |
| "exploit_detected": false | |
| }, | |
| { | |
| "task_id": 4, | |
| "seed": 1400, | |
| "total_reward": 206.4647897455665, | |
| "total_steps": 96, | |
| "elapsed_sec": 1.0237984657287598, | |
| "score": 0.4779, | |
| "sub_scores": {}, | |
| "exploit_detected": false | |
| } | |
| ] | |
| } |