[ "tests/test_api_reset.py::test_reset_defaults_to_cascading_timeout_when_task_missing", "tests/test_api_reset.py::test_reset_rejects_unknown_explicit_task", "tests/test_env_task_context.py::test_job_generator_rate_resolved_uses_config", "tests/test_env_task_context.py::test_registry_auth_matches_default_detects_corruption", "tests/test_env_task_context.py::test_restore_defaults_adds_job_generator_config", "tests/test_graders.py::test_grade_backpressure_cascade_continuous", "tests/test_graders.py::test_grade_byzantine_queue_fault_cases", "tests/test_graders.py::test_grade_cascading_timeout_boundaries", "tests/test_graders.py::test_grade_distributed_lock_starvation_cases", "tests/test_graders.py::test_grade_job_generator_runaway_thresholds", "tests/test_graders.py::test_grade_registry_corruption_thresholds", "tests/test_graders.py::test_grade_route_partition_threshold", "tests/test_inference_format.py::test_attempt_history_block_renders_all_attempts", "tests/test_inference_format.py::test_build_prompt_contains_symptoms_and_history", "tests/test_inference_format.py::test_end_log_line_includes_score_and_reward_list", "tests/test_inference_format.py::test_episode_score_clamps_terminal_reward_to_unit_interval", "tests/test_inference_format.py::test_extract_command_prefers_first_json_object_with_command", "tests/test_inference_format.py::test_extract_command_reads_fenced_json_payload", "tests/test_inference_format.py::test_extract_command_reads_json_after_reasoning_preamble", "tests/test_inference_format.py::test_extract_command_reads_json_embedded_in_text", "tests/test_inference_format.py::test_extract_command_reads_json_payload", "tests/test_inference_format.py::test_extract_command_rejects_non_json_code_fence", "tests/test_inference_format.py::test_extract_command_requires_command_even_with_reasoning", "tests/test_inference_format.py::test_extract_command_returns_none_when_empty", "tests/test_inference_format.py::test_extract_reasoning_when_present", "tests/test_inference_format.py::test_parse_tasks_default_and_override", "tests/test_inference_format.py::test_single_line_removes_newlines", "tests/test_inference_format.py::test_task_symptom_block_includes_new_tasks", "tests/test_inference_format.py::test_task_symptom_block_is_non_empty", "tests/test_models.py::test_action_rejects_empty_command", "tests/test_models.py::test_observation_roundtrip", "tests/test_models.py::test_system_metrics_rejects_success_rate_above_one" ]