Veer15's picture
chore: deploy distributed systems debug environment
b641d3d verified
[
"tests/test_api_reset.py::test_reset_defaults_to_cascading_timeout_when_task_missing",
"tests/test_api_reset.py::test_reset_rejects_unknown_explicit_task",
"tests/test_env_task_context.py::test_job_generator_rate_resolved_uses_config",
"tests/test_env_task_context.py::test_registry_auth_matches_default_detects_corruption",
"tests/test_env_task_context.py::test_restore_defaults_adds_job_generator_config",
"tests/test_graders.py::test_grade_backpressure_cascade_continuous",
"tests/test_graders.py::test_grade_byzantine_queue_fault_cases",
"tests/test_graders.py::test_grade_cascading_timeout_boundaries",
"tests/test_graders.py::test_grade_distributed_lock_starvation_cases",
"tests/test_graders.py::test_grade_job_generator_runaway_thresholds",
"tests/test_graders.py::test_grade_registry_corruption_thresholds",
"tests/test_graders.py::test_grade_route_partition_threshold",
"tests/test_inference_format.py::test_attempt_history_block_renders_all_attempts",
"tests/test_inference_format.py::test_build_prompt_contains_symptoms_and_history",
"tests/test_inference_format.py::test_end_log_line_includes_score_and_reward_list",
"tests/test_inference_format.py::test_episode_score_clamps_terminal_reward_to_unit_interval",
"tests/test_inference_format.py::test_extract_command_prefers_first_json_object_with_command",
"tests/test_inference_format.py::test_extract_command_reads_fenced_json_payload",
"tests/test_inference_format.py::test_extract_command_reads_json_after_reasoning_preamble",
"tests/test_inference_format.py::test_extract_command_reads_json_embedded_in_text",
"tests/test_inference_format.py::test_extract_command_reads_json_payload",
"tests/test_inference_format.py::test_extract_command_rejects_non_json_code_fence",
"tests/test_inference_format.py::test_extract_command_requires_command_even_with_reasoning",
"tests/test_inference_format.py::test_extract_command_returns_none_when_empty",
"tests/test_inference_format.py::test_extract_reasoning_when_present",
"tests/test_inference_format.py::test_parse_tasks_default_and_override",
"tests/test_inference_format.py::test_single_line_removes_newlines",
"tests/test_inference_format.py::test_task_symptom_block_includes_new_tasks",
"tests/test_inference_format.py::test_task_symptom_block_is_non_empty",
"tests/test_models.py::test_action_rejects_empty_command",
"tests/test_models.py::test_observation_roundtrip",
"tests/test_models.py::test_system_metrics_rejects_success_rate_above_one"
]