name: context-corruption-env version: "1.0.0" description: > OpenEnv environment for training epistemic robustness in LLMs. Agents identify correct answers and flag corrupted documents in a multi-doc QA setting with verifiable, objective rewards. author: "Siddh Sanghavi, Aagam Parekh" license: MIT environment: entrypoint: "environment.server:app" action_schema: "environment.actions.ContextCorruptionAction" observation_schema: "environment.actions.EpisodeObservation" max_concurrent_sessions: 64 reward: type: "objective" range: [-0.5, 1.05] components: - {name: answer_correctness, weight: 0.4} - {name: corruption_detection, weight: 0.3} - {name: false_positive_penalty, weight: 0.2} - {name: confidence_calibration, weight: 0.1} datasets: - {name: Natural Questions, url: "https://huggingface.co/datasets/google-research-datasets/natural_questions"} - {name: PopQA, url: "https://huggingface.co/datasets/akariasai/PopQA"} - {name: FaithEval, url: "https://github.com/SalesforceAIResearch/FaithEval"} citation: | @misc{contextcorruption2026, title={ContextCorruption-Env: Training Epistemic Robustness in LLMs}, year={2026}, note={OpenEnv Hackathon Submission} }