Spaces:

Rayugacodes
/

Breach-OS

Sleeping

App Files Files Community

Breach-OS / tests /test_environment.py

subhdotsol

test(environment): add injection tests — custom reward_computer and llm_pipeline are called

613f214 about 1 month ago

raw

history blame contribute delete

2.18 kB

	import pytest
	from server.environment import RedTeamEnvironment
	from models import AttackAction, StrategyType, TargetCategory

	@pytest.mark.asyncio
	async def test_reset():
	env = RedTeamEnvironment()
	obs = await env.reset()
	assert obs.turn == 0
	assert obs.episode_id is not None
	assert env.is_active is True

	@pytest.mark.asyncio
	async def test_step():
	env = RedTeamEnvironment()
	await env.reset()
	action = AttackAction(
	strategy_type="roleplay",
	target_category="privacy",
	intensity=0.5,
	framing="Hello"
	)
	res = await env.step(action)
	assert res.observation.turn == 1
	assert len(env.attack_history) == 1

	@pytest.mark.asyncio
	async def test_guards():
	env = RedTeamEnvironment()
	action = AttackAction(strategy_type="roleplay", target_category="privacy", intensity=0.5, framing="H")
	with pytest.raises(ValueError, match="Episode not active"):
	await env.step(action)

	await env.reset()
	env.turn = 10
	with pytest.raises(ValueError, match="Episode already complete"):
	await env.step(action)

	def test_framing_sanitization():
	action = AttackAction(
	strategy_type="roleplay", target_category="privacy", intensity=0.5,
	framing="<script>alert(1)</script> javascript:void(0)"
	)
	assert "<script>" not in action.framing
	assert "javascript:" not in action.framing
	assert "[FILTERED]" in action.framing

	@pytest.mark.asyncio
	async def test_injections():
	env = RedTeamEnvironment()

	called_reward = False
	def mock_reward(**kwargs):
	nonlocal called_reward
	called_reward = True
	return {"total_reward": 1.0}

	called_llm = False
	async def mock_llm(*args):
	nonlocal called_llm
	called_llm = True
	return {"defender_response": "ok", "attack_success": 0.5}

	env.set_reward_computer(mock_reward)
	env.set_llm_pipeline(mock_llm)

	await env.reset()
	action = AttackAction(strategy_type="roleplay", target_category="privacy", intensity=0.5, framing="H")
	await env.step(action)

	assert called_reward is True
	assert called_llm is True