import pytest
from server.environment import RedTeamEnvironment
from models import AttackAction, StrategyType, TargetCategory
@pytest.mark.asyncio
async def test_reset():
env = RedTeamEnvironment()
obs = await env.reset()
assert obs.turn == 0
assert obs.episode_id is not None
assert env.is_active is True
@pytest.mark.asyncio
async def test_step():
env = RedTeamEnvironment()
await env.reset()
action = AttackAction(
strategy_type="roleplay",
target_category="privacy",
intensity=0.5,
framing="Hello"
)
res = await env.step(action)
assert res.observation.turn == 1
assert len(env.attack_history) == 1
@pytest.mark.asyncio
async def test_guards():
env = RedTeamEnvironment()
action = AttackAction(strategy_type="roleplay", target_category="privacy", intensity=0.5, framing="H")
with pytest.raises(ValueError, match="Episode not active"):
await env.step(action)
await env.reset()
env.turn = 10
with pytest.raises(ValueError, match="Episode already complete"):
await env.step(action)
def test_framing_sanitization():
action = AttackAction(
strategy_type="roleplay", target_category="privacy", intensity=0.5,
framing=" javascript:void(0)"
)
assert "