# pytest configuration.
[pytest]
# Custom markers, one "name: description" entry per indented line.
# "judge" tags tests that rely on LLM-as-judge assertions; leave them out of a
# run with: pytest -m "not judge"
markers =
    judge: LLM-as-judge assertions (deselect with -m "not judge")