Secured

Sleeping

App Files Files Community

Secured / tests /test_eval_runner.py

gowtham0992

Ship MiniCPM LoRA v3

cc862d5 21 days ago

Raw

History Blame Contribute Delete

5.83 kB

	import importlib.util
	from pathlib import Path

	from jawbreaker.analyzers import load_json_prediction, validate_prediction


	def load_run_eval_module():
	spec = importlib.util.spec_from_file_location("run_eval", Path("eval/run_eval.py"))
	assert spec is not None
	assert spec.loader is not None
	module = importlib.util.module_from_spec(spec)
	spec.loader.exec_module(module)
	return module


	def test_validate_prediction_accepts_complete_prediction() -> None:
	prediction = {
	"risk_level": "dangerous",
	"scam_type": "credential_theft",
	"summary": "This is pretending to be a bank.",
	"tactics": ["fake authority", "credential request"],
	"safest_action": "Do not click links. Open the official app directly.",
	"trusted_person_message": "Can you check this for me?",
	"scam_dna": {
	"impersonates": "bank",
	"pressure": "account locked",
	"ask": "login",
	"risk": "credential theft",
	},
	}

	assert validate_prediction(prediction) == []


	def test_score_rows_tracks_dangerous_as_safe() -> None:
	run_eval = load_run_eval_module()
	rows = [
	{
	"id": "case_1",
	"category": "bank_phishing",
	"input": "Bank login now",
	"expected_risk_level": "dangerous",
	"expected_scam_type": "credential_theft",
	"expected_tactics": ["credential request"],
	}
	]
	predictions = {
	"case_1": {
	"risk_level": "safe",
	"scam_type": "none",
	"summary": "Looks fine.",
	"tactics": [],
	"safest_action": "No action needed.",
	"trusted_person_message": "Can you check this?",
	"scam_dna": {"impersonates": "", "pressure": "", "ask": "", "risk": ""},
	}
	}

	metrics = run_eval.score_rows(rows, predictions, elapsed=0.01)

	assert metrics["risk_level_accuracy"] == 0
	assert metrics["dangerous_as_safe"] == ["case_1"]
	assert metrics["dangerous_as_needs_check"] == []
	assert metrics["suspicious_as_safe"] == []


	def test_score_rows_tracks_dangerous_undercalls_and_suspicious_as_safe() -> None:
	run_eval = load_run_eval_module()
	rows = [
	{
	"id": "danger_case",
	"category": "family_impersonation",
	"input": "Grandpa, I need money before midnight.",
	"expected_risk_level": "dangerous",
	"expected_scam_type": "family_impersonation",
	"expected_tactics": ["payment pressure"],
	},
	{
	"id": "suspicious_case",
	"category": "suspicious",
	"input": "Open this marketplace escrow link.",
	"expected_risk_level": "suspicious",
	"expected_scam_type": "fake_escrow",
	"expected_tactics": ["suspicious link"],
	},
	]
	base_prediction = {
	"scam_type": "unknown",
	"summary": "Check this.",
	"tactics": [],
	"safest_action": "Verify through a trusted route.",
	"trusted_person_message": "Can you check this?",
	"scam_dna": {"impersonates": "", "pressure": "", "ask": "", "risk": ""},
	}
	predictions = {
	"danger_case": {**base_prediction, "risk_level": "needs_check"},
	"suspicious_case": {**base_prediction, "risk_level": "safe"},
	}

	metrics = run_eval.score_rows(rows, predictions, elapsed=0.01)

	assert metrics["dangerous_as_needs_check"] == ["danger_case"]
	assert metrics["suspicious_as_safe"] == ["suspicious_case"]


	def test_score_rows_tracks_model_errors() -> None:
	run_eval = load_run_eval_module()
	rows = [
	{
	"id": "case_1",
	"category": "safe_benign",
	"input": "Dentist appointment Tuesday.",
	"expected_risk_level": "safe",
	"expected_scam_type": "none",
	"expected_tactics": [],
	}
	]
	predictions = {
	"case_1": {
	"risk_level": "safe",
	"scam_type": "none",
	"summary": "Looks fine.",
	"tactics": [],
	"safest_action": "No action needed.",
	"trusted_person_message": "Can you check this?",
	"scam_dna": {"impersonates": "", "pressure": "", "ask": "", "risk": ""},
	"_jawbreaker_model_error": "JSONDecodeError('empty')",
	}
	}

	metrics = run_eval.score_rows(rows, predictions, elapsed=0.01)

	assert metrics["model_errors"] == [{"id": "case_1", "error": "JSONDecodeError('empty')"}]


	def test_has_unsafe_action_allows_do_not_send_money() -> None:
	run_eval = load_run_eval_module()

	assert not run_eval.has_unsafe_action("Do not send money. Call a known number.")
	assert run_eval.has_unsafe_action("Send money to verify the account.")


	def test_load_json_prediction_extracts_embedded_object() -> None:
	prediction = load_json_prediction(
	'Here is the result: {"risk_level": "safe", "scam_type": "none", '
	'"summary": "ok", "tactics": [], "safest_action": "No action.", '
	'"trusted_person_message": "Please check.", '
	'"scam_dna": {"impersonates": "", "pressure": "", "ask": "", "risk": ""}}'
	)

	assert prediction["risk_level"] == "safe"


	def test_load_json_prediction_ignores_qwen_thinking_tokens() -> None:
	prediction = load_json_prediction(
	'<think>I should reason internally.</think>{"risk_level": "dangerous", '
	'"scam_type": "family_impersonation", "summary": "scam", '
	'"tactics": ["secrecy"], "safest_action": "Do not reply.", '
	'"trusted_person_message": "Can you check this?", '
	'"scam_dna": {"impersonates": "family", "pressure": "secret", "ask": "money", "risk": "payment"}}'
	)

	assert prediction["risk_level"] == "dangerous"