Spaces:

build-small-hackathon
/

blood-test-explainer

Running on Zero

blood-test-explainer / tests /test_eval_scoring.py

Dimitris

feat(eval): field-level extraction eval harness + tests

1b58e74 25 days ago

1.57 kB

	import sys
	from pathlib import Path

	sys.path.insert(0, str(Path(__file__).resolve().parents[1]))

	from src.eval_scoring import score # noqa: E402


	def _row(tests):
	return {"tests": tests}


	def _t(marker, value, unit="mg/dL", status="normal"):
	return {"marker": marker, "value": value, "unit": unit, "status": status}


	def test_perfect_match():
	gold = [_row([_t("Glucose", "95"), _t("ALT", "30", "U/L")])]
	m = score(gold, gold)
	assert m.precision == 1.0 and m.recall == 1.0 and m.f1 == 1.0
	assert m.value_acc == 1.0 and m.unit_acc == 1.0 and m.status_acc == 1.0


	def test_alias_is_matched_to_canonical():
	gold = [_row([_t("Creatinine", "1.0")])]
	pred = [_row([_t("Cr", "1.0")])] # alias
	m = score(gold, pred)
	assert m.tp == 1 and m.fp == 0 and m.fn == 0


	def test_missing_and_extra_markers():
	gold = [_row([_t("Glucose", "95"), _t("ALT", "30")])]
	pred = [_row([_t("Glucose", "95"), _t("HDL", "55")])] # missed ALT, hallucinated HDL
	m = score(gold, pred)
	assert m.tp == 1 and m.fn == 1 and m.fp == 1
	assert "alt" in m.by_marker_fn


	def test_value_numeric_tolerance_and_status():
	gold = [_row([_t("Glucose", "95", status="normal")])]
	pred = [_row([_t("Glucose", "95.0", status="high")])] # value ok (numeric), status wrong
	m = score(gold, pred)
	assert m.value_ok == 1
	assert m.status_ok == 0


	def test_unit_mismatch():
	gold = [_row([_t("ALT", "30", "U/L")])]
	pred = [_row([_t("ALT", "30", "IU/L")])]
	m = score(gold, pred)
	assert m.unit_ok == 0 and m.value_ok == 1