Spaces:

devrajsinh2012
/

Mexar

Sleeping

Mexar / backend /evaluation /guardrail_analysis.py

devrajsinh2012

Deploy current project snapshot to Hugging Face Space

53bb779 about 1 month ago

1.35 kB

	"""
	Evaluates the domain guardrail's false-accept (false positive) rate.
	"""
	import sys
	import os
	sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))

	from modules.reasoning_engine import create_reasoning_engine

	def test_guardrails(agent_name: str):
	engine = create_reasoning_engine()

	boundary_queries = [
	"What are the economic impacts of pharmaceutical pricing?", # Often crosses medical/finance
	"Can a doctor be sued for malpractice if they misdiagnose cancer?", # Medical/Legal
	"Are taxes applied to medical equipment purchases?", # Medical/Finance
	"How do I cook a healthy meal to lower blood pressure?" # Cooking/Medical
	]

	print(f"Testing Guardrail False-Accept Rate (Threshold = {engine.DOMAIN_SIMILARITY_THRESHOLD})")

	try:
	for q in boundary_queries:
	res = engine.reason(agent_name, q)
	print(f"\nQuery: {q}")
	print(f"Accepted: {res['in_domain']}")
	exp = res.get('explainability', {})
	cb = exp.get('confidence_breakdown', {})
	domain_str = cb.get('domain_relevance', 'N/A')
	print(f"Domain Score: {domain_str}")
	except Exception as e:
	print(f"Failed guardrail test queries: {e}")

	if __name__ == "__main__":
	test_guardrails("medical_agent")