Spaces:

devrajsinh2012
/

Mexar

Sleeping

File size: 1,346 Bytes

53bb779

"""
Evaluates the domain guardrail's false-accept (false positive) rate.
"""
import sys
import os
sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))

from modules.reasoning_engine import create_reasoning_engine

def test_guardrails(agent_name: str):
    engine = create_reasoning_engine()
    
    boundary_queries = [
        "What are the economic impacts of pharmaceutical pricing?", # Often crosses medical/finance
        "Can a doctor be sued for malpractice if they misdiagnose cancer?", # Medical/Legal
        "Are taxes applied to medical equipment purchases?", # Medical/Finance
        "How do I cook a healthy meal to lower blood pressure?" # Cooking/Medical
    ]
    
    print(f"Testing Guardrail False-Accept Rate (Threshold = {engine.DOMAIN_SIMILARITY_THRESHOLD})")
    
    try:
        for q in boundary_queries:
            res = engine.reason(agent_name, q)
            print(f"\nQuery: {q}")
            print(f"Accepted: {res['in_domain']}")
            exp = res.get('explainability', {})
            cb = exp.get('confidence_breakdown', {})
            domain_str = cb.get('domain_relevance', 'N/A')
            print(f"Domain Score: {domain_str}")
    except Exception as e:
        print(f"Failed guardrail test queries: {e}")

if __name__ == "__main__":
    test_guardrails("medical_agent")