Spaces:
Sleeping
Sleeping
Nikhil Pravin Pise commited on
Commit ·
696f787
1
Parent(s): fd5543a
Fix codebase issues: linting, types, tests, and security.
Browse files- Resolved over 3,000 ruff linting violations
- Enforced strict type checking with mypy
- Fixed infinite loop in pytest suite by migrating obsolete tests
- Remediated security warnings flagged by Bandit
This view is limited to 50 files because it contains too many changes.
See raw diff
- Makefile +4 -2
- airflow/dags/ingest_pdfs.py +7 -4
- alembic/env.py +9 -11
- alembic/versions/001_initial.py +81 -0
- api/app/main.py +10 -13
- api/app/routes/analyze.py +31 -37
- api/app/routes/biomarkers.py +16 -17
- api/app/routes/health.py +12 -15
- api/app/services/extraction.py +27 -27
- api/app/services/ragbot.py +69 -62
- archive/evolution/__init__.py +11 -17
- archive/evolution/director.py +55 -55
- archive/evolution/pareto.py +48 -46
- archive/sop_evolution.py +2 -1
- {tests → archive/tests}/test_evolution_loop.py +37 -37
- {tests → archive/tests}/test_evolution_quick.py +14 -13
- docker-compose.yml +20 -0
- gradio_launcher.py +24 -0
- huggingface/app.py +180 -133
- pytest.ini +3 -0
- requirements.txt +0 -41
- scripts/chat.py +73 -73
- scripts/monitor_test.py +1 -1
- scripts/setup_embeddings.py +16 -16
- scripts/test_chat_demo.py +4 -5
- scripts/test_extraction.py +8 -7
- src/agents/biomarker_analyzer.py +23 -23
- src/agents/biomarker_linker.py +41 -41
- src/agents/clinical_guidelines.py +43 -42
- src/agents/confidence_assessor.py +46 -46
- src/agents/disease_explainer.py +36 -34
- src/agents/response_synthesizer.py +52 -51
- src/biomarker_normalization.py +1 -2
- src/biomarker_validator.py +31 -31
- src/config.py +15 -14
- src/database.py +2 -2
- src/dependencies.py +0 -3
- src/evaluation/__init__.py +7 -7
- src/evaluation/evaluators.py +72 -70
- src/exceptions.py +2 -3
- src/gradio_app.py +65 -25
- src/llm_config.py +68 -67
- src/main.py +20 -23
- src/middlewares.py +24 -23
- src/pdf_processor.py +52 -53
- src/repositories/analysis.py +2 -4
- src/repositories/document.py +2 -4
- src/routers/analyze.py +28 -32
- src/routers/ask.py +25 -12
- src/routers/health.py +9 -7
Makefile
CHANGED
|
@@ -117,12 +117,14 @@ index-pdfs: ## Parse and index all medical PDFs
|
|
| 117 |
from pathlib import Path; \
|
| 118 |
from src.services.pdf_parser.service import make_pdf_parser_service; \
|
| 119 |
from src.services.indexing.service import IndexingService; \
|
|
|
|
| 120 |
from src.services.embeddings.service import make_embedding_service; \
|
| 121 |
from src.services.opensearch.client import make_opensearch_client; \
|
| 122 |
parser = make_pdf_parser_service(); \
|
| 123 |
-
|
|
|
|
| 124 |
docs = parser.parse_directory(Path('data/medical_pdfs')); \
|
| 125 |
-
[idx.index_text(d.full_text,
|
| 126 |
print(f'Indexed {len(docs)} documents')"
|
| 127 |
|
| 128 |
# ---------------------------------------------------------------------------
|
|
|
|
| 117 |
from pathlib import Path; \
|
| 118 |
from src.services.pdf_parser.service import make_pdf_parser_service; \
|
| 119 |
from src.services.indexing.service import IndexingService; \
|
| 120 |
+
from src.services.indexing.text_chunker import MedicalTextChunker; \
|
| 121 |
from src.services.embeddings.service import make_embedding_service; \
|
| 122 |
from src.services.opensearch.client import make_opensearch_client; \
|
| 123 |
parser = make_pdf_parser_service(); \
|
| 124 |
+
chunker = MedicalTextChunker(); \
|
| 125 |
+
idx = IndexingService(chunker, make_embedding_service(), make_opensearch_client()); \
|
| 126 |
docs = parser.parse_directory(Path('data/medical_pdfs')); \
|
| 127 |
+
[idx.index_text(d.full_text, title=d.filename, source_file=d.filename) for d in docs if d.full_text]; \
|
| 128 |
print(f'Indexed {len(docs)} documents')"
|
| 129 |
|
| 130 |
# ---------------------------------------------------------------------------
|
airflow/dags/ingest_pdfs.py
CHANGED
|
@@ -9,9 +9,10 @@ from __future__ import annotations
|
|
| 9 |
|
| 10 |
from datetime import datetime, timedelta
|
| 11 |
|
| 12 |
-
from airflow import DAG
|
| 13 |
from airflow.operators.python import PythonOperator
|
| 14 |
|
|
|
|
|
|
|
| 15 |
default_args = {
|
| 16 |
"owner": "mediguard",
|
| 17 |
"retries": 2,
|
|
@@ -26,23 +27,25 @@ def _ingest_pdfs(**kwargs):
|
|
| 26 |
|
| 27 |
from src.services.embeddings.service import make_embedding_service
|
| 28 |
from src.services.indexing.service import IndexingService
|
|
|
|
| 29 |
from src.services.opensearch.client import make_opensearch_client
|
| 30 |
from src.services.pdf_parser.service import make_pdf_parser_service
|
| 31 |
from src.settings import get_settings
|
| 32 |
|
| 33 |
settings = get_settings()
|
| 34 |
-
pdf_dir = Path(settings.
|
| 35 |
|
| 36 |
parser = make_pdf_parser_service()
|
| 37 |
embedding_svc = make_embedding_service()
|
| 38 |
os_client = make_opensearch_client()
|
| 39 |
-
|
|
|
|
| 40 |
|
| 41 |
docs = parser.parse_directory(pdf_dir)
|
| 42 |
indexed = 0
|
| 43 |
for doc in docs:
|
| 44 |
if doc.full_text and not doc.error:
|
| 45 |
-
indexing_svc.index_text(doc.full_text,
|
| 46 |
indexed += 1
|
| 47 |
|
| 48 |
print(f"Ingested {indexed}/{len(docs)} documents")
|
|
|
|
| 9 |
|
| 10 |
from datetime import datetime, timedelta
|
| 11 |
|
|
|
|
| 12 |
from airflow.operators.python import PythonOperator
|
| 13 |
|
| 14 |
+
from airflow import DAG
|
| 15 |
+
|
| 16 |
default_args = {
|
| 17 |
"owner": "mediguard",
|
| 18 |
"retries": 2,
|
|
|
|
| 27 |
|
| 28 |
from src.services.embeddings.service import make_embedding_service
|
| 29 |
from src.services.indexing.service import IndexingService
|
| 30 |
+
from src.services.indexing.text_chunker import MedicalTextChunker
|
| 31 |
from src.services.opensearch.client import make_opensearch_client
|
| 32 |
from src.services.pdf_parser.service import make_pdf_parser_service
|
| 33 |
from src.settings import get_settings
|
| 34 |
|
| 35 |
settings = get_settings()
|
| 36 |
+
pdf_dir = Path(settings.pdf.pdf_directory)
|
| 37 |
|
| 38 |
parser = make_pdf_parser_service()
|
| 39 |
embedding_svc = make_embedding_service()
|
| 40 |
os_client = make_opensearch_client()
|
| 41 |
+
chunker = MedicalTextChunker(target_words=settings.chunking.chunk_size, overlap_words=settings.chunking.chunk_overlap, min_words=settings.chunking.min_chunk_size)
|
| 42 |
+
indexing_svc = IndexingService(chunker, embedding_svc, os_client)
|
| 43 |
|
| 44 |
docs = parser.parse_directory(pdf_dir)
|
| 45 |
indexed = 0
|
| 46 |
for doc in docs:
|
| 47 |
if doc.full_text and not doc.error:
|
| 48 |
+
indexing_svc.index_text(doc.full_text, title=doc.filename, source_file=doc.filename)
|
| 49 |
indexed += 1
|
| 50 |
|
| 51 |
print(f"Ingested {indexed}/{len(docs)} documents")
|
alembic/env.py
CHANGED
|
@@ -1,25 +1,23 @@
|
|
| 1 |
-
|
| 2 |
-
|
| 3 |
-
from sqlalchemy import engine_from_config
|
| 4 |
-
from sqlalchemy import pool, create_engine
|
| 5 |
-
|
| 6 |
-
from alembic import context
|
| 7 |
|
| 8 |
# ---------------------------------------------------------------------------
|
| 9 |
# MediGuard AI — Alembic env.py
|
| 10 |
# Pull DB URL from settings so we never hard-code credentials.
|
| 11 |
# ---------------------------------------------------------------------------
|
| 12 |
import sys
|
| 13 |
-
import
|
|
|
|
|
|
|
|
|
|
|
|
|
| 14 |
|
| 15 |
# Make sure the project root is on sys.path
|
| 16 |
sys.path.insert(0, os.path.dirname(os.path.dirname(__file__)))
|
| 17 |
|
| 18 |
-
from src.settings import get_settings # noqa: E402
|
| 19 |
-
from src.database import Base # noqa: E402
|
| 20 |
-
|
| 21 |
# Import all models so Alembic's autogenerate can see them
|
| 22 |
-
import src.models.analysis # noqa: F401
|
|
|
|
|
|
|
| 23 |
|
| 24 |
# this is the Alembic Config object, which provides
|
| 25 |
# access to the values within the .ini file in use.
|
|
|
|
| 1 |
+
import os
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2 |
|
| 3 |
# ---------------------------------------------------------------------------
|
| 4 |
# MediGuard AI — Alembic env.py
|
| 5 |
# Pull DB URL from settings so we never hard-code credentials.
|
| 6 |
# ---------------------------------------------------------------------------
|
| 7 |
import sys
|
| 8 |
+
from logging.config import fileConfig
|
| 9 |
+
|
| 10 |
+
from sqlalchemy import engine_from_config, pool
|
| 11 |
+
|
| 12 |
+
from alembic import context
|
| 13 |
|
| 14 |
# Make sure the project root is on sys.path
|
| 15 |
sys.path.insert(0, os.path.dirname(os.path.dirname(__file__)))
|
| 16 |
|
|
|
|
|
|
|
|
|
|
| 17 |
# Import all models so Alembic's autogenerate can see them
|
| 18 |
+
import src.models.analysis # noqa: F401
|
| 19 |
+
from src.database import Base
|
| 20 |
+
from src.settings import get_settings
|
| 21 |
|
| 22 |
# this is the Alembic Config object, which provides
|
| 23 |
# access to the values within the .ini file in use.
|
alembic/versions/001_initial.py
ADDED
|
@@ -0,0 +1,81 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
"""initial_tables
|
| 2 |
+
|
| 3 |
+
Revision ID: 001
|
| 4 |
+
Revises:
|
| 5 |
+
Create Date: 2026-02-24 20:58:00.000000
|
| 6 |
+
|
| 7 |
+
"""
|
| 8 |
+
import sqlalchemy as sa
|
| 9 |
+
|
| 10 |
+
from alembic import op
|
| 11 |
+
|
| 12 |
+
# revision identifiers, used by Alembic.
|
| 13 |
+
revision = '001'
|
| 14 |
+
down_revision = None
|
| 15 |
+
branch_labels = None
|
| 16 |
+
depends_on = None
|
| 17 |
+
|
| 18 |
+
|
| 19 |
+
def upgrade() -> None:
|
| 20 |
+
op.create_table(
|
| 21 |
+
'patient_analyses',
|
| 22 |
+
sa.Column('id', sa.String(length=36), nullable=False),
|
| 23 |
+
sa.Column('request_id', sa.String(length=64), nullable=False),
|
| 24 |
+
sa.Column('biomarkers', sa.JSON(), nullable=False),
|
| 25 |
+
sa.Column('patient_context', sa.JSON(), nullable=True),
|
| 26 |
+
sa.Column('predicted_disease', sa.String(length=128), nullable=False),
|
| 27 |
+
sa.Column('confidence', sa.Float(), nullable=False),
|
| 28 |
+
sa.Column('probabilities', sa.JSON(), nullable=True),
|
| 29 |
+
sa.Column('analysis_result', sa.JSON(), nullable=True),
|
| 30 |
+
sa.Column('safety_alerts', sa.JSON(), nullable=True),
|
| 31 |
+
sa.Column('sop_version', sa.String(length=64), nullable=True),
|
| 32 |
+
sa.Column('processing_time_ms', sa.Float(), nullable=False),
|
| 33 |
+
sa.Column('model_provider', sa.String(length=32), nullable=True),
|
| 34 |
+
sa.Column('created_at', sa.DateTime(timezone=True), server_default=sa.text('now()'), nullable=False),
|
| 35 |
+
sa.PrimaryKeyConstraint('id')
|
| 36 |
+
)
|
| 37 |
+
op.create_index(op.f('ix_patient_analyses_request_id'), 'patient_analyses', ['request_id'], unique=True)
|
| 38 |
+
|
| 39 |
+
op.create_table(
|
| 40 |
+
'medical_documents',
|
| 41 |
+
sa.Column('id', sa.String(length=36), nullable=False),
|
| 42 |
+
sa.Column('title', sa.String(length=512), nullable=False),
|
| 43 |
+
sa.Column('source', sa.String(length=512), nullable=False),
|
| 44 |
+
sa.Column('source_type', sa.String(length=32), nullable=False),
|
| 45 |
+
sa.Column('authors', sa.Text(), nullable=True),
|
| 46 |
+
sa.Column('abstract', sa.Text(), nullable=True),
|
| 47 |
+
sa.Column('content_hash', sa.String(length=64), nullable=True),
|
| 48 |
+
sa.Column('page_count', sa.Integer(), nullable=True),
|
| 49 |
+
sa.Column('chunk_count', sa.Integer(), nullable=True),
|
| 50 |
+
sa.Column('parse_status', sa.String(length=32), nullable=False),
|
| 51 |
+
sa.Column('metadata_json', sa.JSON(), nullable=True),
|
| 52 |
+
sa.Column('created_at', sa.DateTime(timezone=True), server_default=sa.text('now()'), nullable=False),
|
| 53 |
+
sa.Column('indexed_at', sa.DateTime(timezone=True), nullable=True),
|
| 54 |
+
sa.PrimaryKeyConstraint('id'),
|
| 55 |
+
sa.UniqueConstraint('content_hash')
|
| 56 |
+
)
|
| 57 |
+
op.create_index(op.f('ix_medical_documents_title'), 'medical_documents', ['title'], unique=False)
|
| 58 |
+
|
| 59 |
+
op.create_table(
|
| 60 |
+
'sop_versions',
|
| 61 |
+
sa.Column('id', sa.String(length=36), nullable=False),
|
| 62 |
+
sa.Column('version_tag', sa.String(length=64), nullable=False),
|
| 63 |
+
sa.Column('parameters', sa.JSON(), nullable=False),
|
| 64 |
+
sa.Column('evaluation_scores', sa.JSON(), nullable=True),
|
| 65 |
+
sa.Column('parent_version', sa.String(length=64), nullable=True),
|
| 66 |
+
sa.Column('is_active', sa.Boolean(), nullable=False),
|
| 67 |
+
sa.Column('created_at', sa.DateTime(timezone=True), server_default=sa.text('now()'), nullable=False),
|
| 68 |
+
sa.PrimaryKeyConstraint('id')
|
| 69 |
+
)
|
| 70 |
+
op.create_index(op.f('ix_sop_versions_version_tag'), 'sop_versions', ['version_tag'], unique=True)
|
| 71 |
+
|
| 72 |
+
|
| 73 |
+
def downgrade() -> None:
|
| 74 |
+
op.drop_index(op.f('ix_sop_versions_version_tag'), table_name='sop_versions')
|
| 75 |
+
op.drop_table('sop_versions')
|
| 76 |
+
|
| 77 |
+
op.drop_index(op.f('ix_medical_documents_title'), table_name='medical_documents')
|
| 78 |
+
op.drop_table('medical_documents')
|
| 79 |
+
|
| 80 |
+
op.drop_index(op.f('ix_patient_analyses_request_id'), table_name='patient_analyses')
|
| 81 |
+
op.drop_table('patient_analyses')
|
api/app/main.py
CHANGED
|
@@ -3,22 +3,19 @@ RagBot FastAPI Main Application
|
|
| 3 |
Medical biomarker analysis API
|
| 4 |
"""
|
| 5 |
|
| 6 |
-
import os
|
| 7 |
-
import sys
|
| 8 |
import logging
|
| 9 |
-
|
| 10 |
from contextlib import asynccontextmanager
|
| 11 |
|
| 12 |
from fastapi import FastAPI, Request, status
|
|
|
|
| 13 |
from fastapi.middleware.cors import CORSMiddleware
|
| 14 |
from fastapi.responses import JSONResponse
|
| 15 |
-
from fastapi.exceptions import RequestValidationError
|
| 16 |
|
| 17 |
from app import __version__
|
| 18 |
-
from app.routes import
|
| 19 |
from app.services.ragbot import get_ragbot_service
|
| 20 |
|
| 21 |
-
|
| 22 |
# Configure logging
|
| 23 |
logging.basicConfig(
|
| 24 |
level=logging.INFO,
|
|
@@ -40,7 +37,7 @@ async def lifespan(app: FastAPI):
|
|
| 40 |
logger.info("=" * 70)
|
| 41 |
logger.info("Starting RagBot API Server")
|
| 42 |
logger.info("=" * 70)
|
| 43 |
-
|
| 44 |
# Startup: Initialize RagBot service
|
| 45 |
try:
|
| 46 |
ragbot_service = get_ragbot_service()
|
|
@@ -49,12 +46,12 @@ async def lifespan(app: FastAPI):
|
|
| 49 |
except Exception as e:
|
| 50 |
logger.error(f"Failed to initialize RagBot service: {e}")
|
| 51 |
logger.warning("API will start but health checks will fail")
|
| 52 |
-
|
| 53 |
logger.info("API server ready to accept requests")
|
| 54 |
logger.info("=" * 70)
|
| 55 |
-
|
| 56 |
yield # Server runs here
|
| 57 |
-
|
| 58 |
# Shutdown
|
| 59 |
logger.info("Shutting down RagBot API Server")
|
| 60 |
|
|
@@ -178,14 +175,14 @@ async def api_v1_info():
|
|
| 178 |
|
| 179 |
if __name__ == "__main__":
|
| 180 |
import uvicorn
|
| 181 |
-
|
| 182 |
# Get configuration from environment
|
| 183 |
host = os.getenv("API_HOST", "0.0.0.0")
|
| 184 |
port = int(os.getenv("API_PORT", "8000"))
|
| 185 |
reload = os.getenv("API_RELOAD", "false").lower() == "true"
|
| 186 |
-
|
| 187 |
logger.info(f"Starting server on {host}:{port}")
|
| 188 |
-
|
| 189 |
uvicorn.run(
|
| 190 |
"app.main:app",
|
| 191 |
host=host,
|
|
|
|
| 3 |
Medical biomarker analysis API
|
| 4 |
"""
|
| 5 |
|
|
|
|
|
|
|
| 6 |
import logging
|
| 7 |
+
import os
|
| 8 |
from contextlib import asynccontextmanager
|
| 9 |
|
| 10 |
from fastapi import FastAPI, Request, status
|
| 11 |
+
from fastapi.exceptions import RequestValidationError
|
| 12 |
from fastapi.middleware.cors import CORSMiddleware
|
| 13 |
from fastapi.responses import JSONResponse
|
|
|
|
| 14 |
|
| 15 |
from app import __version__
|
| 16 |
+
from app.routes import analyze, biomarkers, health
|
| 17 |
from app.services.ragbot import get_ragbot_service
|
| 18 |
|
|
|
|
| 19 |
# Configure logging
|
| 20 |
logging.basicConfig(
|
| 21 |
level=logging.INFO,
|
|
|
|
| 37 |
logger.info("=" * 70)
|
| 38 |
logger.info("Starting RagBot API Server")
|
| 39 |
logger.info("=" * 70)
|
| 40 |
+
|
| 41 |
# Startup: Initialize RagBot service
|
| 42 |
try:
|
| 43 |
ragbot_service = get_ragbot_service()
|
|
|
|
| 46 |
except Exception as e:
|
| 47 |
logger.error(f"Failed to initialize RagBot service: {e}")
|
| 48 |
logger.warning("API will start but health checks will fail")
|
| 49 |
+
|
| 50 |
logger.info("API server ready to accept requests")
|
| 51 |
logger.info("=" * 70)
|
| 52 |
+
|
| 53 |
yield # Server runs here
|
| 54 |
+
|
| 55 |
# Shutdown
|
| 56 |
logger.info("Shutting down RagBot API Server")
|
| 57 |
|
|
|
|
| 175 |
|
| 176 |
if __name__ == "__main__":
|
| 177 |
import uvicorn
|
| 178 |
+
|
| 179 |
# Get configuration from environment
|
| 180 |
host = os.getenv("API_HOST", "0.0.0.0")
|
| 181 |
port = int(os.getenv("API_PORT", "8000"))
|
| 182 |
reload = os.getenv("API_RELOAD", "false").lower() == "true"
|
| 183 |
+
|
| 184 |
logger.info(f"Starting server on {host}:{port}")
|
| 185 |
+
|
| 186 |
uvicorn.run(
|
| 187 |
"app.main:app",
|
| 188 |
host=host,
|
api/app/routes/analyze.py
CHANGED
|
@@ -4,19 +4,13 @@ Natural language and structured biomarker analysis
|
|
| 4 |
"""
|
| 5 |
|
| 6 |
import os
|
| 7 |
-
|
| 8 |
from fastapi import APIRouter, HTTPException, status
|
| 9 |
|
| 10 |
-
from app.models.schemas import
|
| 11 |
-
NaturalAnalysisRequest,
|
| 12 |
-
StructuredAnalysisRequest,
|
| 13 |
-
AnalysisResponse,
|
| 14 |
-
ErrorResponse
|
| 15 |
-
)
|
| 16 |
from app.services.extraction import extract_biomarkers, predict_disease_simple
|
| 17 |
from app.services.ragbot import get_ragbot_service
|
| 18 |
|
| 19 |
-
|
| 20 |
router = APIRouter(prefix="/api/v1", tags=["analysis"])
|
| 21 |
|
| 22 |
|
|
@@ -45,23 +39,23 @@ async def analyze_natural(request: NaturalAnalysisRequest):
|
|
| 45 |
|
| 46 |
Returns full detailed analysis with all agent outputs, citations, recommendations.
|
| 47 |
"""
|
| 48 |
-
|
| 49 |
# Get services
|
| 50 |
ragbot_service = get_ragbot_service()
|
| 51 |
-
|
| 52 |
if not ragbot_service.is_ready():
|
| 53 |
raise HTTPException(
|
| 54 |
status_code=status.HTTP_503_SERVICE_UNAVAILABLE,
|
| 55 |
detail="RagBot service not initialized. Please try again in a moment."
|
| 56 |
)
|
| 57 |
-
|
| 58 |
# Extract biomarkers from natural language
|
| 59 |
ollama_base_url = os.getenv("OLLAMA_BASE_URL", "http://localhost:11434")
|
| 60 |
biomarkers, extracted_context, error = extract_biomarkers(
|
| 61 |
request.message,
|
| 62 |
ollama_base_url=ollama_base_url
|
| 63 |
)
|
| 64 |
-
|
| 65 |
if error:
|
| 66 |
raise HTTPException(
|
| 67 |
status_code=status.HTTP_400_BAD_REQUEST,
|
|
@@ -72,7 +66,7 @@ async def analyze_natural(request: NaturalAnalysisRequest):
|
|
| 72 |
"suggestion": "Try: 'My glucose is 140 and HbA1c is 7.5'"
|
| 73 |
}
|
| 74 |
)
|
| 75 |
-
|
| 76 |
if not biomarkers:
|
| 77 |
raise HTTPException(
|
| 78 |
status_code=status.HTTP_400_BAD_REQUEST,
|
|
@@ -83,14 +77,14 @@ async def analyze_natural(request: NaturalAnalysisRequest):
|
|
| 83 |
"suggestion": "Include specific biomarker values like 'glucose is 140'"
|
| 84 |
}
|
| 85 |
)
|
| 86 |
-
|
| 87 |
# Merge extracted context with request context
|
| 88 |
patient_context = request.patient_context.model_dump() if request.patient_context else {}
|
| 89 |
patient_context.update(extracted_context)
|
| 90 |
-
|
| 91 |
# Predict disease (simple rule-based for now)
|
| 92 |
model_prediction = predict_disease_simple(biomarkers)
|
| 93 |
-
|
| 94 |
try:
|
| 95 |
# Run full analysis
|
| 96 |
response = ragbot_service.analyze(
|
|
@@ -99,15 +93,15 @@ async def analyze_natural(request: NaturalAnalysisRequest):
|
|
| 99 |
model_prediction=model_prediction,
|
| 100 |
extracted_biomarkers=biomarkers # Keep original extraction
|
| 101 |
)
|
| 102 |
-
|
| 103 |
return response
|
| 104 |
-
|
| 105 |
except Exception as e:
|
| 106 |
raise HTTPException(
|
| 107 |
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
|
| 108 |
detail={
|
| 109 |
"error_code": "ANALYSIS_FAILED",
|
| 110 |
-
"message": f"Analysis workflow failed: {
|
| 111 |
"biomarkers_received": biomarkers
|
| 112 |
}
|
| 113 |
)
|
|
@@ -145,16 +139,16 @@ async def analyze_structured(request: StructuredAnalysisRequest):
|
|
| 145 |
Use this endpoint when you already have structured biomarker data.
|
| 146 |
Returns full detailed analysis with all agent outputs, citations, recommendations.
|
| 147 |
"""
|
| 148 |
-
|
| 149 |
# Get services
|
| 150 |
ragbot_service = get_ragbot_service()
|
| 151 |
-
|
| 152 |
if not ragbot_service.is_ready():
|
| 153 |
raise HTTPException(
|
| 154 |
status_code=status.HTTP_503_SERVICE_UNAVAILABLE,
|
| 155 |
detail="RagBot service not initialized. Please try again in a moment."
|
| 156 |
)
|
| 157 |
-
|
| 158 |
# Validate biomarkers
|
| 159 |
if not request.biomarkers:
|
| 160 |
raise HTTPException(
|
|
@@ -165,13 +159,13 @@ async def analyze_structured(request: StructuredAnalysisRequest):
|
|
| 165 |
"suggestion": "Provide at least one biomarker with a numeric value"
|
| 166 |
}
|
| 167 |
)
|
| 168 |
-
|
| 169 |
# Patient context
|
| 170 |
patient_context = request.patient_context.model_dump() if request.patient_context else {}
|
| 171 |
-
|
| 172 |
# Predict disease
|
| 173 |
model_prediction = predict_disease_simple(request.biomarkers)
|
| 174 |
-
|
| 175 |
try:
|
| 176 |
# Run full analysis
|
| 177 |
response = ragbot_service.analyze(
|
|
@@ -180,15 +174,15 @@ async def analyze_structured(request: StructuredAnalysisRequest):
|
|
| 180 |
model_prediction=model_prediction,
|
| 181 |
extracted_biomarkers=None # No extraction for structured input
|
| 182 |
)
|
| 183 |
-
|
| 184 |
return response
|
| 185 |
-
|
| 186 |
except Exception as e:
|
| 187 |
raise HTTPException(
|
| 188 |
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
|
| 189 |
detail={
|
| 190 |
"error_code": "ANALYSIS_FAILED",
|
| 191 |
-
"message": f"Analysis workflow failed: {
|
| 192 |
"biomarkers_received": request.biomarkers
|
| 193 |
}
|
| 194 |
)
|
|
@@ -211,16 +205,16 @@ async def get_example():
|
|
| 211 |
|
| 212 |
Same as CLI chatbot 'example' command.
|
| 213 |
"""
|
| 214 |
-
|
| 215 |
# Get services
|
| 216 |
ragbot_service = get_ragbot_service()
|
| 217 |
-
|
| 218 |
if not ragbot_service.is_ready():
|
| 219 |
raise HTTPException(
|
| 220 |
status_code=status.HTTP_503_SERVICE_UNAVAILABLE,
|
| 221 |
detail="RagBot service not initialized. Please try again in a moment."
|
| 222 |
)
|
| 223 |
-
|
| 224 |
# Example biomarkers (Type 2 Diabetes patient)
|
| 225 |
biomarkers = {
|
| 226 |
"Glucose": 185.0,
|
|
@@ -235,14 +229,14 @@ async def get_example():
|
|
| 235 |
"Systolic Blood Pressure": 142.0,
|
| 236 |
"Diastolic Blood Pressure": 88.0
|
| 237 |
}
|
| 238 |
-
|
| 239 |
patient_context = {
|
| 240 |
"age": 52,
|
| 241 |
"gender": "male",
|
| 242 |
"bmi": 31.2,
|
| 243 |
"patient_id": "EXAMPLE-001"
|
| 244 |
}
|
| 245 |
-
|
| 246 |
model_prediction = {
|
| 247 |
"disease": "Diabetes",
|
| 248 |
"confidence": 0.87,
|
|
@@ -254,7 +248,7 @@ async def get_example():
|
|
| 254 |
"Thrombocytopenia": 0.01
|
| 255 |
}
|
| 256 |
}
|
| 257 |
-
|
| 258 |
try:
|
| 259 |
# Run analysis
|
| 260 |
response = ragbot_service.analyze(
|
|
@@ -263,14 +257,14 @@ async def get_example():
|
|
| 263 |
model_prediction=model_prediction,
|
| 264 |
extracted_biomarkers=None
|
| 265 |
)
|
| 266 |
-
|
| 267 |
return response
|
| 268 |
-
|
| 269 |
except Exception as e:
|
| 270 |
raise HTTPException(
|
| 271 |
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
|
| 272 |
detail={
|
| 273 |
"error_code": "EXAMPLE_FAILED",
|
| 274 |
-
"message": f"Example analysis failed: {
|
| 275 |
}
|
| 276 |
)
|
|
|
|
| 4 |
"""
|
| 5 |
|
| 6 |
import os
|
| 7 |
+
|
| 8 |
from fastapi import APIRouter, HTTPException, status
|
| 9 |
|
| 10 |
+
from app.models.schemas import AnalysisResponse, NaturalAnalysisRequest, StructuredAnalysisRequest
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 11 |
from app.services.extraction import extract_biomarkers, predict_disease_simple
|
| 12 |
from app.services.ragbot import get_ragbot_service
|
| 13 |
|
|
|
|
| 14 |
router = APIRouter(prefix="/api/v1", tags=["analysis"])
|
| 15 |
|
| 16 |
|
|
|
|
| 39 |
|
| 40 |
Returns full detailed analysis with all agent outputs, citations, recommendations.
|
| 41 |
"""
|
| 42 |
+
|
| 43 |
# Get services
|
| 44 |
ragbot_service = get_ragbot_service()
|
| 45 |
+
|
| 46 |
if not ragbot_service.is_ready():
|
| 47 |
raise HTTPException(
|
| 48 |
status_code=status.HTTP_503_SERVICE_UNAVAILABLE,
|
| 49 |
detail="RagBot service not initialized. Please try again in a moment."
|
| 50 |
)
|
| 51 |
+
|
| 52 |
# Extract biomarkers from natural language
|
| 53 |
ollama_base_url = os.getenv("OLLAMA_BASE_URL", "http://localhost:11434")
|
| 54 |
biomarkers, extracted_context, error = extract_biomarkers(
|
| 55 |
request.message,
|
| 56 |
ollama_base_url=ollama_base_url
|
| 57 |
)
|
| 58 |
+
|
| 59 |
if error:
|
| 60 |
raise HTTPException(
|
| 61 |
status_code=status.HTTP_400_BAD_REQUEST,
|
|
|
|
| 66 |
"suggestion": "Try: 'My glucose is 140 and HbA1c is 7.5'"
|
| 67 |
}
|
| 68 |
)
|
| 69 |
+
|
| 70 |
if not biomarkers:
|
| 71 |
raise HTTPException(
|
| 72 |
status_code=status.HTTP_400_BAD_REQUEST,
|
|
|
|
| 77 |
"suggestion": "Include specific biomarker values like 'glucose is 140'"
|
| 78 |
}
|
| 79 |
)
|
| 80 |
+
|
| 81 |
# Merge extracted context with request context
|
| 82 |
patient_context = request.patient_context.model_dump() if request.patient_context else {}
|
| 83 |
patient_context.update(extracted_context)
|
| 84 |
+
|
| 85 |
# Predict disease (simple rule-based for now)
|
| 86 |
model_prediction = predict_disease_simple(biomarkers)
|
| 87 |
+
|
| 88 |
try:
|
| 89 |
# Run full analysis
|
| 90 |
response = ragbot_service.analyze(
|
|
|
|
| 93 |
model_prediction=model_prediction,
|
| 94 |
extracted_biomarkers=biomarkers # Keep original extraction
|
| 95 |
)
|
| 96 |
+
|
| 97 |
return response
|
| 98 |
+
|
| 99 |
except Exception as e:
|
| 100 |
raise HTTPException(
|
| 101 |
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
|
| 102 |
detail={
|
| 103 |
"error_code": "ANALYSIS_FAILED",
|
| 104 |
+
"message": f"Analysis workflow failed: {e!s}",
|
| 105 |
"biomarkers_received": biomarkers
|
| 106 |
}
|
| 107 |
)
|
|
|
|
| 139 |
Use this endpoint when you already have structured biomarker data.
|
| 140 |
Returns full detailed analysis with all agent outputs, citations, recommendations.
|
| 141 |
"""
|
| 142 |
+
|
| 143 |
# Get services
|
| 144 |
ragbot_service = get_ragbot_service()
|
| 145 |
+
|
| 146 |
if not ragbot_service.is_ready():
|
| 147 |
raise HTTPException(
|
| 148 |
status_code=status.HTTP_503_SERVICE_UNAVAILABLE,
|
| 149 |
detail="RagBot service not initialized. Please try again in a moment."
|
| 150 |
)
|
| 151 |
+
|
| 152 |
# Validate biomarkers
|
| 153 |
if not request.biomarkers:
|
| 154 |
raise HTTPException(
|
|
|
|
| 159 |
"suggestion": "Provide at least one biomarker with a numeric value"
|
| 160 |
}
|
| 161 |
)
|
| 162 |
+
|
| 163 |
# Patient context
|
| 164 |
patient_context = request.patient_context.model_dump() if request.patient_context else {}
|
| 165 |
+
|
| 166 |
# Predict disease
|
| 167 |
model_prediction = predict_disease_simple(request.biomarkers)
|
| 168 |
+
|
| 169 |
try:
|
| 170 |
# Run full analysis
|
| 171 |
response = ragbot_service.analyze(
|
|
|
|
| 174 |
model_prediction=model_prediction,
|
| 175 |
extracted_biomarkers=None # No extraction for structured input
|
| 176 |
)
|
| 177 |
+
|
| 178 |
return response
|
| 179 |
+
|
| 180 |
except Exception as e:
|
| 181 |
raise HTTPException(
|
| 182 |
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
|
| 183 |
detail={
|
| 184 |
"error_code": "ANALYSIS_FAILED",
|
| 185 |
+
"message": f"Analysis workflow failed: {e!s}",
|
| 186 |
"biomarkers_received": request.biomarkers
|
| 187 |
}
|
| 188 |
)
|
|
|
|
| 205 |
|
| 206 |
Same as CLI chatbot 'example' command.
|
| 207 |
"""
|
| 208 |
+
|
| 209 |
# Get services
|
| 210 |
ragbot_service = get_ragbot_service()
|
| 211 |
+
|
| 212 |
if not ragbot_service.is_ready():
|
| 213 |
raise HTTPException(
|
| 214 |
status_code=status.HTTP_503_SERVICE_UNAVAILABLE,
|
| 215 |
detail="RagBot service not initialized. Please try again in a moment."
|
| 216 |
)
|
| 217 |
+
|
| 218 |
# Example biomarkers (Type 2 Diabetes patient)
|
| 219 |
biomarkers = {
|
| 220 |
"Glucose": 185.0,
|
|
|
|
| 229 |
"Systolic Blood Pressure": 142.0,
|
| 230 |
"Diastolic Blood Pressure": 88.0
|
| 231 |
}
|
| 232 |
+
|
| 233 |
patient_context = {
|
| 234 |
"age": 52,
|
| 235 |
"gender": "male",
|
| 236 |
"bmi": 31.2,
|
| 237 |
"patient_id": "EXAMPLE-001"
|
| 238 |
}
|
| 239 |
+
|
| 240 |
model_prediction = {
|
| 241 |
"disease": "Diabetes",
|
| 242 |
"confidence": 0.87,
|
|
|
|
| 248 |
"Thrombocytopenia": 0.01
|
| 249 |
}
|
| 250 |
}
|
| 251 |
+
|
| 252 |
try:
|
| 253 |
# Run analysis
|
| 254 |
response = ragbot_service.analyze(
|
|
|
|
| 257 |
model_prediction=model_prediction,
|
| 258 |
extracted_biomarkers=None
|
| 259 |
)
|
| 260 |
+
|
| 261 |
return response
|
| 262 |
+
|
| 263 |
except Exception as e:
|
| 264 |
raise HTTPException(
|
| 265 |
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
|
| 266 |
detail={
|
| 267 |
"error_code": "EXAMPLE_FAILED",
|
| 268 |
+
"message": f"Example analysis failed: {e!s}"
|
| 269 |
}
|
| 270 |
)
|
api/app/routes/biomarkers.py
CHANGED
|
@@ -3,13 +3,12 @@ Biomarkers List Endpoint
|
|
| 3 |
"""
|
| 4 |
|
| 5 |
import json
|
| 6 |
-
import sys
|
| 7 |
-
from pathlib import Path
|
| 8 |
from datetime import datetime
|
| 9 |
-
from
|
| 10 |
|
| 11 |
-
from
|
| 12 |
|
|
|
|
| 13 |
|
| 14 |
router = APIRouter(prefix="/api/v1", tags=["biomarkers"])
|
| 15 |
|
|
@@ -30,22 +29,22 @@ async def list_biomarkers():
|
|
| 30 |
- Understanding what biomarkers can be analyzed
|
| 31 |
- Getting reference ranges for display
|
| 32 |
"""
|
| 33 |
-
|
| 34 |
try:
|
| 35 |
# Load biomarker references
|
| 36 |
config_path = Path(__file__).parent.parent.parent.parent / "config" / "biomarker_references.json"
|
| 37 |
-
|
| 38 |
-
with open(config_path
|
| 39 |
config_data = json.load(f)
|
| 40 |
-
|
| 41 |
biomarkers_data = config_data.get("biomarkers", {})
|
| 42 |
-
|
| 43 |
biomarkers_list = []
|
| 44 |
-
|
| 45 |
for name, info in biomarkers_data.items():
|
| 46 |
# Parse reference range
|
| 47 |
normal_range_data = info.get("normal_range", {})
|
| 48 |
-
|
| 49 |
if "male" in normal_range_data or "female" in normal_range_data:
|
| 50 |
# Gender-specific ranges
|
| 51 |
reference_range = BiomarkerReferenceRange(
|
|
@@ -62,7 +61,7 @@ async def list_biomarkers():
|
|
| 62 |
male=None,
|
| 63 |
female=None
|
| 64 |
)
|
| 65 |
-
|
| 66 |
biomarker_info = BiomarkerInfo(
|
| 67 |
name=name,
|
| 68 |
unit=info.get("unit", ""),
|
|
@@ -73,23 +72,23 @@ async def list_biomarkers():
|
|
| 73 |
description=info.get("description", ""),
|
| 74 |
clinical_significance=info.get("clinical_significance", {})
|
| 75 |
)
|
| 76 |
-
|
| 77 |
biomarkers_list.append(biomarker_info)
|
| 78 |
-
|
| 79 |
return BiomarkersListResponse(
|
| 80 |
biomarkers=biomarkers_list,
|
| 81 |
total_count=len(biomarkers_list),
|
| 82 |
timestamp=datetime.now().isoformat()
|
| 83 |
)
|
| 84 |
-
|
| 85 |
except FileNotFoundError:
|
| 86 |
raise HTTPException(
|
| 87 |
status_code=500,
|
| 88 |
detail="Biomarker configuration file not found"
|
| 89 |
)
|
| 90 |
-
|
| 91 |
except Exception as e:
|
| 92 |
raise HTTPException(
|
| 93 |
status_code=500,
|
| 94 |
-
detail=f"Failed to load biomarkers: {
|
| 95 |
)
|
|
|
|
| 3 |
"""
|
| 4 |
|
| 5 |
import json
|
|
|
|
|
|
|
| 6 |
from datetime import datetime
|
| 7 |
+
from pathlib import Path
|
| 8 |
|
| 9 |
+
from fastapi import APIRouter, HTTPException
|
| 10 |
|
| 11 |
+
from app.models.schemas import BiomarkerInfo, BiomarkerReferenceRange, BiomarkersListResponse
|
| 12 |
|
| 13 |
router = APIRouter(prefix="/api/v1", tags=["biomarkers"])
|
| 14 |
|
|
|
|
| 29 |
- Understanding what biomarkers can be analyzed
|
| 30 |
- Getting reference ranges for display
|
| 31 |
"""
|
| 32 |
+
|
| 33 |
try:
|
| 34 |
# Load biomarker references
|
| 35 |
config_path = Path(__file__).parent.parent.parent.parent / "config" / "biomarker_references.json"
|
| 36 |
+
|
| 37 |
+
with open(config_path) as f:
|
| 38 |
config_data = json.load(f)
|
| 39 |
+
|
| 40 |
biomarkers_data = config_data.get("biomarkers", {})
|
| 41 |
+
|
| 42 |
biomarkers_list = []
|
| 43 |
+
|
| 44 |
for name, info in biomarkers_data.items():
|
| 45 |
# Parse reference range
|
| 46 |
normal_range_data = info.get("normal_range", {})
|
| 47 |
+
|
| 48 |
if "male" in normal_range_data or "female" in normal_range_data:
|
| 49 |
# Gender-specific ranges
|
| 50 |
reference_range = BiomarkerReferenceRange(
|
|
|
|
| 61 |
male=None,
|
| 62 |
female=None
|
| 63 |
)
|
| 64 |
+
|
| 65 |
biomarker_info = BiomarkerInfo(
|
| 66 |
name=name,
|
| 67 |
unit=info.get("unit", ""),
|
|
|
|
| 72 |
description=info.get("description", ""),
|
| 73 |
clinical_significance=info.get("clinical_significance", {})
|
| 74 |
)
|
| 75 |
+
|
| 76 |
biomarkers_list.append(biomarker_info)
|
| 77 |
+
|
| 78 |
return BiomarkersListResponse(
|
| 79 |
biomarkers=biomarkers_list,
|
| 80 |
total_count=len(biomarkers_list),
|
| 81 |
timestamp=datetime.now().isoformat()
|
| 82 |
)
|
| 83 |
+
|
| 84 |
except FileNotFoundError:
|
| 85 |
raise HTTPException(
|
| 86 |
status_code=500,
|
| 87 |
detail="Biomarker configuration file not found"
|
| 88 |
)
|
| 89 |
+
|
| 90 |
except Exception as e:
|
| 91 |
raise HTTPException(
|
| 92 |
status_code=500,
|
| 93 |
+
detail=f"Failed to load biomarkers: {e!s}"
|
| 94 |
)
|
api/app/routes/health.py
CHANGED
|
@@ -2,16 +2,13 @@
|
|
| 2 |
Health Check Endpoint
|
| 3 |
"""
|
| 4 |
|
| 5 |
-
import os
|
| 6 |
-
import sys
|
| 7 |
-
from pathlib import Path
|
| 8 |
from datetime import datetime
|
| 9 |
-
from fastapi import APIRouter, HTTPException
|
| 10 |
|
|
|
|
|
|
|
|
|
|
| 11 |
from app.models.schemas import HealthResponse
|
| 12 |
from app.services.ragbot import get_ragbot_service
|
| 13 |
-
from app import __version__
|
| 14 |
-
|
| 15 |
|
| 16 |
router = APIRouter(prefix="/api/v1", tags=["health"])
|
| 17 |
|
|
@@ -30,16 +27,16 @@ async def health_check():
|
|
| 30 |
Returns health status with component details.
|
| 31 |
"""
|
| 32 |
ragbot_service = get_ragbot_service()
|
| 33 |
-
|
| 34 |
# Check LLM API connection
|
| 35 |
llm_status = "disconnected"
|
| 36 |
available_models = []
|
| 37 |
-
|
| 38 |
try:
|
| 39 |
-
from src.llm_config import
|
| 40 |
-
|
| 41 |
test_llm = get_chat_model(temperature=0.0)
|
| 42 |
-
|
| 43 |
# Try a simple test
|
| 44 |
response = test_llm.invoke("Say OK")
|
| 45 |
if response:
|
|
@@ -50,13 +47,13 @@ async def health_check():
|
|
| 50 |
available_models = ["gemini-2.0-flash (Google)"]
|
| 51 |
else:
|
| 52 |
available_models = ["llama3.1:8b (Ollama)"]
|
| 53 |
-
|
| 54 |
except Exception as e:
|
| 55 |
llm_status = f"error: {str(e)[:100]}"
|
| 56 |
-
|
| 57 |
# Check vector store
|
| 58 |
vector_store_loaded = ragbot_service.is_ready()
|
| 59 |
-
|
| 60 |
# Determine overall status
|
| 61 |
if llm_status == "connected" and vector_store_loaded:
|
| 62 |
overall_status = "healthy"
|
|
@@ -64,7 +61,7 @@ async def health_check():
|
|
| 64 |
overall_status = "degraded"
|
| 65 |
else:
|
| 66 |
overall_status = "unhealthy"
|
| 67 |
-
|
| 68 |
return HealthResponse(
|
| 69 |
status=overall_status,
|
| 70 |
timestamp=datetime.now().isoformat(),
|
|
|
|
| 2 |
Health Check Endpoint
|
| 3 |
"""
|
| 4 |
|
|
|
|
|
|
|
|
|
|
| 5 |
from datetime import datetime
|
|
|
|
| 6 |
|
| 7 |
+
from fastapi import APIRouter
|
| 8 |
+
|
| 9 |
+
from app import __version__
|
| 10 |
from app.models.schemas import HealthResponse
|
| 11 |
from app.services.ragbot import get_ragbot_service
|
|
|
|
|
|
|
| 12 |
|
| 13 |
router = APIRouter(prefix="/api/v1", tags=["health"])
|
| 14 |
|
|
|
|
| 27 |
Returns health status with component details.
|
| 28 |
"""
|
| 29 |
ragbot_service = get_ragbot_service()
|
| 30 |
+
|
| 31 |
# Check LLM API connection
|
| 32 |
llm_status = "disconnected"
|
| 33 |
available_models = []
|
| 34 |
+
|
| 35 |
try:
|
| 36 |
+
from src.llm_config import DEFAULT_LLM_PROVIDER, get_chat_model
|
| 37 |
+
|
| 38 |
test_llm = get_chat_model(temperature=0.0)
|
| 39 |
+
|
| 40 |
# Try a simple test
|
| 41 |
response = test_llm.invoke("Say OK")
|
| 42 |
if response:
|
|
|
|
| 47 |
available_models = ["gemini-2.0-flash (Google)"]
|
| 48 |
else:
|
| 49 |
available_models = ["llama3.1:8b (Ollama)"]
|
| 50 |
+
|
| 51 |
except Exception as e:
|
| 52 |
llm_status = f"error: {str(e)[:100]}"
|
| 53 |
+
|
| 54 |
# Check vector store
|
| 55 |
vector_store_loaded = ragbot_service.is_ready()
|
| 56 |
+
|
| 57 |
# Determine overall status
|
| 58 |
if llm_status == "connected" and vector_store_loaded:
|
| 59 |
overall_status = "healthy"
|
|
|
|
| 61 |
overall_status = "degraded"
|
| 62 |
else:
|
| 63 |
overall_status = "unhealthy"
|
| 64 |
+
|
| 65 |
return HealthResponse(
|
| 66 |
status=overall_status,
|
| 67 |
timestamp=datetime.now().isoformat(),
|
api/app/services/extraction.py
CHANGED
|
@@ -6,7 +6,7 @@ Extracts biomarker values from natural language text using LLM
|
|
| 6 |
import json
|
| 7 |
import sys
|
| 8 |
from pathlib import Path
|
| 9 |
-
from typing import
|
| 10 |
|
| 11 |
# Ensure project root is in path for src imports
|
| 12 |
_project_root = str(Path(__file__).parent.parent.parent.parent)
|
|
@@ -14,10 +14,10 @@ if _project_root not in sys.path:
|
|
| 14 |
sys.path.insert(0, _project_root)
|
| 15 |
|
| 16 |
from langchain_core.prompts import ChatPromptTemplate
|
|
|
|
| 17 |
from src.biomarker_normalization import normalize_biomarker_name
|
| 18 |
from src.llm_config import get_chat_model
|
| 19 |
|
| 20 |
-
|
| 21 |
# ============================================================================
|
| 22 |
# EXTRACTION PROMPT
|
| 23 |
# ============================================================================
|
|
@@ -54,7 +54,7 @@ If you cannot find any biomarkers, return {{"biomarkers": {{}}, "patient_context
|
|
| 54 |
# EXTRACTION HELPERS
|
| 55 |
# ============================================================================
|
| 56 |
|
| 57 |
-
def _parse_llm_json(content: str) ->
|
| 58 |
"""Parse JSON payload from LLM output with fallback recovery."""
|
| 59 |
text = content.strip()
|
| 60 |
|
|
@@ -78,9 +78,9 @@ def _parse_llm_json(content: str) -> Dict[str, Any]:
|
|
| 78 |
# ============================================================================
|
| 79 |
|
| 80 |
def extract_biomarkers(
|
| 81 |
-
user_message: str,
|
| 82 |
ollama_base_url: str = None # Kept for backward compatibility, ignored
|
| 83 |
-
) ->
|
| 84 |
"""
|
| 85 |
Extract biomarker values from natural language using LLM.
|
| 86 |
|
|
@@ -102,18 +102,18 @@ def extract_biomarkers(
|
|
| 102 |
try:
|
| 103 |
# Initialize LLM (uses Groq/Gemini by default - FREE)
|
| 104 |
llm = get_chat_model(temperature=0.0)
|
| 105 |
-
|
| 106 |
prompt = ChatPromptTemplate.from_template(BIOMARKER_EXTRACTION_PROMPT)
|
| 107 |
chain = prompt | llm
|
| 108 |
-
|
| 109 |
# Invoke LLM
|
| 110 |
response = chain.invoke({"user_message": user_message})
|
| 111 |
content = response.content.strip()
|
| 112 |
-
|
| 113 |
extracted = _parse_llm_json(content)
|
| 114 |
biomarkers = extracted.get("biomarkers", {})
|
| 115 |
patient_context = extracted.get("patient_context", {})
|
| 116 |
-
|
| 117 |
# Normalize biomarker names and convert to float
|
| 118 |
normalized = {}
|
| 119 |
for key, value in biomarkers.items():
|
|
@@ -123,27 +123,27 @@ def extract_biomarkers(
|
|
| 123 |
except (ValueError, TypeError):
|
| 124 |
# Skip invalid values
|
| 125 |
continue
|
| 126 |
-
|
| 127 |
# Clean up patient context (remove null values)
|
| 128 |
patient_context = {k: v for k, v in patient_context.items() if v is not None}
|
| 129 |
-
|
| 130 |
if not normalized:
|
| 131 |
return {}, patient_context, "No biomarkers found in the input"
|
| 132 |
-
|
| 133 |
return normalized, patient_context, ""
|
| 134 |
-
|
| 135 |
except json.JSONDecodeError as e:
|
| 136 |
-
return {}, {}, f"Failed to parse LLM response as JSON: {
|
| 137 |
-
|
| 138 |
except Exception as e:
|
| 139 |
-
return {}, {}, f"Extraction failed: {
|
| 140 |
|
| 141 |
|
| 142 |
# ============================================================================
|
| 143 |
# SIMPLE DISEASE PREDICTION (Fallback)
|
| 144 |
# ============================================================================
|
| 145 |
|
| 146 |
-
def predict_disease_simple(biomarkers:
|
| 147 |
"""
|
| 148 |
Simple rule-based disease prediction based on key biomarkers.
|
| 149 |
Used as a fallback when no ML model is available.
|
|
@@ -161,15 +161,15 @@ def predict_disease_simple(biomarkers: Dict[str, float]) -> Dict[str, Any]:
|
|
| 161 |
"Thrombocytopenia": 0.0,
|
| 162 |
"Thalassemia": 0.0
|
| 163 |
}
|
| 164 |
-
|
| 165 |
# Helper: check both abbreviated and normalized biomarker names
|
| 166 |
# Returns None when biomarker is not present (avoids false triggers)
|
| 167 |
def _get(name, *alt_names):
|
| 168 |
-
val = biomarkers.get(name
|
| 169 |
if val is not None:
|
| 170 |
return val
|
| 171 |
for alt in alt_names:
|
| 172 |
-
val = biomarkers.get(alt
|
| 173 |
if val is not None:
|
| 174 |
return val
|
| 175 |
return None
|
|
@@ -183,7 +183,7 @@ def predict_disease_simple(biomarkers: Dict[str, float]) -> Dict[str, Any]:
|
|
| 183 |
scores["Diabetes"] += 0.2
|
| 184 |
if hba1c is not None and hba1c >= 6.5:
|
| 185 |
scores["Diabetes"] += 0.5
|
| 186 |
-
|
| 187 |
# Anemia indicators
|
| 188 |
hemoglobin = _get("Hemoglobin")
|
| 189 |
mcv = _get("Mean Corpuscular Volume", "MCV")
|
|
@@ -193,7 +193,7 @@ def predict_disease_simple(biomarkers: Dict[str, float]) -> Dict[str, Any]:
|
|
| 193 |
scores["Anemia"] += 0.2
|
| 194 |
if mcv is not None and mcv < 80:
|
| 195 |
scores["Anemia"] += 0.2
|
| 196 |
-
|
| 197 |
# Heart disease indicators
|
| 198 |
cholesterol = _get("Cholesterol")
|
| 199 |
troponin = _get("Troponin")
|
|
@@ -204,32 +204,32 @@ def predict_disease_simple(biomarkers: Dict[str, float]) -> Dict[str, Any]:
|
|
| 204 |
scores["Heart Disease"] += 0.6
|
| 205 |
if ldl is not None and ldl > 190:
|
| 206 |
scores["Heart Disease"] += 0.2
|
| 207 |
-
|
| 208 |
# Thrombocytopenia indicators
|
| 209 |
platelets = _get("Platelets")
|
| 210 |
if platelets is not None and platelets < 150000:
|
| 211 |
scores["Thrombocytopenia"] += 0.6
|
| 212 |
if platelets is not None and platelets < 50000:
|
| 213 |
scores["Thrombocytopenia"] += 0.3
|
| 214 |
-
|
| 215 |
# Thalassemia indicators (simplified)
|
| 216 |
if mcv is not None and hemoglobin is not None and mcv < 80 and hemoglobin < 12.0:
|
| 217 |
scores["Thalassemia"] += 0.4
|
| 218 |
-
|
| 219 |
# Find top prediction
|
| 220 |
top_disease = max(scores, key=scores.get)
|
| 221 |
confidence = min(scores[top_disease], 1.0) # Cap at 1.0 for Pydantic validation
|
| 222 |
|
| 223 |
if confidence == 0.0:
|
| 224 |
top_disease = "Undetermined"
|
| 225 |
-
|
| 226 |
# Normalize probabilities to sum to 1.0
|
| 227 |
total = sum(scores.values())
|
| 228 |
if total > 0:
|
| 229 |
probabilities = {k: v / total for k, v in scores.items()}
|
| 230 |
else:
|
| 231 |
probabilities = {k: 1.0 / len(scores) for k in scores}
|
| 232 |
-
|
| 233 |
return {
|
| 234 |
"disease": top_disease,
|
| 235 |
"confidence": confidence,
|
|
|
|
| 6 |
import json
|
| 7 |
import sys
|
| 8 |
from pathlib import Path
|
| 9 |
+
from typing import Any
|
| 10 |
|
| 11 |
# Ensure project root is in path for src imports
|
| 12 |
_project_root = str(Path(__file__).parent.parent.parent.parent)
|
|
|
|
| 14 |
sys.path.insert(0, _project_root)
|
| 15 |
|
| 16 |
from langchain_core.prompts import ChatPromptTemplate
|
| 17 |
+
|
| 18 |
from src.biomarker_normalization import normalize_biomarker_name
|
| 19 |
from src.llm_config import get_chat_model
|
| 20 |
|
|
|
|
| 21 |
# ============================================================================
|
| 22 |
# EXTRACTION PROMPT
|
| 23 |
# ============================================================================
|
|
|
|
| 54 |
# EXTRACTION HELPERS
|
| 55 |
# ============================================================================
|
| 56 |
|
| 57 |
+
def _parse_llm_json(content: str) -> dict[str, Any]:
|
| 58 |
"""Parse JSON payload from LLM output with fallback recovery."""
|
| 59 |
text = content.strip()
|
| 60 |
|
|
|
|
| 78 |
# ============================================================================
|
| 79 |
|
| 80 |
def extract_biomarkers(
|
| 81 |
+
user_message: str,
|
| 82 |
ollama_base_url: str = None # Kept for backward compatibility, ignored
|
| 83 |
+
) -> tuple[dict[str, float], dict[str, Any], str]:
|
| 84 |
"""
|
| 85 |
Extract biomarker values from natural language using LLM.
|
| 86 |
|
|
|
|
| 102 |
try:
|
| 103 |
# Initialize LLM (uses Groq/Gemini by default - FREE)
|
| 104 |
llm = get_chat_model(temperature=0.0)
|
| 105 |
+
|
| 106 |
prompt = ChatPromptTemplate.from_template(BIOMARKER_EXTRACTION_PROMPT)
|
| 107 |
chain = prompt | llm
|
| 108 |
+
|
| 109 |
# Invoke LLM
|
| 110 |
response = chain.invoke({"user_message": user_message})
|
| 111 |
content = response.content.strip()
|
| 112 |
+
|
| 113 |
extracted = _parse_llm_json(content)
|
| 114 |
biomarkers = extracted.get("biomarkers", {})
|
| 115 |
patient_context = extracted.get("patient_context", {})
|
| 116 |
+
|
| 117 |
# Normalize biomarker names and convert to float
|
| 118 |
normalized = {}
|
| 119 |
for key, value in biomarkers.items():
|
|
|
|
| 123 |
except (ValueError, TypeError):
|
| 124 |
# Skip invalid values
|
| 125 |
continue
|
| 126 |
+
|
| 127 |
# Clean up patient context (remove null values)
|
| 128 |
patient_context = {k: v for k, v in patient_context.items() if v is not None}
|
| 129 |
+
|
| 130 |
if not normalized:
|
| 131 |
return {}, patient_context, "No biomarkers found in the input"
|
| 132 |
+
|
| 133 |
return normalized, patient_context, ""
|
| 134 |
+
|
| 135 |
except json.JSONDecodeError as e:
|
| 136 |
+
return {}, {}, f"Failed to parse LLM response as JSON: {e!s}"
|
| 137 |
+
|
| 138 |
except Exception as e:
|
| 139 |
+
return {}, {}, f"Extraction failed: {e!s}"
|
| 140 |
|
| 141 |
|
| 142 |
# ============================================================================
|
| 143 |
# SIMPLE DISEASE PREDICTION (Fallback)
|
| 144 |
# ============================================================================
|
| 145 |
|
| 146 |
+
def predict_disease_simple(biomarkers: dict[str, float]) -> dict[str, Any]:
|
| 147 |
"""
|
| 148 |
Simple rule-based disease prediction based on key biomarkers.
|
| 149 |
Used as a fallback when no ML model is available.
|
|
|
|
| 161 |
"Thrombocytopenia": 0.0,
|
| 162 |
"Thalassemia": 0.0
|
| 163 |
}
|
| 164 |
+
|
| 165 |
# Helper: check both abbreviated and normalized biomarker names
|
| 166 |
# Returns None when biomarker is not present (avoids false triggers)
|
| 167 |
def _get(name, *alt_names):
|
| 168 |
+
val = biomarkers.get(name)
|
| 169 |
if val is not None:
|
| 170 |
return val
|
| 171 |
for alt in alt_names:
|
| 172 |
+
val = biomarkers.get(alt)
|
| 173 |
if val is not None:
|
| 174 |
return val
|
| 175 |
return None
|
|
|
|
| 183 |
scores["Diabetes"] += 0.2
|
| 184 |
if hba1c is not None and hba1c >= 6.5:
|
| 185 |
scores["Diabetes"] += 0.5
|
| 186 |
+
|
| 187 |
# Anemia indicators
|
| 188 |
hemoglobin = _get("Hemoglobin")
|
| 189 |
mcv = _get("Mean Corpuscular Volume", "MCV")
|
|
|
|
| 193 |
scores["Anemia"] += 0.2
|
| 194 |
if mcv is not None and mcv < 80:
|
| 195 |
scores["Anemia"] += 0.2
|
| 196 |
+
|
| 197 |
# Heart disease indicators
|
| 198 |
cholesterol = _get("Cholesterol")
|
| 199 |
troponin = _get("Troponin")
|
|
|
|
| 204 |
scores["Heart Disease"] += 0.6
|
| 205 |
if ldl is not None and ldl > 190:
|
| 206 |
scores["Heart Disease"] += 0.2
|
| 207 |
+
|
| 208 |
# Thrombocytopenia indicators
|
| 209 |
platelets = _get("Platelets")
|
| 210 |
if platelets is not None and platelets < 150000:
|
| 211 |
scores["Thrombocytopenia"] += 0.6
|
| 212 |
if platelets is not None and platelets < 50000:
|
| 213 |
scores["Thrombocytopenia"] += 0.3
|
| 214 |
+
|
| 215 |
# Thalassemia indicators (simplified)
|
| 216 |
if mcv is not None and hemoglobin is not None and mcv < 80 and hemoglobin < 12.0:
|
| 217 |
scores["Thalassemia"] += 0.4
|
| 218 |
+
|
| 219 |
# Find top prediction
|
| 220 |
top_disease = max(scores, key=scores.get)
|
| 221 |
confidence = min(scores[top_disease], 1.0) # Cap at 1.0 for Pydantic validation
|
| 222 |
|
| 223 |
if confidence == 0.0:
|
| 224 |
top_disease = "Undetermined"
|
| 225 |
+
|
| 226 |
# Normalize probabilities to sum to 1.0
|
| 227 |
total = sum(scores.values())
|
| 228 |
if total > 0:
|
| 229 |
probabilities = {k: v / total for k, v in scores.items()}
|
| 230 |
else:
|
| 231 |
probabilities = {k: 1.0 / len(scores) for k in scores}
|
| 232 |
+
|
| 233 |
return {
|
| 234 |
"disease": top_disease,
|
| 235 |
"confidence": confidence,
|
api/app/services/ragbot.py
CHANGED
|
@@ -6,22 +6,29 @@ Wraps the RagBot workflow and formats comprehensive responses
|
|
| 6 |
import sys
|
| 7 |
import time
|
| 8 |
import uuid
|
| 9 |
-
from pathlib import Path
|
| 10 |
-
from typing import Dict, Any
|
| 11 |
from datetime import datetime
|
|
|
|
|
|
|
| 12 |
|
| 13 |
# Ensure project root is in path for src imports
|
| 14 |
_project_root = str(Path(__file__).parent.parent.parent.parent)
|
| 15 |
if _project_root not in sys.path:
|
| 16 |
sys.path.insert(0, _project_root)
|
| 17 |
|
| 18 |
-
from src.workflow import create_guild
|
| 19 |
-
from src.state import PatientInput
|
| 20 |
from app.models.schemas import (
|
| 21 |
-
|
| 22 |
-
|
| 23 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 24 |
)
|
|
|
|
|
|
|
| 25 |
|
| 26 |
|
| 27 |
class RagBotService:
|
|
@@ -29,65 +36,65 @@ class RagBotService:
|
|
| 29 |
Service class to manage RagBot workflow lifecycle.
|
| 30 |
Initializes once, then handles multiple analysis requests.
|
| 31 |
"""
|
| 32 |
-
|
| 33 |
def __init__(self):
|
| 34 |
"""Initialize the workflow (loads vector store, models, etc.)"""
|
| 35 |
self.guild = None
|
| 36 |
self.initialized = False
|
| 37 |
self.init_time = None
|
| 38 |
-
|
| 39 |
def initialize(self):
|
| 40 |
"""Initialize the Clinical Insight Guild (expensive operation)"""
|
| 41 |
if self.initialized:
|
| 42 |
return
|
| 43 |
-
|
| 44 |
print("INFO: Initializing RagBot workflow...")
|
| 45 |
start_time = time.time()
|
| 46 |
-
|
| 47 |
import os
|
| 48 |
-
|
| 49 |
try:
|
| 50 |
# Set working directory via environment so vector store paths resolve
|
| 51 |
# without a process-global os.chdir() (which is thread-unsafe).
|
| 52 |
ragbot_root = Path(__file__).parent.parent.parent.parent
|
| 53 |
os.environ["RAGBOT_ROOT"] = str(ragbot_root)
|
| 54 |
print(f"INFO: Project root: {ragbot_root}")
|
| 55 |
-
|
| 56 |
# Temporarily chdir only during initialization (single-threaded at startup)
|
| 57 |
original_dir = os.getcwd()
|
| 58 |
os.chdir(ragbot_root)
|
| 59 |
-
|
| 60 |
self.guild = create_guild()
|
| 61 |
self.initialized = True
|
| 62 |
self.init_time = datetime.now()
|
| 63 |
-
|
| 64 |
elapsed = (time.time() - start_time) * 1000
|
| 65 |
print(f"OK: RagBot initialized successfully ({elapsed:.0f}ms)")
|
| 66 |
-
|
| 67 |
except Exception as e:
|
| 68 |
print(f"ERROR: Failed to initialize RagBot: {e}")
|
| 69 |
raise
|
| 70 |
-
|
| 71 |
finally:
|
| 72 |
# Restore original directory
|
| 73 |
os.chdir(original_dir)
|
| 74 |
-
|
| 75 |
def get_uptime_seconds(self) -> float:
|
| 76 |
"""Get API uptime in seconds"""
|
| 77 |
if not self.init_time:
|
| 78 |
return 0.0
|
| 79 |
return (datetime.now() - self.init_time).total_seconds()
|
| 80 |
-
|
| 81 |
def is_ready(self) -> bool:
|
| 82 |
"""Check if service is ready to handle requests"""
|
| 83 |
return self.initialized and self.guild is not None
|
| 84 |
-
|
| 85 |
def analyze(
|
| 86 |
self,
|
| 87 |
-
biomarkers:
|
| 88 |
-
patient_context:
|
| 89 |
-
model_prediction:
|
| 90 |
-
extracted_biomarkers:
|
| 91 |
) -> AnalysisResponse:
|
| 92 |
"""
|
| 93 |
Run complete analysis workflow and format full detailed response.
|
|
@@ -103,10 +110,10 @@ class RagBotService:
|
|
| 103 |
"""
|
| 104 |
if not self.is_ready():
|
| 105 |
raise RuntimeError("RagBot service not initialized. Call initialize() first.")
|
| 106 |
-
|
| 107 |
request_id = f"req_{uuid.uuid4().hex[:12]}"
|
| 108 |
start_time = time.time()
|
| 109 |
-
|
| 110 |
try:
|
| 111 |
# Create PatientInput
|
| 112 |
patient_input = PatientInput(
|
|
@@ -114,13 +121,13 @@ class RagBotService:
|
|
| 114 |
model_prediction=model_prediction,
|
| 115 |
patient_context=patient_context
|
| 116 |
)
|
| 117 |
-
|
| 118 |
# Run workflow
|
| 119 |
workflow_result = self.guild.run(patient_input)
|
| 120 |
-
|
| 121 |
# Calculate processing time
|
| 122 |
processing_time_ms = (time.time() - start_time) * 1000
|
| 123 |
-
|
| 124 |
# Format response
|
| 125 |
response = self._format_response(
|
| 126 |
request_id=request_id,
|
|
@@ -131,21 +138,21 @@ class RagBotService:
|
|
| 131 |
model_prediction=model_prediction,
|
| 132 |
processing_time_ms=processing_time_ms
|
| 133 |
)
|
| 134 |
-
|
| 135 |
return response
|
| 136 |
-
|
| 137 |
except Exception as e:
|
| 138 |
# Re-raise with context
|
| 139 |
-
raise RuntimeError(f"Analysis failed during workflow execution: {
|
| 140 |
-
|
| 141 |
def _format_response(
|
| 142 |
self,
|
| 143 |
request_id: str,
|
| 144 |
-
workflow_result:
|
| 145 |
-
input_biomarkers:
|
| 146 |
-
extracted_biomarkers:
|
| 147 |
-
patient_context:
|
| 148 |
-
model_prediction:
|
| 149 |
processing_time_ms: float
|
| 150 |
) -> AnalysisResponse:
|
| 151 |
"""
|
|
@@ -159,17 +166,17 @@ class RagBotService:
|
|
| 159 |
- safety_alerts: list of SafetyAlert objects
|
| 160 |
- sop_version, processing_timestamp, etc.
|
| 161 |
"""
|
| 162 |
-
|
| 163 |
# The synthesizer output is nested inside final_response
|
| 164 |
final_response = workflow_result.get("final_response", {}) or {}
|
| 165 |
-
|
| 166 |
# Extract main prediction
|
| 167 |
prediction = Prediction(
|
| 168 |
disease=model_prediction["disease"],
|
| 169 |
confidence=model_prediction["confidence"],
|
| 170 |
probabilities=model_prediction.get("probabilities", {})
|
| 171 |
)
|
| 172 |
-
|
| 173 |
# Biomarker flags: prefer state-level data (BiomarkerFlag objects from validator),
|
| 174 |
# fall back to synthesizer output
|
| 175 |
state_flags = workflow_result.get("biomarker_flags", [])
|
|
@@ -188,7 +195,7 @@ class RagBotService:
|
|
| 188 |
BiomarkerFlag(**flag) if isinstance(flag, dict) else BiomarkerFlag(**flag.model_dump())
|
| 189 |
for flag in biomarker_flags_source
|
| 190 |
]
|
| 191 |
-
|
| 192 |
# Safety alerts: prefer state-level data, fall back to synthesizer
|
| 193 |
state_alerts = workflow_result.get("safety_alerts", [])
|
| 194 |
if state_alerts:
|
|
@@ -206,7 +213,7 @@ class RagBotService:
|
|
| 206 |
SafetyAlert(**alert) if isinstance(alert, dict) else SafetyAlert(**alert.model_dump())
|
| 207 |
for alert in safety_alerts_source
|
| 208 |
]
|
| 209 |
-
|
| 210 |
# Extract key drivers from synthesizer output
|
| 211 |
key_drivers_data = final_response.get("key_drivers", [])
|
| 212 |
if not key_drivers_data:
|
|
@@ -215,7 +222,7 @@ class RagBotService:
|
|
| 215 |
for driver in key_drivers_data:
|
| 216 |
if isinstance(driver, dict):
|
| 217 |
key_drivers.append(KeyDriver(**driver))
|
| 218 |
-
|
| 219 |
# Disease explanation from synthesizer
|
| 220 |
disease_exp_data = final_response.get("disease_explanation", {})
|
| 221 |
if not disease_exp_data:
|
|
@@ -225,7 +232,7 @@ class RagBotService:
|
|
| 225 |
citations=disease_exp_data.get("citations", []),
|
| 226 |
retrieved_chunks=disease_exp_data.get("retrieved_chunks")
|
| 227 |
)
|
| 228 |
-
|
| 229 |
# Recommendations from synthesizer
|
| 230 |
recs_data = final_response.get("recommendations", {})
|
| 231 |
if not recs_data:
|
|
@@ -238,7 +245,7 @@ class RagBotService:
|
|
| 238 |
monitoring=recs_data.get("monitoring", []),
|
| 239 |
follow_up=recs_data.get("follow_up")
|
| 240 |
)
|
| 241 |
-
|
| 242 |
# Confidence assessment from synthesizer
|
| 243 |
conf_data = final_response.get("confidence_assessment", {})
|
| 244 |
if not conf_data:
|
|
@@ -249,12 +256,12 @@ class RagBotService:
|
|
| 249 |
limitations=conf_data.get("limitations", []),
|
| 250 |
reasoning=conf_data.get("reasoning")
|
| 251 |
)
|
| 252 |
-
|
| 253 |
# Alternative diagnoses
|
| 254 |
alternative_diagnoses = final_response.get("alternative_diagnoses")
|
| 255 |
if alternative_diagnoses is None:
|
| 256 |
alternative_diagnoses = final_response.get("analysis", {}).get("alternative_diagnoses")
|
| 257 |
-
|
| 258 |
# Assemble complete analysis
|
| 259 |
analysis = Analysis(
|
| 260 |
biomarker_flags=biomarker_flags,
|
|
@@ -265,7 +272,7 @@ class RagBotService:
|
|
| 265 |
confidence_assessment=confidence_assessment,
|
| 266 |
alternative_diagnoses=alternative_diagnoses
|
| 267 |
)
|
| 268 |
-
|
| 269 |
# Agent outputs from state (these are src.state.AgentOutput objects)
|
| 270 |
agent_outputs_data = workflow_result.get("agent_outputs", [])
|
| 271 |
agent_outputs = []
|
|
@@ -274,7 +281,7 @@ class RagBotService:
|
|
| 274 |
agent_outputs.append(AgentOutput(**agent_out.model_dump()))
|
| 275 |
elif isinstance(agent_out, dict):
|
| 276 |
agent_outputs.append(AgentOutput(**agent_out))
|
| 277 |
-
|
| 278 |
# Workflow metadata
|
| 279 |
workflow_metadata = {
|
| 280 |
"sop_version": workflow_result.get("sop_version"),
|
|
@@ -282,12 +289,12 @@ class RagBotService:
|
|
| 282 |
"agents_executed": len(agent_outputs),
|
| 283 |
"workflow_success": True
|
| 284 |
}
|
| 285 |
-
|
| 286 |
# Conversational summary (if available)
|
| 287 |
conversational_summary = final_response.get("conversational_summary")
|
| 288 |
if not conversational_summary:
|
| 289 |
conversational_summary = final_response.get("patient_summary", {}).get("narrative")
|
| 290 |
-
|
| 291 |
# Generate conversational summary if not present
|
| 292 |
if not conversational_summary:
|
| 293 |
conversational_summary = self._generate_conversational_summary(
|
|
@@ -296,7 +303,7 @@ class RagBotService:
|
|
| 296 |
key_drivers=key_drivers,
|
| 297 |
recommendations=recommendations
|
| 298 |
)
|
| 299 |
-
|
| 300 |
# Assemble final response
|
| 301 |
response = AnalysisResponse(
|
| 302 |
status="success",
|
|
@@ -313,9 +320,9 @@ class RagBotService:
|
|
| 313 |
processing_time_ms=processing_time_ms,
|
| 314 |
sop_version=workflow_result.get("sop_version", "Baseline")
|
| 315 |
)
|
| 316 |
-
|
| 317 |
return response
|
| 318 |
-
|
| 319 |
def _generate_conversational_summary(
|
| 320 |
self,
|
| 321 |
prediction: Prediction,
|
|
@@ -324,37 +331,37 @@ class RagBotService:
|
|
| 324 |
recommendations: Recommendations
|
| 325 |
) -> str:
|
| 326 |
"""Generate a simple conversational summary"""
|
| 327 |
-
|
| 328 |
summary_parts = []
|
| 329 |
summary_parts.append("Hi there!\n")
|
| 330 |
summary_parts.append("Based on your biomarkers, I analyzed your results.\n")
|
| 331 |
-
|
| 332 |
# Prediction
|
| 333 |
summary_parts.append(f"\nPrimary Finding: {prediction.disease}")
|
| 334 |
summary_parts.append(f" Confidence: {prediction.confidence:.0%}\n")
|
| 335 |
-
|
| 336 |
# Safety alerts
|
| 337 |
if safety_alerts:
|
| 338 |
summary_parts.append("\nIMPORTANT SAFETY ALERTS:")
|
| 339 |
for alert in safety_alerts[:3]: # Top 3
|
| 340 |
summary_parts.append(f" - {alert.biomarker}: {alert.message}")
|
| 341 |
summary_parts.append(f" Action: {alert.action}")
|
| 342 |
-
|
| 343 |
# Key drivers
|
| 344 |
if key_drivers:
|
| 345 |
summary_parts.append("\nWhy this prediction?")
|
| 346 |
for driver in key_drivers[:3]: # Top 3
|
| 347 |
summary_parts.append(f" - {driver.biomarker} ({driver.value}): {driver.explanation[:100]}...")
|
| 348 |
-
|
| 349 |
# Recommendations
|
| 350 |
if recommendations.immediate_actions:
|
| 351 |
summary_parts.append("\nWhat You Should Do:")
|
| 352 |
for i, action in enumerate(recommendations.immediate_actions[:3], 1):
|
| 353 |
summary_parts.append(f" {i}. {action}")
|
| 354 |
-
|
| 355 |
summary_parts.append("\nImportant: This is an AI-assisted analysis, NOT medical advice.")
|
| 356 |
summary_parts.append(" Please consult a healthcare professional for proper diagnosis and treatment.")
|
| 357 |
-
|
| 358 |
return "\n".join(summary_parts)
|
| 359 |
|
| 360 |
|
|
|
|
| 6 |
import sys
|
| 7 |
import time
|
| 8 |
import uuid
|
|
|
|
|
|
|
| 9 |
from datetime import datetime
|
| 10 |
+
from pathlib import Path
|
| 11 |
+
from typing import Any
|
| 12 |
|
| 13 |
# Ensure project root is in path for src imports
|
| 14 |
_project_root = str(Path(__file__).parent.parent.parent.parent)
|
| 15 |
if _project_root not in sys.path:
|
| 16 |
sys.path.insert(0, _project_root)
|
| 17 |
|
|
|
|
|
|
|
| 18 |
from app.models.schemas import (
|
| 19 |
+
AgentOutput,
|
| 20 |
+
Analysis,
|
| 21 |
+
AnalysisResponse,
|
| 22 |
+
BiomarkerFlag,
|
| 23 |
+
ConfidenceAssessment,
|
| 24 |
+
DiseaseExplanation,
|
| 25 |
+
KeyDriver,
|
| 26 |
+
Prediction,
|
| 27 |
+
Recommendations,
|
| 28 |
+
SafetyAlert,
|
| 29 |
)
|
| 30 |
+
from src.state import PatientInput
|
| 31 |
+
from src.workflow import create_guild
|
| 32 |
|
| 33 |
|
| 34 |
class RagBotService:
|
|
|
|
| 36 |
Service class to manage RagBot workflow lifecycle.
|
| 37 |
Initializes once, then handles multiple analysis requests.
|
| 38 |
"""
|
| 39 |
+
|
| 40 |
def __init__(self):
|
| 41 |
"""Initialize the workflow (loads vector store, models, etc.)"""
|
| 42 |
self.guild = None
|
| 43 |
self.initialized = False
|
| 44 |
self.init_time = None
|
| 45 |
+
|
| 46 |
def initialize(self):
|
| 47 |
"""Initialize the Clinical Insight Guild (expensive operation)"""
|
| 48 |
if self.initialized:
|
| 49 |
return
|
| 50 |
+
|
| 51 |
print("INFO: Initializing RagBot workflow...")
|
| 52 |
start_time = time.time()
|
| 53 |
+
|
| 54 |
import os
|
| 55 |
+
|
| 56 |
try:
|
| 57 |
# Set working directory via environment so vector store paths resolve
|
| 58 |
# without a process-global os.chdir() (which is thread-unsafe).
|
| 59 |
ragbot_root = Path(__file__).parent.parent.parent.parent
|
| 60 |
os.environ["RAGBOT_ROOT"] = str(ragbot_root)
|
| 61 |
print(f"INFO: Project root: {ragbot_root}")
|
| 62 |
+
|
| 63 |
# Temporarily chdir only during initialization (single-threaded at startup)
|
| 64 |
original_dir = os.getcwd()
|
| 65 |
os.chdir(ragbot_root)
|
| 66 |
+
|
| 67 |
self.guild = create_guild()
|
| 68 |
self.initialized = True
|
| 69 |
self.init_time = datetime.now()
|
| 70 |
+
|
| 71 |
elapsed = (time.time() - start_time) * 1000
|
| 72 |
print(f"OK: RagBot initialized successfully ({elapsed:.0f}ms)")
|
| 73 |
+
|
| 74 |
except Exception as e:
|
| 75 |
print(f"ERROR: Failed to initialize RagBot: {e}")
|
| 76 |
raise
|
| 77 |
+
|
| 78 |
finally:
|
| 79 |
# Restore original directory
|
| 80 |
os.chdir(original_dir)
|
| 81 |
+
|
| 82 |
def get_uptime_seconds(self) -> float:
|
| 83 |
"""Get API uptime in seconds"""
|
| 84 |
if not self.init_time:
|
| 85 |
return 0.0
|
| 86 |
return (datetime.now() - self.init_time).total_seconds()
|
| 87 |
+
|
| 88 |
def is_ready(self) -> bool:
|
| 89 |
"""Check if service is ready to handle requests"""
|
| 90 |
return self.initialized and self.guild is not None
|
| 91 |
+
|
| 92 |
def analyze(
|
| 93 |
self,
|
| 94 |
+
biomarkers: dict[str, float],
|
| 95 |
+
patient_context: dict[str, Any],
|
| 96 |
+
model_prediction: dict[str, Any],
|
| 97 |
+
extracted_biomarkers: dict[str, float] = None
|
| 98 |
) -> AnalysisResponse:
|
| 99 |
"""
|
| 100 |
Run complete analysis workflow and format full detailed response.
|
|
|
|
| 110 |
"""
|
| 111 |
if not self.is_ready():
|
| 112 |
raise RuntimeError("RagBot service not initialized. Call initialize() first.")
|
| 113 |
+
|
| 114 |
request_id = f"req_{uuid.uuid4().hex[:12]}"
|
| 115 |
start_time = time.time()
|
| 116 |
+
|
| 117 |
try:
|
| 118 |
# Create PatientInput
|
| 119 |
patient_input = PatientInput(
|
|
|
|
| 121 |
model_prediction=model_prediction,
|
| 122 |
patient_context=patient_context
|
| 123 |
)
|
| 124 |
+
|
| 125 |
# Run workflow
|
| 126 |
workflow_result = self.guild.run(patient_input)
|
| 127 |
+
|
| 128 |
# Calculate processing time
|
| 129 |
processing_time_ms = (time.time() - start_time) * 1000
|
| 130 |
+
|
| 131 |
# Format response
|
| 132 |
response = self._format_response(
|
| 133 |
request_id=request_id,
|
|
|
|
| 138 |
model_prediction=model_prediction,
|
| 139 |
processing_time_ms=processing_time_ms
|
| 140 |
)
|
| 141 |
+
|
| 142 |
return response
|
| 143 |
+
|
| 144 |
except Exception as e:
|
| 145 |
# Re-raise with context
|
| 146 |
+
raise RuntimeError(f"Analysis failed during workflow execution: {e!s}") from e
|
| 147 |
+
|
| 148 |
def _format_response(
|
| 149 |
self,
|
| 150 |
request_id: str,
|
| 151 |
+
workflow_result: dict[str, Any],
|
| 152 |
+
input_biomarkers: dict[str, float],
|
| 153 |
+
extracted_biomarkers: dict[str, float],
|
| 154 |
+
patient_context: dict[str, Any],
|
| 155 |
+
model_prediction: dict[str, Any],
|
| 156 |
processing_time_ms: float
|
| 157 |
) -> AnalysisResponse:
|
| 158 |
"""
|
|
|
|
| 166 |
- safety_alerts: list of SafetyAlert objects
|
| 167 |
- sop_version, processing_timestamp, etc.
|
| 168 |
"""
|
| 169 |
+
|
| 170 |
# The synthesizer output is nested inside final_response
|
| 171 |
final_response = workflow_result.get("final_response", {}) or {}
|
| 172 |
+
|
| 173 |
# Extract main prediction
|
| 174 |
prediction = Prediction(
|
| 175 |
disease=model_prediction["disease"],
|
| 176 |
confidence=model_prediction["confidence"],
|
| 177 |
probabilities=model_prediction.get("probabilities", {})
|
| 178 |
)
|
| 179 |
+
|
| 180 |
# Biomarker flags: prefer state-level data (BiomarkerFlag objects from validator),
|
| 181 |
# fall back to synthesizer output
|
| 182 |
state_flags = workflow_result.get("biomarker_flags", [])
|
|
|
|
| 195 |
BiomarkerFlag(**flag) if isinstance(flag, dict) else BiomarkerFlag(**flag.model_dump())
|
| 196 |
for flag in biomarker_flags_source
|
| 197 |
]
|
| 198 |
+
|
| 199 |
# Safety alerts: prefer state-level data, fall back to synthesizer
|
| 200 |
state_alerts = workflow_result.get("safety_alerts", [])
|
| 201 |
if state_alerts:
|
|
|
|
| 213 |
SafetyAlert(**alert) if isinstance(alert, dict) else SafetyAlert(**alert.model_dump())
|
| 214 |
for alert in safety_alerts_source
|
| 215 |
]
|
| 216 |
+
|
| 217 |
# Extract key drivers from synthesizer output
|
| 218 |
key_drivers_data = final_response.get("key_drivers", [])
|
| 219 |
if not key_drivers_data:
|
|
|
|
| 222 |
for driver in key_drivers_data:
|
| 223 |
if isinstance(driver, dict):
|
| 224 |
key_drivers.append(KeyDriver(**driver))
|
| 225 |
+
|
| 226 |
# Disease explanation from synthesizer
|
| 227 |
disease_exp_data = final_response.get("disease_explanation", {})
|
| 228 |
if not disease_exp_data:
|
|
|
|
| 232 |
citations=disease_exp_data.get("citations", []),
|
| 233 |
retrieved_chunks=disease_exp_data.get("retrieved_chunks")
|
| 234 |
)
|
| 235 |
+
|
| 236 |
# Recommendations from synthesizer
|
| 237 |
recs_data = final_response.get("recommendations", {})
|
| 238 |
if not recs_data:
|
|
|
|
| 245 |
monitoring=recs_data.get("monitoring", []),
|
| 246 |
follow_up=recs_data.get("follow_up")
|
| 247 |
)
|
| 248 |
+
|
| 249 |
# Confidence assessment from synthesizer
|
| 250 |
conf_data = final_response.get("confidence_assessment", {})
|
| 251 |
if not conf_data:
|
|
|
|
| 256 |
limitations=conf_data.get("limitations", []),
|
| 257 |
reasoning=conf_data.get("reasoning")
|
| 258 |
)
|
| 259 |
+
|
| 260 |
# Alternative diagnoses
|
| 261 |
alternative_diagnoses = final_response.get("alternative_diagnoses")
|
| 262 |
if alternative_diagnoses is None:
|
| 263 |
alternative_diagnoses = final_response.get("analysis", {}).get("alternative_diagnoses")
|
| 264 |
+
|
| 265 |
# Assemble complete analysis
|
| 266 |
analysis = Analysis(
|
| 267 |
biomarker_flags=biomarker_flags,
|
|
|
|
| 272 |
confidence_assessment=confidence_assessment,
|
| 273 |
alternative_diagnoses=alternative_diagnoses
|
| 274 |
)
|
| 275 |
+
|
| 276 |
# Agent outputs from state (these are src.state.AgentOutput objects)
|
| 277 |
agent_outputs_data = workflow_result.get("agent_outputs", [])
|
| 278 |
agent_outputs = []
|
|
|
|
| 281 |
agent_outputs.append(AgentOutput(**agent_out.model_dump()))
|
| 282 |
elif isinstance(agent_out, dict):
|
| 283 |
agent_outputs.append(AgentOutput(**agent_out))
|
| 284 |
+
|
| 285 |
# Workflow metadata
|
| 286 |
workflow_metadata = {
|
| 287 |
"sop_version": workflow_result.get("sop_version"),
|
|
|
|
| 289 |
"agents_executed": len(agent_outputs),
|
| 290 |
"workflow_success": True
|
| 291 |
}
|
| 292 |
+
|
| 293 |
# Conversational summary (if available)
|
| 294 |
conversational_summary = final_response.get("conversational_summary")
|
| 295 |
if not conversational_summary:
|
| 296 |
conversational_summary = final_response.get("patient_summary", {}).get("narrative")
|
| 297 |
+
|
| 298 |
# Generate conversational summary if not present
|
| 299 |
if not conversational_summary:
|
| 300 |
conversational_summary = self._generate_conversational_summary(
|
|
|
|
| 303 |
key_drivers=key_drivers,
|
| 304 |
recommendations=recommendations
|
| 305 |
)
|
| 306 |
+
|
| 307 |
# Assemble final response
|
| 308 |
response = AnalysisResponse(
|
| 309 |
status="success",
|
|
|
|
| 320 |
processing_time_ms=processing_time_ms,
|
| 321 |
sop_version=workflow_result.get("sop_version", "Baseline")
|
| 322 |
)
|
| 323 |
+
|
| 324 |
return response
|
| 325 |
+
|
| 326 |
def _generate_conversational_summary(
|
| 327 |
self,
|
| 328 |
prediction: Prediction,
|
|
|
|
| 331 |
recommendations: Recommendations
|
| 332 |
) -> str:
|
| 333 |
"""Generate a simple conversational summary"""
|
| 334 |
+
|
| 335 |
summary_parts = []
|
| 336 |
summary_parts.append("Hi there!\n")
|
| 337 |
summary_parts.append("Based on your biomarkers, I analyzed your results.\n")
|
| 338 |
+
|
| 339 |
# Prediction
|
| 340 |
summary_parts.append(f"\nPrimary Finding: {prediction.disease}")
|
| 341 |
summary_parts.append(f" Confidence: {prediction.confidence:.0%}\n")
|
| 342 |
+
|
| 343 |
# Safety alerts
|
| 344 |
if safety_alerts:
|
| 345 |
summary_parts.append("\nIMPORTANT SAFETY ALERTS:")
|
| 346 |
for alert in safety_alerts[:3]: # Top 3
|
| 347 |
summary_parts.append(f" - {alert.biomarker}: {alert.message}")
|
| 348 |
summary_parts.append(f" Action: {alert.action}")
|
| 349 |
+
|
| 350 |
# Key drivers
|
| 351 |
if key_drivers:
|
| 352 |
summary_parts.append("\nWhy this prediction?")
|
| 353 |
for driver in key_drivers[:3]: # Top 3
|
| 354 |
summary_parts.append(f" - {driver.biomarker} ({driver.value}): {driver.explanation[:100]}...")
|
| 355 |
+
|
| 356 |
# Recommendations
|
| 357 |
if recommendations.immediate_actions:
|
| 358 |
summary_parts.append("\nWhat You Should Do:")
|
| 359 |
for i, action in enumerate(recommendations.immediate_actions[:3], 1):
|
| 360 |
summary_parts.append(f" {i}. {action}")
|
| 361 |
+
|
| 362 |
summary_parts.append("\nImportant: This is an AI-assisted analysis, NOT medical advice.")
|
| 363 |
summary_parts.append(" Please consult a healthcare professional for proper diagnosis and treatment.")
|
| 364 |
+
|
| 365 |
return "\n".join(summary_parts)
|
| 366 |
|
| 367 |
|
archive/evolution/__init__.py
CHANGED
|
@@ -4,32 +4,26 @@ Self-improvement system for SOP optimization
|
|
| 4 |
"""
|
| 5 |
|
| 6 |
from .director import (
|
| 7 |
-
SOPGenePool,
|
| 8 |
Diagnosis,
|
| 9 |
-
SOPMutation,
|
| 10 |
EvolvedSOPs,
|
|
|
|
|
|
|
| 11 |
performance_diagnostician,
|
|
|
|
| 12 |
sop_architect,
|
| 13 |
-
run_evolution_cycle
|
| 14 |
-
)
|
| 15 |
-
|
| 16 |
-
from .pareto import (
|
| 17 |
-
identify_pareto_front,
|
| 18 |
-
visualize_pareto_frontier,
|
| 19 |
-
print_pareto_summary,
|
| 20 |
-
analyze_improvements
|
| 21 |
)
|
|
|
|
| 22 |
|
| 23 |
__all__ = [
|
| 24 |
-
'SOPGenePool',
|
| 25 |
'Diagnosis',
|
| 26 |
-
'SOPMutation',
|
| 27 |
'EvolvedSOPs',
|
| 28 |
-
'
|
| 29 |
-
'
|
| 30 |
-
'
|
| 31 |
'identify_pareto_front',
|
| 32 |
-
'
|
| 33 |
'print_pareto_summary',
|
| 34 |
-
'
|
|
|
|
|
|
|
| 35 |
]
|
|
|
|
| 4 |
"""
|
| 5 |
|
| 6 |
from .director import (
|
|
|
|
| 7 |
Diagnosis,
|
|
|
|
| 8 |
EvolvedSOPs,
|
| 9 |
+
SOPGenePool,
|
| 10 |
+
SOPMutation,
|
| 11 |
performance_diagnostician,
|
| 12 |
+
run_evolution_cycle,
|
| 13 |
sop_architect,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 14 |
)
|
| 15 |
+
from .pareto import analyze_improvements, identify_pareto_front, print_pareto_summary, visualize_pareto_frontier
|
| 16 |
|
| 17 |
__all__ = [
|
|
|
|
| 18 |
'Diagnosis',
|
|
|
|
| 19 |
'EvolvedSOPs',
|
| 20 |
+
'SOPGenePool',
|
| 21 |
+
'SOPMutation',
|
| 22 |
+
'analyze_improvements',
|
| 23 |
'identify_pareto_front',
|
| 24 |
+
'performance_diagnostician',
|
| 25 |
'print_pareto_summary',
|
| 26 |
+
'run_evolution_cycle',
|
| 27 |
+
'sop_architect',
|
| 28 |
+
'visualize_pareto_frontier'
|
| 29 |
]
|
archive/evolution/director.py
CHANGED
|
@@ -3,27 +3,28 @@ MediGuard AI RAG-Helper - Evolution Engine
|
|
| 3 |
Outer Loop Director for SOP Evolution
|
| 4 |
"""
|
| 5 |
|
| 6 |
-
import
|
| 7 |
-
from typing import Any,
|
|
|
|
| 8 |
from pydantic import BaseModel, Field
|
| 9 |
-
|
| 10 |
from src.config import ExplanationSOP
|
| 11 |
from src.evaluation.evaluators import EvaluationResult
|
| 12 |
|
| 13 |
|
| 14 |
class SOPGenePool:
|
| 15 |
"""Manages version control for evolving SOPs"""
|
| 16 |
-
|
| 17 |
def __init__(self):
|
| 18 |
-
self.pool:
|
| 19 |
-
self.gene_pool:
|
| 20 |
self.version_counter = 0
|
| 21 |
-
|
| 22 |
def add(
|
| 23 |
self,
|
| 24 |
sop: ExplanationSOP,
|
| 25 |
evaluation: EvaluationResult,
|
| 26 |
-
parent_version:
|
| 27 |
description: str = ""
|
| 28 |
):
|
| 29 |
"""Add a new SOP to the gene pool"""
|
|
@@ -38,50 +39,50 @@ class SOPGenePool:
|
|
| 38 |
self.pool.append(entry)
|
| 39 |
self.gene_pool = self.pool # Keep in sync
|
| 40 |
print(f"✓ Added SOP v{self.version_counter} to gene pool: {description}")
|
| 41 |
-
|
| 42 |
-
def get_latest(self) ->
|
| 43 |
"""Get the most recent SOP"""
|
| 44 |
return self.pool[-1] if self.pool else None
|
| 45 |
-
|
| 46 |
-
def get_by_version(self, version: int) ->
|
| 47 |
"""Retrieve specific SOP version"""
|
| 48 |
for entry in self.pool:
|
| 49 |
if entry['version'] == version:
|
| 50 |
return entry
|
| 51 |
return None
|
| 52 |
-
|
| 53 |
-
def get_best_by_metric(self, metric: str) ->
|
| 54 |
"""Get SOP with highest score on specific metric"""
|
| 55 |
if not self.pool:
|
| 56 |
return None
|
| 57 |
-
|
| 58 |
best = max(
|
| 59 |
self.pool,
|
| 60 |
key=lambda x: getattr(x['evaluation'], metric).score
|
| 61 |
)
|
| 62 |
return best
|
| 63 |
-
|
| 64 |
def summary(self):
|
| 65 |
"""Print summary of all SOPs in pool"""
|
| 66 |
print("\n" + "=" * 80)
|
| 67 |
print("SOP GENE POOL SUMMARY")
|
| 68 |
print("=" * 80)
|
| 69 |
-
|
| 70 |
for entry in self.pool:
|
| 71 |
v = entry['version']
|
| 72 |
p = entry['parent']
|
| 73 |
desc = entry['description']
|
| 74 |
e = entry['evaluation']
|
| 75 |
-
|
| 76 |
parent_str = "(Baseline)" if p is None else f"(Child of v{p})"
|
| 77 |
-
|
| 78 |
print(f"\nSOP v{v} {parent_str}: {desc}")
|
| 79 |
print(f" Clinical Accuracy: {e.clinical_accuracy.score:.2f}")
|
| 80 |
print(f" Evidence Grounding: {e.evidence_grounding.score:.2f}")
|
| 81 |
print(f" Actionability: {e.actionability.score:.2f}")
|
| 82 |
print(f" Clarity: {e.clarity.score:.2f}")
|
| 83 |
print(f" Safety & Completeness: {e.safety_completeness.score:.2f}")
|
| 84 |
-
|
| 85 |
print("\n" + "=" * 80)
|
| 86 |
|
| 87 |
|
|
@@ -120,7 +121,7 @@ class SOPMutation(BaseModel):
|
|
| 120 |
|
| 121 |
class EvolvedSOPs(BaseModel):
|
| 122 |
"""Container for mutated SOPs from Architect"""
|
| 123 |
-
mutations:
|
| 124 |
|
| 125 |
|
| 126 |
def performance_diagnostician(evaluation: EvaluationResult) -> Diagnosis:
|
|
@@ -131,7 +132,7 @@ def performance_diagnostician(evaluation: EvaluationResult) -> Diagnosis:
|
|
| 131 |
print("\n" + "=" * 70)
|
| 132 |
print("EXECUTING: Performance Diagnostician")
|
| 133 |
print("=" * 70)
|
| 134 |
-
|
| 135 |
# Find lowest score programmatically (no LLM needed)
|
| 136 |
scores = {
|
| 137 |
'clinical_accuracy': evaluation.clinical_accuracy.score,
|
|
@@ -140,7 +141,7 @@ def performance_diagnostician(evaluation: EvaluationResult) -> Diagnosis:
|
|
| 140 |
'clarity': evaluation.clarity.score,
|
| 141 |
'safety_completeness': evaluation.safety_completeness.score
|
| 142 |
}
|
| 143 |
-
|
| 144 |
reasonings = {
|
| 145 |
'clinical_accuracy': evaluation.clinical_accuracy.reasoning,
|
| 146 |
'evidence_grounding': evaluation.evidence_grounding.reasoning,
|
|
@@ -148,11 +149,11 @@ def performance_diagnostician(evaluation: EvaluationResult) -> Diagnosis:
|
|
| 148 |
'clarity': evaluation.clarity.reasoning,
|
| 149 |
'safety_completeness': evaluation.safety_completeness.reasoning
|
| 150 |
}
|
| 151 |
-
|
| 152 |
primary_weakness = min(scores, key=scores.get)
|
| 153 |
weakness_score = scores[primary_weakness]
|
| 154 |
weakness_reasoning = reasonings[primary_weakness]
|
| 155 |
-
|
| 156 |
# Generate detailed root cause analysis
|
| 157 |
root_cause_map = {
|
| 158 |
'clinical_accuracy': f"Clinical accuracy score ({weakness_score:.2f}) indicates potential issues with medical interpretations. {weakness_reasoning[:200]}",
|
|
@@ -161,7 +162,7 @@ def performance_diagnostician(evaluation: EvaluationResult) -> Diagnosis:
|
|
| 161 |
'clarity': f"Clarity score ({weakness_score:.2f}) suggests readability issues. {weakness_reasoning[:200]}",
|
| 162 |
'safety_completeness': f"Safety score ({weakness_score:.2f}) indicates missing risk discussions. {weakness_reasoning[:200]}"
|
| 163 |
}
|
| 164 |
-
|
| 165 |
recommendation_map = {
|
| 166 |
'clinical_accuracy': "Increase RAG depth to access more authoritative medical sources.",
|
| 167 |
'evidence_grounding': "Enforce strict citation requirements and increase RAG depth.",
|
|
@@ -169,17 +170,17 @@ def performance_diagnostician(evaluation: EvaluationResult) -> Diagnosis:
|
|
| 169 |
'clarity': "Simplify language and reduce technical jargon for better readability.",
|
| 170 |
'safety_completeness': "Add explicit safety warnings and ensure complete risk coverage."
|
| 171 |
}
|
| 172 |
-
|
| 173 |
diagnosis = Diagnosis(
|
| 174 |
primary_weakness=primary_weakness,
|
| 175 |
root_cause_analysis=root_cause_map[primary_weakness],
|
| 176 |
recommendation=recommendation_map[primary_weakness]
|
| 177 |
)
|
| 178 |
-
|
| 179 |
-
print(
|
| 180 |
print(f" Primary weakness: {diagnosis.primary_weakness} ({weakness_score:.3f})")
|
| 181 |
print(f" Recommendation: {diagnosis.recommendation}")
|
| 182 |
-
|
| 183 |
return diagnosis
|
| 184 |
|
| 185 |
|
|
@@ -195,9 +196,9 @@ def sop_architect(
|
|
| 195 |
print("EXECUTING: SOP Architect")
|
| 196 |
print("=" * 70)
|
| 197 |
print(f"Target weakness: {diagnosis.primary_weakness}")
|
| 198 |
-
|
| 199 |
weakness = diagnosis.primary_weakness
|
| 200 |
-
|
| 201 |
# Generate mutations based on weakness type
|
| 202 |
if weakness == 'clarity':
|
| 203 |
mut1 = SOPMutation(
|
|
@@ -226,7 +227,7 @@ def sop_architect(
|
|
| 226 |
critical_value_alert_mode=current_sop.critical_value_alert_mode,
|
| 227 |
description="Balanced detail with fewer citations for readability"
|
| 228 |
)
|
| 229 |
-
|
| 230 |
elif weakness == 'evidence_grounding':
|
| 231 |
mut1 = SOPMutation(
|
| 232 |
disease_explainer_k=min(10, current_sop.disease_explainer_k + 2),
|
|
@@ -254,7 +255,7 @@ def sop_architect(
|
|
| 254 |
critical_value_alert_mode=current_sop.critical_value_alert_mode,
|
| 255 |
description="Moderate RAG increase with citation enforcement"
|
| 256 |
)
|
| 257 |
-
|
| 258 |
elif weakness == 'actionability':
|
| 259 |
mut1 = SOPMutation(
|
| 260 |
disease_explainer_k=current_sop.disease_explainer_k,
|
|
@@ -282,7 +283,7 @@ def sop_architect(
|
|
| 282 |
critical_value_alert_mode='strict',
|
| 283 |
description="Comprehensive approach with all agents enabled"
|
| 284 |
)
|
| 285 |
-
|
| 286 |
elif weakness == 'clinical_accuracy':
|
| 287 |
mut1 = SOPMutation(
|
| 288 |
disease_explainer_k=10,
|
|
@@ -310,7 +311,7 @@ def sop_architect(
|
|
| 310 |
critical_value_alert_mode='strict',
|
| 311 |
description="High RAG depth with comprehensive detail"
|
| 312 |
)
|
| 313 |
-
|
| 314 |
else: # safety_completeness
|
| 315 |
mut1 = SOPMutation(
|
| 316 |
disease_explainer_k=min(10, current_sop.disease_explainer_k + 1),
|
|
@@ -338,14 +339,14 @@ def sop_architect(
|
|
| 338 |
critical_value_alert_mode='strict',
|
| 339 |
description="Maximum coverage with all safety features"
|
| 340 |
)
|
| 341 |
-
|
| 342 |
evolved = EvolvedSOPs(mutations=[mut1, mut2])
|
| 343 |
-
|
| 344 |
print(f"\n✓ Generated {len(evolved.mutations)} mutations")
|
| 345 |
for i, mut in enumerate(evolved.mutations, 1):
|
| 346 |
print(f" {i}. {mut.description}")
|
| 347 |
print(f" Disease K: {mut.disease_explainer_k}, Detail: {mut.explainer_detail_level}")
|
| 348 |
-
|
| 349 |
return evolved
|
| 350 |
|
| 351 |
|
|
@@ -354,7 +355,7 @@ def run_evolution_cycle(
|
|
| 354 |
patient_input: Any,
|
| 355 |
workflow_graph: Any,
|
| 356 |
evaluation_func: Callable
|
| 357 |
-
) ->
|
| 358 |
"""
|
| 359 |
Executes one complete evolution cycle:
|
| 360 |
1. Diagnose current best SOP
|
|
@@ -367,38 +368,37 @@ def run_evolution_cycle(
|
|
| 367 |
print("\n" + "=" * 80)
|
| 368 |
print("STARTING EVOLUTION CYCLE")
|
| 369 |
print("=" * 80)
|
| 370 |
-
|
| 371 |
# Get current best (for simplicity, use latest)
|
| 372 |
current_best = gene_pool.get_latest()
|
| 373 |
if not current_best:
|
| 374 |
raise ValueError("Gene pool is empty. Add baseline SOP first.")
|
| 375 |
-
|
| 376 |
parent_sop = current_best['sop']
|
| 377 |
parent_eval = current_best['evaluation']
|
| 378 |
parent_version = current_best['version']
|
| 379 |
-
|
| 380 |
print(f"\nImproving upon SOP v{parent_version}")
|
| 381 |
-
|
| 382 |
# Step 1: Diagnose
|
| 383 |
diagnosis = performance_diagnostician(parent_eval)
|
| 384 |
-
|
| 385 |
# Step 2: Generate mutations
|
| 386 |
evolved_sops = sop_architect(diagnosis, parent_sop)
|
| 387 |
-
|
| 388 |
# Step 3: Test each mutation
|
| 389 |
new_entries = []
|
| 390 |
for i, mutant_sop_model in enumerate(evolved_sops.mutations, 1):
|
| 391 |
print(f"\n{'=' * 70}")
|
| 392 |
print(f"TESTING MUTATION {i}/{len(evolved_sops.mutations)}: {mutant_sop_model.description}")
|
| 393 |
print("=" * 70)
|
| 394 |
-
|
| 395 |
# Convert SOPMutation to ExplanationSOP
|
| 396 |
mutant_sop_dict = mutant_sop_model.model_dump()
|
| 397 |
description = mutant_sop_dict.pop('description')
|
| 398 |
mutant_sop = ExplanationSOP(**mutant_sop_dict)
|
| 399 |
-
|
| 400 |
# Run workflow with mutated SOP
|
| 401 |
-
from src.state import PatientInput
|
| 402 |
from datetime import datetime
|
| 403 |
graph_input = {
|
| 404 |
"patient_biomarkers": patient_input.biomarkers,
|
|
@@ -414,17 +414,17 @@ def run_evolution_cycle(
|
|
| 414 |
"processing_timestamp": datetime.now().isoformat(),
|
| 415 |
"sop_version": description
|
| 416 |
}
|
| 417 |
-
|
| 418 |
try:
|
| 419 |
final_state = workflow_graph.invoke(graph_input)
|
| 420 |
-
|
| 421 |
# Evaluate output
|
| 422 |
evaluation = evaluation_func(
|
| 423 |
final_response=final_state['final_response'],
|
| 424 |
agent_outputs=final_state['agent_outputs'],
|
| 425 |
biomarkers=patient_input.biomarkers
|
| 426 |
)
|
| 427 |
-
|
| 428 |
# Add to gene pool
|
| 429 |
gene_pool.add(
|
| 430 |
sop=mutant_sop,
|
|
@@ -432,7 +432,7 @@ def run_evolution_cycle(
|
|
| 432 |
parent_version=parent_version,
|
| 433 |
description=description
|
| 434 |
)
|
| 435 |
-
|
| 436 |
new_entries.append({
|
| 437 |
"sop": mutant_sop,
|
| 438 |
"evaluation": evaluation,
|
|
@@ -441,9 +441,9 @@ def run_evolution_cycle(
|
|
| 441 |
except Exception as e:
|
| 442 |
print(f"❌ Mutation {i} failed: {e}")
|
| 443 |
continue
|
| 444 |
-
|
| 445 |
print("\n" + "=" * 80)
|
| 446 |
print("EVOLUTION CYCLE COMPLETE")
|
| 447 |
print("=" * 80)
|
| 448 |
-
|
| 449 |
return new_entries
|
|
|
|
| 3 |
Outer Loop Director for SOP Evolution
|
| 4 |
"""
|
| 5 |
|
| 6 |
+
from collections.abc import Callable
|
| 7 |
+
from typing import Any, Literal
|
| 8 |
+
|
| 9 |
from pydantic import BaseModel, Field
|
| 10 |
+
|
| 11 |
from src.config import ExplanationSOP
|
| 12 |
from src.evaluation.evaluators import EvaluationResult
|
| 13 |
|
| 14 |
|
| 15 |
class SOPGenePool:
|
| 16 |
"""Manages version control for evolving SOPs"""
|
| 17 |
+
|
| 18 |
def __init__(self):
|
| 19 |
+
self.pool: list[dict[str, Any]] = []
|
| 20 |
+
self.gene_pool: list[dict[str, Any]] = [] # Alias for compatibility
|
| 21 |
self.version_counter = 0
|
| 22 |
+
|
| 23 |
def add(
|
| 24 |
self,
|
| 25 |
sop: ExplanationSOP,
|
| 26 |
evaluation: EvaluationResult,
|
| 27 |
+
parent_version: int | None = None,
|
| 28 |
description: str = ""
|
| 29 |
):
|
| 30 |
"""Add a new SOP to the gene pool"""
|
|
|
|
| 39 |
self.pool.append(entry)
|
| 40 |
self.gene_pool = self.pool # Keep in sync
|
| 41 |
print(f"✓ Added SOP v{self.version_counter} to gene pool: {description}")
|
| 42 |
+
|
| 43 |
+
def get_latest(self) -> dict[str, Any] | None:
|
| 44 |
"""Get the most recent SOP"""
|
| 45 |
return self.pool[-1] if self.pool else None
|
| 46 |
+
|
| 47 |
+
def get_by_version(self, version: int) -> dict[str, Any] | None:
|
| 48 |
"""Retrieve specific SOP version"""
|
| 49 |
for entry in self.pool:
|
| 50 |
if entry['version'] == version:
|
| 51 |
return entry
|
| 52 |
return None
|
| 53 |
+
|
| 54 |
+
def get_best_by_metric(self, metric: str) -> dict[str, Any] | None:
|
| 55 |
"""Get SOP with highest score on specific metric"""
|
| 56 |
if not self.pool:
|
| 57 |
return None
|
| 58 |
+
|
| 59 |
best = max(
|
| 60 |
self.pool,
|
| 61 |
key=lambda x: getattr(x['evaluation'], metric).score
|
| 62 |
)
|
| 63 |
return best
|
| 64 |
+
|
| 65 |
def summary(self):
|
| 66 |
"""Print summary of all SOPs in pool"""
|
| 67 |
print("\n" + "=" * 80)
|
| 68 |
print("SOP GENE POOL SUMMARY")
|
| 69 |
print("=" * 80)
|
| 70 |
+
|
| 71 |
for entry in self.pool:
|
| 72 |
v = entry['version']
|
| 73 |
p = entry['parent']
|
| 74 |
desc = entry['description']
|
| 75 |
e = entry['evaluation']
|
| 76 |
+
|
| 77 |
parent_str = "(Baseline)" if p is None else f"(Child of v{p})"
|
| 78 |
+
|
| 79 |
print(f"\nSOP v{v} {parent_str}: {desc}")
|
| 80 |
print(f" Clinical Accuracy: {e.clinical_accuracy.score:.2f}")
|
| 81 |
print(f" Evidence Grounding: {e.evidence_grounding.score:.2f}")
|
| 82 |
print(f" Actionability: {e.actionability.score:.2f}")
|
| 83 |
print(f" Clarity: {e.clarity.score:.2f}")
|
| 84 |
print(f" Safety & Completeness: {e.safety_completeness.score:.2f}")
|
| 85 |
+
|
| 86 |
print("\n" + "=" * 80)
|
| 87 |
|
| 88 |
|
|
|
|
| 121 |
|
| 122 |
class EvolvedSOPs(BaseModel):
|
| 123 |
"""Container for mutated SOPs from Architect"""
|
| 124 |
+
mutations: list[SOPMutation]
|
| 125 |
|
| 126 |
|
| 127 |
def performance_diagnostician(evaluation: EvaluationResult) -> Diagnosis:
|
|
|
|
| 132 |
print("\n" + "=" * 70)
|
| 133 |
print("EXECUTING: Performance Diagnostician")
|
| 134 |
print("=" * 70)
|
| 135 |
+
|
| 136 |
# Find lowest score programmatically (no LLM needed)
|
| 137 |
scores = {
|
| 138 |
'clinical_accuracy': evaluation.clinical_accuracy.score,
|
|
|
|
| 141 |
'clarity': evaluation.clarity.score,
|
| 142 |
'safety_completeness': evaluation.safety_completeness.score
|
| 143 |
}
|
| 144 |
+
|
| 145 |
reasonings = {
|
| 146 |
'clinical_accuracy': evaluation.clinical_accuracy.reasoning,
|
| 147 |
'evidence_grounding': evaluation.evidence_grounding.reasoning,
|
|
|
|
| 149 |
'clarity': evaluation.clarity.reasoning,
|
| 150 |
'safety_completeness': evaluation.safety_completeness.reasoning
|
| 151 |
}
|
| 152 |
+
|
| 153 |
primary_weakness = min(scores, key=scores.get)
|
| 154 |
weakness_score = scores[primary_weakness]
|
| 155 |
weakness_reasoning = reasonings[primary_weakness]
|
| 156 |
+
|
| 157 |
# Generate detailed root cause analysis
|
| 158 |
root_cause_map = {
|
| 159 |
'clinical_accuracy': f"Clinical accuracy score ({weakness_score:.2f}) indicates potential issues with medical interpretations. {weakness_reasoning[:200]}",
|
|
|
|
| 162 |
'clarity': f"Clarity score ({weakness_score:.2f}) suggests readability issues. {weakness_reasoning[:200]}",
|
| 163 |
'safety_completeness': f"Safety score ({weakness_score:.2f}) indicates missing risk discussions. {weakness_reasoning[:200]}"
|
| 164 |
}
|
| 165 |
+
|
| 166 |
recommendation_map = {
|
| 167 |
'clinical_accuracy': "Increase RAG depth to access more authoritative medical sources.",
|
| 168 |
'evidence_grounding': "Enforce strict citation requirements and increase RAG depth.",
|
|
|
|
| 170 |
'clarity': "Simplify language and reduce technical jargon for better readability.",
|
| 171 |
'safety_completeness': "Add explicit safety warnings and ensure complete risk coverage."
|
| 172 |
}
|
| 173 |
+
|
| 174 |
diagnosis = Diagnosis(
|
| 175 |
primary_weakness=primary_weakness,
|
| 176 |
root_cause_analysis=root_cause_map[primary_weakness],
|
| 177 |
recommendation=recommendation_map[primary_weakness]
|
| 178 |
)
|
| 179 |
+
|
| 180 |
+
print("\n✓ Diagnosis complete")
|
| 181 |
print(f" Primary weakness: {diagnosis.primary_weakness} ({weakness_score:.3f})")
|
| 182 |
print(f" Recommendation: {diagnosis.recommendation}")
|
| 183 |
+
|
| 184 |
return diagnosis
|
| 185 |
|
| 186 |
|
|
|
|
| 196 |
print("EXECUTING: SOP Architect")
|
| 197 |
print("=" * 70)
|
| 198 |
print(f"Target weakness: {diagnosis.primary_weakness}")
|
| 199 |
+
|
| 200 |
weakness = diagnosis.primary_weakness
|
| 201 |
+
|
| 202 |
# Generate mutations based on weakness type
|
| 203 |
if weakness == 'clarity':
|
| 204 |
mut1 = SOPMutation(
|
|
|
|
| 227 |
critical_value_alert_mode=current_sop.critical_value_alert_mode,
|
| 228 |
description="Balanced detail with fewer citations for readability"
|
| 229 |
)
|
| 230 |
+
|
| 231 |
elif weakness == 'evidence_grounding':
|
| 232 |
mut1 = SOPMutation(
|
| 233 |
disease_explainer_k=min(10, current_sop.disease_explainer_k + 2),
|
|
|
|
| 255 |
critical_value_alert_mode=current_sop.critical_value_alert_mode,
|
| 256 |
description="Moderate RAG increase with citation enforcement"
|
| 257 |
)
|
| 258 |
+
|
| 259 |
elif weakness == 'actionability':
|
| 260 |
mut1 = SOPMutation(
|
| 261 |
disease_explainer_k=current_sop.disease_explainer_k,
|
|
|
|
| 283 |
critical_value_alert_mode='strict',
|
| 284 |
description="Comprehensive approach with all agents enabled"
|
| 285 |
)
|
| 286 |
+
|
| 287 |
elif weakness == 'clinical_accuracy':
|
| 288 |
mut1 = SOPMutation(
|
| 289 |
disease_explainer_k=10,
|
|
|
|
| 311 |
critical_value_alert_mode='strict',
|
| 312 |
description="High RAG depth with comprehensive detail"
|
| 313 |
)
|
| 314 |
+
|
| 315 |
else: # safety_completeness
|
| 316 |
mut1 = SOPMutation(
|
| 317 |
disease_explainer_k=min(10, current_sop.disease_explainer_k + 1),
|
|
|
|
| 339 |
critical_value_alert_mode='strict',
|
| 340 |
description="Maximum coverage with all safety features"
|
| 341 |
)
|
| 342 |
+
|
| 343 |
evolved = EvolvedSOPs(mutations=[mut1, mut2])
|
| 344 |
+
|
| 345 |
print(f"\n✓ Generated {len(evolved.mutations)} mutations")
|
| 346 |
for i, mut in enumerate(evolved.mutations, 1):
|
| 347 |
print(f" {i}. {mut.description}")
|
| 348 |
print(f" Disease K: {mut.disease_explainer_k}, Detail: {mut.explainer_detail_level}")
|
| 349 |
+
|
| 350 |
return evolved
|
| 351 |
|
| 352 |
|
|
|
|
| 355 |
patient_input: Any,
|
| 356 |
workflow_graph: Any,
|
| 357 |
evaluation_func: Callable
|
| 358 |
+
) -> list[dict[str, Any]]:
|
| 359 |
"""
|
| 360 |
Executes one complete evolution cycle:
|
| 361 |
1. Diagnose current best SOP
|
|
|
|
| 368 |
print("\n" + "=" * 80)
|
| 369 |
print("STARTING EVOLUTION CYCLE")
|
| 370 |
print("=" * 80)
|
| 371 |
+
|
| 372 |
# Get current best (for simplicity, use latest)
|
| 373 |
current_best = gene_pool.get_latest()
|
| 374 |
if not current_best:
|
| 375 |
raise ValueError("Gene pool is empty. Add baseline SOP first.")
|
| 376 |
+
|
| 377 |
parent_sop = current_best['sop']
|
| 378 |
parent_eval = current_best['evaluation']
|
| 379 |
parent_version = current_best['version']
|
| 380 |
+
|
| 381 |
print(f"\nImproving upon SOP v{parent_version}")
|
| 382 |
+
|
| 383 |
# Step 1: Diagnose
|
| 384 |
diagnosis = performance_diagnostician(parent_eval)
|
| 385 |
+
|
| 386 |
# Step 2: Generate mutations
|
| 387 |
evolved_sops = sop_architect(diagnosis, parent_sop)
|
| 388 |
+
|
| 389 |
# Step 3: Test each mutation
|
| 390 |
new_entries = []
|
| 391 |
for i, mutant_sop_model in enumerate(evolved_sops.mutations, 1):
|
| 392 |
print(f"\n{'=' * 70}")
|
| 393 |
print(f"TESTING MUTATION {i}/{len(evolved_sops.mutations)}: {mutant_sop_model.description}")
|
| 394 |
print("=" * 70)
|
| 395 |
+
|
| 396 |
# Convert SOPMutation to ExplanationSOP
|
| 397 |
mutant_sop_dict = mutant_sop_model.model_dump()
|
| 398 |
description = mutant_sop_dict.pop('description')
|
| 399 |
mutant_sop = ExplanationSOP(**mutant_sop_dict)
|
| 400 |
+
|
| 401 |
# Run workflow with mutated SOP
|
|
|
|
| 402 |
from datetime import datetime
|
| 403 |
graph_input = {
|
| 404 |
"patient_biomarkers": patient_input.biomarkers,
|
|
|
|
| 414 |
"processing_timestamp": datetime.now().isoformat(),
|
| 415 |
"sop_version": description
|
| 416 |
}
|
| 417 |
+
|
| 418 |
try:
|
| 419 |
final_state = workflow_graph.invoke(graph_input)
|
| 420 |
+
|
| 421 |
# Evaluate output
|
| 422 |
evaluation = evaluation_func(
|
| 423 |
final_response=final_state['final_response'],
|
| 424 |
agent_outputs=final_state['agent_outputs'],
|
| 425 |
biomarkers=patient_input.biomarkers
|
| 426 |
)
|
| 427 |
+
|
| 428 |
# Add to gene pool
|
| 429 |
gene_pool.add(
|
| 430 |
sop=mutant_sop,
|
|
|
|
| 432 |
parent_version=parent_version,
|
| 433 |
description=description
|
| 434 |
)
|
| 435 |
+
|
| 436 |
new_entries.append({
|
| 437 |
"sop": mutant_sop,
|
| 438 |
"evaluation": evaluation,
|
|
|
|
| 441 |
except Exception as e:
|
| 442 |
print(f"❌ Mutation {i} failed: {e}")
|
| 443 |
continue
|
| 444 |
+
|
| 445 |
print("\n" + "=" * 80)
|
| 446 |
print("EVOLUTION CYCLE COMPLETE")
|
| 447 |
print("=" * 80)
|
| 448 |
+
|
| 449 |
return new_entries
|
archive/evolution/pareto.py
CHANGED
|
@@ -3,14 +3,16 @@ Pareto Frontier Analysis
|
|
| 3 |
Identifies optimal trade-offs in multi-objective optimization
|
| 4 |
"""
|
| 5 |
|
| 6 |
-
|
| 7 |
-
|
| 8 |
import matplotlib
|
|
|
|
|
|
|
| 9 |
matplotlib.use('Agg') # Use non-interactive backend
|
| 10 |
import matplotlib.pyplot as plt
|
| 11 |
|
| 12 |
|
| 13 |
-
def identify_pareto_front(gene_pool_entries:
|
| 14 |
"""
|
| 15 |
Identifies non-dominated solutions (Pareto Frontier).
|
| 16 |
|
|
@@ -19,32 +21,32 @@ def identify_pareto_front(gene_pool_entries: List[Dict[str, Any]]) -> List[Dict[
|
|
| 19 |
- Strictly better on AT LEAST ONE metric
|
| 20 |
"""
|
| 21 |
pareto_front = []
|
| 22 |
-
|
| 23 |
for i, candidate in enumerate(gene_pool_entries):
|
| 24 |
is_dominated = False
|
| 25 |
-
|
| 26 |
# Get candidate's 5D score vector
|
| 27 |
cand_scores = np.array(candidate['evaluation'].to_vector())
|
| 28 |
-
|
| 29 |
for j, other in enumerate(gene_pool_entries):
|
| 30 |
if i == j:
|
| 31 |
continue
|
| 32 |
-
|
| 33 |
# Get other solution's 5D vector
|
| 34 |
other_scores = np.array(other['evaluation'].to_vector())
|
| 35 |
-
|
| 36 |
# Check domination: other >= candidate on ALL, other > candidate on SOME
|
| 37 |
if np.all(other_scores >= cand_scores) and np.any(other_scores > cand_scores):
|
| 38 |
is_dominated = True
|
| 39 |
break
|
| 40 |
-
|
| 41 |
if not is_dominated:
|
| 42 |
pareto_front.append(candidate)
|
| 43 |
-
|
| 44 |
return pareto_front
|
| 45 |
|
| 46 |
|
| 47 |
-
def visualize_pareto_frontier(pareto_front:
|
| 48 |
"""
|
| 49 |
Creates two visualizations:
|
| 50 |
1. Parallel coordinates plot (5D)
|
|
@@ -53,16 +55,16 @@ def visualize_pareto_frontier(pareto_front: List[Dict[str, Any]]):
|
|
| 53 |
if not pareto_front:
|
| 54 |
print("No solutions on Pareto front to visualize")
|
| 55 |
return
|
| 56 |
-
|
| 57 |
fig = plt.figure(figsize=(18, 7))
|
| 58 |
-
|
| 59 |
# --- Plot 1: Bar Chart (since pandas might not be available) ---
|
| 60 |
ax1 = plt.subplot(1, 2, 1)
|
| 61 |
-
|
| 62 |
metrics = ['Clinical\nAccuracy', 'Evidence\nGrounding', 'Actionability', 'Clarity', 'Safety']
|
| 63 |
x = np.arange(len(metrics))
|
| 64 |
width = 0.8 / len(pareto_front)
|
| 65 |
-
|
| 66 |
for idx, entry in enumerate(pareto_front):
|
| 67 |
e = entry['evaluation']
|
| 68 |
scores = [
|
|
@@ -72,11 +74,11 @@ def visualize_pareto_frontier(pareto_front: List[Dict[str, Any]]):
|
|
| 72 |
e.clarity.score,
|
| 73 |
e.safety_completeness.score
|
| 74 |
]
|
| 75 |
-
|
| 76 |
offset = (idx - len(pareto_front) / 2) * width + width / 2
|
| 77 |
label = f"SOP v{entry['version']}"
|
| 78 |
ax1.bar(x + offset, scores, width, label=label, alpha=0.8)
|
| 79 |
-
|
| 80 |
ax1.set_xlabel('Metrics', fontsize=12)
|
| 81 |
ax1.set_ylabel('Score', fontsize=12)
|
| 82 |
ax1.set_title('5D Performance Comparison (Bar Chart)', fontsize=14)
|
|
@@ -85,17 +87,17 @@ def visualize_pareto_frontier(pareto_front: List[Dict[str, Any]]):
|
|
| 85 |
ax1.set_ylim(0, 1.0)
|
| 86 |
ax1.legend(loc='upper left')
|
| 87 |
ax1.grid(True, alpha=0.3, axis='y')
|
| 88 |
-
|
| 89 |
# --- Plot 2: Radar Chart ---
|
| 90 |
ax2 = plt.subplot(1, 2, 2, projection='polar')
|
| 91 |
-
|
| 92 |
-
categories = ['Clinical\nAccuracy', 'Evidence\nGrounding',
|
| 93 |
'Actionability', 'Clarity', 'Safety']
|
| 94 |
num_vars = len(categories)
|
| 95 |
-
|
| 96 |
angles = np.linspace(0, 2 * np.pi, num_vars, endpoint=False).tolist()
|
| 97 |
angles += angles[:1]
|
| 98 |
-
|
| 99 |
for entry in pareto_front:
|
| 100 |
e = entry['evaluation']
|
| 101 |
values = [
|
|
@@ -106,47 +108,47 @@ def visualize_pareto_frontier(pareto_front: List[Dict[str, Any]]):
|
|
| 106 |
e.safety_completeness.score
|
| 107 |
]
|
| 108 |
values += values[:1]
|
| 109 |
-
|
| 110 |
desc = entry.get('description', '')[:30]
|
| 111 |
label = f"SOP v{entry['version']}: {desc}"
|
| 112 |
ax2.plot(angles, values, 'o-', linewidth=2, label=label)
|
| 113 |
ax2.fill(angles, values, alpha=0.15)
|
| 114 |
-
|
| 115 |
ax2.set_xticks(angles[:-1])
|
| 116 |
ax2.set_xticklabels(categories, size=10)
|
| 117 |
ax2.set_ylim(0, 1)
|
| 118 |
ax2.set_title('5D Performance Profiles (Radar Chart)', size=14, y=1.08)
|
| 119 |
ax2.legend(loc='upper left', bbox_to_anchor=(1.2, 1.0), fontsize=9)
|
| 120 |
ax2.grid(True)
|
| 121 |
-
|
| 122 |
plt.tight_layout()
|
| 123 |
-
|
| 124 |
# Create data directory if it doesn't exist
|
| 125 |
from pathlib import Path
|
| 126 |
data_dir = Path('data')
|
| 127 |
data_dir.mkdir(exist_ok=True)
|
| 128 |
-
|
| 129 |
output_path = data_dir / 'pareto_frontier_analysis.png'
|
| 130 |
plt.savefig(output_path, dpi=300, bbox_inches='tight')
|
| 131 |
plt.close()
|
| 132 |
-
|
| 133 |
print(f"\n✓ Visualization saved to: {output_path}")
|
| 134 |
|
| 135 |
|
| 136 |
-
def print_pareto_summary(pareto_front:
|
| 137 |
"""Print human-readable summary of Pareto frontier"""
|
| 138 |
print("\n" + "=" * 80)
|
| 139 |
print("PARETO FRONTIER ANALYSIS")
|
| 140 |
print("=" * 80)
|
| 141 |
-
|
| 142 |
print(f"\nFound {len(pareto_front)} optimal (non-dominated) solutions:\n")
|
| 143 |
-
|
| 144 |
for entry in pareto_front:
|
| 145 |
v = entry['version']
|
| 146 |
p = entry.get('parent')
|
| 147 |
desc = entry.get('description', 'Baseline')
|
| 148 |
e = entry['evaluation']
|
| 149 |
-
|
| 150 |
print(f"SOP v{v} {f'(Child of v{p})' if p else '(Baseline)'}")
|
| 151 |
print(f" Description: {desc}")
|
| 152 |
print(f" Clinical Accuracy: {e.clinical_accuracy.score:.3f}")
|
|
@@ -154,12 +156,12 @@ def print_pareto_summary(pareto_front: List[Dict[str, Any]]):
|
|
| 154 |
print(f" Actionability: {e.actionability.score:.3f}")
|
| 155 |
print(f" Clarity: {e.clarity.score:.3f}")
|
| 156 |
print(f" Safety & Completeness: {e.safety_completeness.score:.3f}")
|
| 157 |
-
|
| 158 |
# Calculate average
|
| 159 |
avg_score = np.mean(e.to_vector())
|
| 160 |
print(f" Average Score: {avg_score:.3f}")
|
| 161 |
print()
|
| 162 |
-
|
| 163 |
print("=" * 80)
|
| 164 |
print("\nRECOMMENDATION:")
|
| 165 |
print("Review the visualizations and choose the SOP that best matches")
|
|
@@ -167,46 +169,46 @@ def print_pareto_summary(pareto_front: List[Dict[str, Any]]):
|
|
| 167 |
print("=" * 80)
|
| 168 |
|
| 169 |
|
| 170 |
-
def analyze_improvements(gene_pool_entries:
|
| 171 |
"""Analyze improvements over baseline"""
|
| 172 |
if len(gene_pool_entries) < 2:
|
| 173 |
print("\n⚠️ Not enough SOPs to analyze improvements")
|
| 174 |
return
|
| 175 |
-
|
| 176 |
baseline = gene_pool_entries[0]
|
| 177 |
baseline_scores = np.array(baseline['evaluation'].to_vector())
|
| 178 |
-
|
| 179 |
print("\n" + "=" * 80)
|
| 180 |
print("IMPROVEMENT ANALYSIS")
|
| 181 |
print("=" * 80)
|
| 182 |
-
|
| 183 |
print(f"\nBaseline (v{baseline['version']}): {baseline.get('description', 'Initial')}")
|
| 184 |
print(f" Average Score: {np.mean(baseline_scores):.3f}")
|
| 185 |
-
|
| 186 |
improvements_found = False
|
| 187 |
for entry in gene_pool_entries[1:]:
|
| 188 |
scores = np.array(entry['evaluation'].to_vector())
|
| 189 |
avg_score = np.mean(scores)
|
| 190 |
baseline_avg = np.mean(baseline_scores)
|
| 191 |
-
|
| 192 |
if avg_score > baseline_avg:
|
| 193 |
improvements_found = True
|
| 194 |
improvement_pct = ((avg_score - baseline_avg) / baseline_avg) * 100
|
| 195 |
-
|
| 196 |
-
print(f"\n✓ SOP v{entry['version']}: {entry.get('description', '')}")
|
| 197 |
print(f" Average Score: {avg_score:.3f} (+{improvement_pct:.1f}% vs baseline)")
|
| 198 |
-
|
| 199 |
# Show per-metric improvements
|
| 200 |
-
metric_names = ['Clinical Accuracy', 'Evidence Grounding', 'Actionability',
|
| 201 |
'Clarity', 'Safety & Completeness']
|
| 202 |
for i, (name, score, baseline_score) in enumerate(zip(metric_names, scores, baseline_scores)):
|
| 203 |
diff = score - baseline_score
|
| 204 |
if abs(diff) > 0.01: # Show significant changes
|
| 205 |
symbol = "↑" if diff > 0 else "↓"
|
| 206 |
print(f" {name}: {score:.3f} {symbol} ({diff:+.3f})")
|
| 207 |
-
|
| 208 |
if not improvements_found:
|
| 209 |
print("\n⚠️ No improvements found over baseline yet")
|
| 210 |
print(" Consider running more evolution cycles or adjusting mutation strategies")
|
| 211 |
-
|
| 212 |
print("\n" + "=" * 80)
|
|
|
|
| 3 |
Identifies optimal trade-offs in multi-objective optimization
|
| 4 |
"""
|
| 5 |
|
| 6 |
+
from typing import Any
|
| 7 |
+
|
| 8 |
import matplotlib
|
| 9 |
+
import numpy as np
|
| 10 |
+
|
| 11 |
matplotlib.use('Agg') # Use non-interactive backend
|
| 12 |
import matplotlib.pyplot as plt
|
| 13 |
|
| 14 |
|
| 15 |
+
def identify_pareto_front(gene_pool_entries: list[dict[str, Any]]) -> list[dict[str, Any]]:
|
| 16 |
"""
|
| 17 |
Identifies non-dominated solutions (Pareto Frontier).
|
| 18 |
|
|
|
|
| 21 |
- Strictly better on AT LEAST ONE metric
|
| 22 |
"""
|
| 23 |
pareto_front = []
|
| 24 |
+
|
| 25 |
for i, candidate in enumerate(gene_pool_entries):
|
| 26 |
is_dominated = False
|
| 27 |
+
|
| 28 |
# Get candidate's 5D score vector
|
| 29 |
cand_scores = np.array(candidate['evaluation'].to_vector())
|
| 30 |
+
|
| 31 |
for j, other in enumerate(gene_pool_entries):
|
| 32 |
if i == j:
|
| 33 |
continue
|
| 34 |
+
|
| 35 |
# Get other solution's 5D vector
|
| 36 |
other_scores = np.array(other['evaluation'].to_vector())
|
| 37 |
+
|
| 38 |
# Check domination: other >= candidate on ALL, other > candidate on SOME
|
| 39 |
if np.all(other_scores >= cand_scores) and np.any(other_scores > cand_scores):
|
| 40 |
is_dominated = True
|
| 41 |
break
|
| 42 |
+
|
| 43 |
if not is_dominated:
|
| 44 |
pareto_front.append(candidate)
|
| 45 |
+
|
| 46 |
return pareto_front
|
| 47 |
|
| 48 |
|
| 49 |
+
def visualize_pareto_frontier(pareto_front: list[dict[str, Any]]):
|
| 50 |
"""
|
| 51 |
Creates two visualizations:
|
| 52 |
1. Parallel coordinates plot (5D)
|
|
|
|
| 55 |
if not pareto_front:
|
| 56 |
print("No solutions on Pareto front to visualize")
|
| 57 |
return
|
| 58 |
+
|
| 59 |
fig = plt.figure(figsize=(18, 7))
|
| 60 |
+
|
| 61 |
# --- Plot 1: Bar Chart (since pandas might not be available) ---
|
| 62 |
ax1 = plt.subplot(1, 2, 1)
|
| 63 |
+
|
| 64 |
metrics = ['Clinical\nAccuracy', 'Evidence\nGrounding', 'Actionability', 'Clarity', 'Safety']
|
| 65 |
x = np.arange(len(metrics))
|
| 66 |
width = 0.8 / len(pareto_front)
|
| 67 |
+
|
| 68 |
for idx, entry in enumerate(pareto_front):
|
| 69 |
e = entry['evaluation']
|
| 70 |
scores = [
|
|
|
|
| 74 |
e.clarity.score,
|
| 75 |
e.safety_completeness.score
|
| 76 |
]
|
| 77 |
+
|
| 78 |
offset = (idx - len(pareto_front) / 2) * width + width / 2
|
| 79 |
label = f"SOP v{entry['version']}"
|
| 80 |
ax1.bar(x + offset, scores, width, label=label, alpha=0.8)
|
| 81 |
+
|
| 82 |
ax1.set_xlabel('Metrics', fontsize=12)
|
| 83 |
ax1.set_ylabel('Score', fontsize=12)
|
| 84 |
ax1.set_title('5D Performance Comparison (Bar Chart)', fontsize=14)
|
|
|
|
| 87 |
ax1.set_ylim(0, 1.0)
|
| 88 |
ax1.legend(loc='upper left')
|
| 89 |
ax1.grid(True, alpha=0.3, axis='y')
|
| 90 |
+
|
| 91 |
# --- Plot 2: Radar Chart ---
|
| 92 |
ax2 = plt.subplot(1, 2, 2, projection='polar')
|
| 93 |
+
|
| 94 |
+
categories = ['Clinical\nAccuracy', 'Evidence\nGrounding',
|
| 95 |
'Actionability', 'Clarity', 'Safety']
|
| 96 |
num_vars = len(categories)
|
| 97 |
+
|
| 98 |
angles = np.linspace(0, 2 * np.pi, num_vars, endpoint=False).tolist()
|
| 99 |
angles += angles[:1]
|
| 100 |
+
|
| 101 |
for entry in pareto_front:
|
| 102 |
e = entry['evaluation']
|
| 103 |
values = [
|
|
|
|
| 108 |
e.safety_completeness.score
|
| 109 |
]
|
| 110 |
values += values[:1]
|
| 111 |
+
|
| 112 |
desc = entry.get('description', '')[:30]
|
| 113 |
label = f"SOP v{entry['version']}: {desc}"
|
| 114 |
ax2.plot(angles, values, 'o-', linewidth=2, label=label)
|
| 115 |
ax2.fill(angles, values, alpha=0.15)
|
| 116 |
+
|
| 117 |
ax2.set_xticks(angles[:-1])
|
| 118 |
ax2.set_xticklabels(categories, size=10)
|
| 119 |
ax2.set_ylim(0, 1)
|
| 120 |
ax2.set_title('5D Performance Profiles (Radar Chart)', size=14, y=1.08)
|
| 121 |
ax2.legend(loc='upper left', bbox_to_anchor=(1.2, 1.0), fontsize=9)
|
| 122 |
ax2.grid(True)
|
| 123 |
+
|
| 124 |
plt.tight_layout()
|
| 125 |
+
|
| 126 |
# Create data directory if it doesn't exist
|
| 127 |
from pathlib import Path
|
| 128 |
data_dir = Path('data')
|
| 129 |
data_dir.mkdir(exist_ok=True)
|
| 130 |
+
|
| 131 |
output_path = data_dir / 'pareto_frontier_analysis.png'
|
| 132 |
plt.savefig(output_path, dpi=300, bbox_inches='tight')
|
| 133 |
plt.close()
|
| 134 |
+
|
| 135 |
print(f"\n✓ Visualization saved to: {output_path}")
|
| 136 |
|
| 137 |
|
| 138 |
+
def print_pareto_summary(pareto_front: list[dict[str, Any]]):
|
| 139 |
"""Print human-readable summary of Pareto frontier"""
|
| 140 |
print("\n" + "=" * 80)
|
| 141 |
print("PARETO FRONTIER ANALYSIS")
|
| 142 |
print("=" * 80)
|
| 143 |
+
|
| 144 |
print(f"\nFound {len(pareto_front)} optimal (non-dominated) solutions:\n")
|
| 145 |
+
|
| 146 |
for entry in pareto_front:
|
| 147 |
v = entry['version']
|
| 148 |
p = entry.get('parent')
|
| 149 |
desc = entry.get('description', 'Baseline')
|
| 150 |
e = entry['evaluation']
|
| 151 |
+
|
| 152 |
print(f"SOP v{v} {f'(Child of v{p})' if p else '(Baseline)'}")
|
| 153 |
print(f" Description: {desc}")
|
| 154 |
print(f" Clinical Accuracy: {e.clinical_accuracy.score:.3f}")
|
|
|
|
| 156 |
print(f" Actionability: {e.actionability.score:.3f}")
|
| 157 |
print(f" Clarity: {e.clarity.score:.3f}")
|
| 158 |
print(f" Safety & Completeness: {e.safety_completeness.score:.3f}")
|
| 159 |
+
|
| 160 |
# Calculate average
|
| 161 |
avg_score = np.mean(e.to_vector())
|
| 162 |
print(f" Average Score: {avg_score:.3f}")
|
| 163 |
print()
|
| 164 |
+
|
| 165 |
print("=" * 80)
|
| 166 |
print("\nRECOMMENDATION:")
|
| 167 |
print("Review the visualizations and choose the SOP that best matches")
|
|
|
|
| 169 |
print("=" * 80)
|
| 170 |
|
| 171 |
|
| 172 |
+
def analyze_improvements(gene_pool_entries: list[dict[str, Any]]):
|
| 173 |
"""Analyze improvements over baseline"""
|
| 174 |
if len(gene_pool_entries) < 2:
|
| 175 |
print("\n⚠️ Not enough SOPs to analyze improvements")
|
| 176 |
return
|
| 177 |
+
|
| 178 |
baseline = gene_pool_entries[0]
|
| 179 |
baseline_scores = np.array(baseline['evaluation'].to_vector())
|
| 180 |
+
|
| 181 |
print("\n" + "=" * 80)
|
| 182 |
print("IMPROVEMENT ANALYSIS")
|
| 183 |
print("=" * 80)
|
| 184 |
+
|
| 185 |
print(f"\nBaseline (v{baseline['version']}): {baseline.get('description', 'Initial')}")
|
| 186 |
print(f" Average Score: {np.mean(baseline_scores):.3f}")
|
| 187 |
+
|
| 188 |
improvements_found = False
|
| 189 |
for entry in gene_pool_entries[1:]:
|
| 190 |
scores = np.array(entry['evaluation'].to_vector())
|
| 191 |
avg_score = np.mean(scores)
|
| 192 |
baseline_avg = np.mean(baseline_scores)
|
| 193 |
+
|
| 194 |
if avg_score > baseline_avg:
|
| 195 |
improvements_found = True
|
| 196 |
improvement_pct = ((avg_score - baseline_avg) / baseline_avg) * 100
|
| 197 |
+
|
| 198 |
+
print(f"\n✓ SOP v{entry['version']}: {entry.get('description', '')}")
|
| 199 |
print(f" Average Score: {avg_score:.3f} (+{improvement_pct:.1f}% vs baseline)")
|
| 200 |
+
|
| 201 |
# Show per-metric improvements
|
| 202 |
+
metric_names = ['Clinical Accuracy', 'Evidence Grounding', 'Actionability',
|
| 203 |
'Clarity', 'Safety & Completeness']
|
| 204 |
for i, (name, score, baseline_score) in enumerate(zip(metric_names, scores, baseline_scores)):
|
| 205 |
diff = score - baseline_score
|
| 206 |
if abs(diff) > 0.01: # Show significant changes
|
| 207 |
symbol = "↑" if diff > 0 else "↓"
|
| 208 |
print(f" {name}: {score:.3f} {symbol} ({diff:+.3f})")
|
| 209 |
+
|
| 210 |
if not improvements_found:
|
| 211 |
print("\n⚠️ No improvements found over baseline yet")
|
| 212 |
print(" Consider running more evolution cycles or adjusting mutation strategies")
|
| 213 |
+
|
| 214 |
print("\n" + "=" * 80)
|
archive/sop_evolution.py
CHANGED
|
@@ -8,9 +8,10 @@ from __future__ import annotations
|
|
| 8 |
|
| 9 |
from datetime import datetime, timedelta
|
| 10 |
|
| 11 |
-
from airflow import DAG
|
| 12 |
from airflow.operators.python import PythonOperator
|
| 13 |
|
|
|
|
|
|
|
| 14 |
default_args = {
|
| 15 |
"owner": "mediguard",
|
| 16 |
"retries": 1,
|
|
|
|
| 8 |
|
| 9 |
from datetime import datetime, timedelta
|
| 10 |
|
|
|
|
| 11 |
from airflow.operators.python import PythonOperator
|
| 12 |
|
| 13 |
+
from airflow import DAG
|
| 14 |
+
|
| 15 |
default_args = {
|
| 16 |
"owner": "mediguard",
|
| 17 |
"retries": 1,
|
{tests → archive/tests}/test_evolution_loop.py
RENAMED
|
@@ -10,20 +10,20 @@ from pathlib import Path
|
|
| 10 |
project_root = Path(__file__).parent.parent
|
| 11 |
sys.path.insert(0, str(project_root))
|
| 12 |
|
| 13 |
-
from
|
| 14 |
-
from
|
|
|
|
| 15 |
from src.config import BASELINE_SOP
|
| 16 |
-
from src.state import PatientInput, GuildState
|
| 17 |
from src.evaluation.evaluators import run_full_evaluation
|
| 18 |
from src.evolution.director import SOPGenePool, run_evolution_cycle
|
| 19 |
from src.evolution.pareto import (
|
|
|
|
| 20 |
identify_pareto_front,
|
| 21 |
-
visualize_pareto_frontier,
|
| 22 |
print_pareto_summary,
|
| 23 |
-
|
| 24 |
)
|
| 25 |
-
from
|
| 26 |
-
from
|
| 27 |
|
| 28 |
|
| 29 |
def create_test_patient() -> PatientInput:
|
|
@@ -53,8 +53,8 @@ def create_test_patient() -> PatientInput:
|
|
| 53 |
"Chloride": 102.0,
|
| 54 |
"Bicarbonate": 24.0
|
| 55 |
}
|
| 56 |
-
|
| 57 |
-
model_prediction:
|
| 58 |
'disease': 'Type 2 Diabetes',
|
| 59 |
'confidence': 0.92,
|
| 60 |
'probabilities': {
|
|
@@ -64,7 +64,7 @@ def create_test_patient() -> PatientInput:
|
|
| 64 |
},
|
| 65 |
'prediction_timestamp': '2025-01-01T10:00:00'
|
| 66 |
}
|
| 67 |
-
|
| 68 |
patient_context = {
|
| 69 |
'patient_id': 'TEST-001',
|
| 70 |
'age': 55,
|
|
@@ -74,7 +74,7 @@ def create_test_patient() -> PatientInput:
|
|
| 74 |
'current_medications': ["Metformin 500mg"],
|
| 75 |
'query': "My blood sugar has been high lately. What should I do?"
|
| 76 |
}
|
| 77 |
-
|
| 78 |
return PatientInput(
|
| 79 |
biomarkers=biomarkers,
|
| 80 |
model_prediction=model_prediction,
|
|
@@ -87,19 +87,19 @@ def main():
|
|
| 87 |
print("\n" + "=" * 80)
|
| 88 |
print("PHASE 3: SELF-IMPROVEMENT LOOP TEST")
|
| 89 |
print("=" * 80)
|
| 90 |
-
|
| 91 |
# Setup
|
| 92 |
print("\n1. Initializing system...")
|
| 93 |
guild = create_guild()
|
| 94 |
patient = create_test_patient()
|
| 95 |
-
|
| 96 |
# Initialize gene pool with baseline
|
| 97 |
print("\n2. Creating SOP Gene Pool...")
|
| 98 |
gene_pool = SOPGenePool()
|
| 99 |
-
|
| 100 |
print("\n3. Evaluating Baseline SOP...")
|
| 101 |
# Run workflow with baseline SOP
|
| 102 |
-
|
| 103 |
initial_state: GuildState = {
|
| 104 |
'patient_biomarkers': patient.biomarkers,
|
| 105 |
'model_prediction': patient.model_prediction,
|
|
@@ -113,41 +113,41 @@ def main():
|
|
| 113 |
'processing_timestamp': datetime.now().isoformat(),
|
| 114 |
'sop_version': "Baseline"
|
| 115 |
}
|
| 116 |
-
|
| 117 |
guild_state = guild.workflow.invoke(initial_state)
|
| 118 |
-
|
| 119 |
baseline_response = guild_state['final_response']
|
| 120 |
agent_outputs = guild_state['agent_outputs']
|
| 121 |
-
|
| 122 |
baseline_eval = run_full_evaluation(
|
| 123 |
final_response=baseline_response,
|
| 124 |
agent_outputs=agent_outputs,
|
| 125 |
biomarkers=patient.biomarkers
|
| 126 |
)
|
| 127 |
-
|
| 128 |
gene_pool.add(
|
| 129 |
sop=BASELINE_SOP,
|
| 130 |
evaluation=baseline_eval,
|
| 131 |
parent_version=None,
|
| 132 |
description="Baseline SOP"
|
| 133 |
)
|
| 134 |
-
|
| 135 |
print(f"\n✓ Baseline Average Score: {baseline_eval.average_score():.3f}")
|
| 136 |
print(f" Clinical Accuracy: {baseline_eval.clinical_accuracy.score:.3f}")
|
| 137 |
print(f" Evidence Grounding: {baseline_eval.evidence_grounding.score:.3f}")
|
| 138 |
print(f" Actionability: {baseline_eval.actionability.score:.3f}")
|
| 139 |
print(f" Clarity: {baseline_eval.clarity.score:.3f}")
|
| 140 |
print(f" Safety & Completeness: {baseline_eval.safety_completeness.score:.3f}")
|
| 141 |
-
|
| 142 |
# Run evolution cycles
|
| 143 |
num_cycles = 2
|
| 144 |
print(f"\n4. Running {num_cycles} Evolution Cycles...")
|
| 145 |
-
|
| 146 |
for cycle in range(1, num_cycles + 1):
|
| 147 |
print(f"\n{'─' * 80}")
|
| 148 |
print(f"EVOLUTION CYCLE {cycle}")
|
| 149 |
print(f"{'─' * 80}")
|
| 150 |
-
|
| 151 |
try:
|
| 152 |
# Create evaluation function for this cycle
|
| 153 |
def eval_func(final_response, agent_outputs, biomarkers):
|
|
@@ -156,61 +156,61 @@ def main():
|
|
| 156 |
agent_outputs=agent_outputs,
|
| 157 |
biomarkers=biomarkers
|
| 158 |
)
|
| 159 |
-
|
| 160 |
new_entries = run_evolution_cycle(
|
| 161 |
gene_pool=gene_pool,
|
| 162 |
patient_input=patient,
|
| 163 |
workflow_graph=guild.workflow,
|
| 164 |
evaluation_func=eval_func
|
| 165 |
)
|
| 166 |
-
|
| 167 |
print(f"\n✓ Cycle {cycle} complete: Added {len(new_entries)} new SOPs to gene pool")
|
| 168 |
-
|
| 169 |
for entry in new_entries:
|
| 170 |
print(f"\n SOP v{entry['version']}: {entry['description']}")
|
| 171 |
print(f" Average Score: {entry['evaluation'].average_score():.3f}")
|
| 172 |
-
|
| 173 |
except Exception as e:
|
| 174 |
print(f"\n⚠️ Cycle {cycle} encountered error: {e}")
|
| 175 |
print("Continuing to next cycle...")
|
| 176 |
-
|
| 177 |
# Show gene pool summary
|
| 178 |
print("\n5. Gene Pool Summary:")
|
| 179 |
gene_pool.summary()
|
| 180 |
-
|
| 181 |
# Pareto Analysis
|
| 182 |
print("\n6. Identifying Pareto Frontier...")
|
| 183 |
all_entries = gene_pool.gene_pool
|
| 184 |
pareto_front = identify_pareto_front(all_entries)
|
| 185 |
-
|
| 186 |
print(f"\n✓ Pareto frontier contains {len(pareto_front)} non-dominated solutions")
|
| 187 |
print_pareto_summary(pareto_front)
|
| 188 |
-
|
| 189 |
# Improvement Analysis
|
| 190 |
print("\n7. Analyzing Improvements...")
|
| 191 |
analyze_improvements(all_entries)
|
| 192 |
-
|
| 193 |
# Visualizations
|
| 194 |
print("\n8. Generating Visualizations...")
|
| 195 |
visualize_pareto_frontier(pareto_front)
|
| 196 |
-
|
| 197 |
# Final Summary
|
| 198 |
print("\n" + "=" * 80)
|
| 199 |
print("EVOLUTION TEST COMPLETE")
|
| 200 |
print("=" * 80)
|
| 201 |
-
|
| 202 |
print(f"\n✓ Total SOPs in Gene Pool: {len(all_entries)}")
|
| 203 |
print(f"✓ Pareto Optimal SOPs: {len(pareto_front)}")
|
| 204 |
-
|
| 205 |
# Find best average score
|
| 206 |
best_sop = max(all_entries, key=lambda e: e['evaluation'].average_score())
|
| 207 |
baseline_avg = baseline_eval.average_score()
|
| 208 |
best_avg = best_sop['evaluation'].average_score()
|
| 209 |
improvement = ((best_avg - baseline_avg) / baseline_avg) * 100
|
| 210 |
-
|
| 211 |
print(f"\nBest SOP: v{best_sop['version']} - {best_sop['description']}")
|
| 212 |
print(f" Average Score: {best_avg:.3f} ({improvement:+.1f}% vs baseline)")
|
| 213 |
-
|
| 214 |
print("\n✓ Visualization saved to: data/pareto_frontier_analysis.png")
|
| 215 |
print("\n" + "=" * 80)
|
| 216 |
|
|
|
|
| 10 |
project_root = Path(__file__).parent.parent
|
| 11 |
sys.path.insert(0, str(project_root))
|
| 12 |
|
| 13 |
+
from datetime import datetime
|
| 14 |
+
from typing import Any
|
| 15 |
+
|
| 16 |
from src.config import BASELINE_SOP
|
|
|
|
| 17 |
from src.evaluation.evaluators import run_full_evaluation
|
| 18 |
from src.evolution.director import SOPGenePool, run_evolution_cycle
|
| 19 |
from src.evolution.pareto import (
|
| 20 |
+
analyze_improvements,
|
| 21 |
identify_pareto_front,
|
|
|
|
| 22 |
print_pareto_summary,
|
| 23 |
+
visualize_pareto_frontier,
|
| 24 |
)
|
| 25 |
+
from src.state import GuildState, PatientInput
|
| 26 |
+
from src.workflow import create_guild
|
| 27 |
|
| 28 |
|
| 29 |
def create_test_patient() -> PatientInput:
|
|
|
|
| 53 |
"Chloride": 102.0,
|
| 54 |
"Bicarbonate": 24.0
|
| 55 |
}
|
| 56 |
+
|
| 57 |
+
model_prediction: dict[str, Any] = {
|
| 58 |
'disease': 'Type 2 Diabetes',
|
| 59 |
'confidence': 0.92,
|
| 60 |
'probabilities': {
|
|
|
|
| 64 |
},
|
| 65 |
'prediction_timestamp': '2025-01-01T10:00:00'
|
| 66 |
}
|
| 67 |
+
|
| 68 |
patient_context = {
|
| 69 |
'patient_id': 'TEST-001',
|
| 70 |
'age': 55,
|
|
|
|
| 74 |
'current_medications': ["Metformin 500mg"],
|
| 75 |
'query': "My blood sugar has been high lately. What should I do?"
|
| 76 |
}
|
| 77 |
+
|
| 78 |
return PatientInput(
|
| 79 |
biomarkers=biomarkers,
|
| 80 |
model_prediction=model_prediction,
|
|
|
|
| 87 |
print("\n" + "=" * 80)
|
| 88 |
print("PHASE 3: SELF-IMPROVEMENT LOOP TEST")
|
| 89 |
print("=" * 80)
|
| 90 |
+
|
| 91 |
# Setup
|
| 92 |
print("\n1. Initializing system...")
|
| 93 |
guild = create_guild()
|
| 94 |
patient = create_test_patient()
|
| 95 |
+
|
| 96 |
# Initialize gene pool with baseline
|
| 97 |
print("\n2. Creating SOP Gene Pool...")
|
| 98 |
gene_pool = SOPGenePool()
|
| 99 |
+
|
| 100 |
print("\n3. Evaluating Baseline SOP...")
|
| 101 |
# Run workflow with baseline SOP
|
| 102 |
+
|
| 103 |
initial_state: GuildState = {
|
| 104 |
'patient_biomarkers': patient.biomarkers,
|
| 105 |
'model_prediction': patient.model_prediction,
|
|
|
|
| 113 |
'processing_timestamp': datetime.now().isoformat(),
|
| 114 |
'sop_version': "Baseline"
|
| 115 |
}
|
| 116 |
+
|
| 117 |
guild_state = guild.workflow.invoke(initial_state)
|
| 118 |
+
|
| 119 |
baseline_response = guild_state['final_response']
|
| 120 |
agent_outputs = guild_state['agent_outputs']
|
| 121 |
+
|
| 122 |
baseline_eval = run_full_evaluation(
|
| 123 |
final_response=baseline_response,
|
| 124 |
agent_outputs=agent_outputs,
|
| 125 |
biomarkers=patient.biomarkers
|
| 126 |
)
|
| 127 |
+
|
| 128 |
gene_pool.add(
|
| 129 |
sop=BASELINE_SOP,
|
| 130 |
evaluation=baseline_eval,
|
| 131 |
parent_version=None,
|
| 132 |
description="Baseline SOP"
|
| 133 |
)
|
| 134 |
+
|
| 135 |
print(f"\n✓ Baseline Average Score: {baseline_eval.average_score():.3f}")
|
| 136 |
print(f" Clinical Accuracy: {baseline_eval.clinical_accuracy.score:.3f}")
|
| 137 |
print(f" Evidence Grounding: {baseline_eval.evidence_grounding.score:.3f}")
|
| 138 |
print(f" Actionability: {baseline_eval.actionability.score:.3f}")
|
| 139 |
print(f" Clarity: {baseline_eval.clarity.score:.3f}")
|
| 140 |
print(f" Safety & Completeness: {baseline_eval.safety_completeness.score:.3f}")
|
| 141 |
+
|
| 142 |
# Run evolution cycles
|
| 143 |
num_cycles = 2
|
| 144 |
print(f"\n4. Running {num_cycles} Evolution Cycles...")
|
| 145 |
+
|
| 146 |
for cycle in range(1, num_cycles + 1):
|
| 147 |
print(f"\n{'─' * 80}")
|
| 148 |
print(f"EVOLUTION CYCLE {cycle}")
|
| 149 |
print(f"{'─' * 80}")
|
| 150 |
+
|
| 151 |
try:
|
| 152 |
# Create evaluation function for this cycle
|
| 153 |
def eval_func(final_response, agent_outputs, biomarkers):
|
|
|
|
| 156 |
agent_outputs=agent_outputs,
|
| 157 |
biomarkers=biomarkers
|
| 158 |
)
|
| 159 |
+
|
| 160 |
new_entries = run_evolution_cycle(
|
| 161 |
gene_pool=gene_pool,
|
| 162 |
patient_input=patient,
|
| 163 |
workflow_graph=guild.workflow,
|
| 164 |
evaluation_func=eval_func
|
| 165 |
)
|
| 166 |
+
|
| 167 |
print(f"\n✓ Cycle {cycle} complete: Added {len(new_entries)} new SOPs to gene pool")
|
| 168 |
+
|
| 169 |
for entry in new_entries:
|
| 170 |
print(f"\n SOP v{entry['version']}: {entry['description']}")
|
| 171 |
print(f" Average Score: {entry['evaluation'].average_score():.3f}")
|
| 172 |
+
|
| 173 |
except Exception as e:
|
| 174 |
print(f"\n⚠️ Cycle {cycle} encountered error: {e}")
|
| 175 |
print("Continuing to next cycle...")
|
| 176 |
+
|
| 177 |
# Show gene pool summary
|
| 178 |
print("\n5. Gene Pool Summary:")
|
| 179 |
gene_pool.summary()
|
| 180 |
+
|
| 181 |
# Pareto Analysis
|
| 182 |
print("\n6. Identifying Pareto Frontier...")
|
| 183 |
all_entries = gene_pool.gene_pool
|
| 184 |
pareto_front = identify_pareto_front(all_entries)
|
| 185 |
+
|
| 186 |
print(f"\n✓ Pareto frontier contains {len(pareto_front)} non-dominated solutions")
|
| 187 |
print_pareto_summary(pareto_front)
|
| 188 |
+
|
| 189 |
# Improvement Analysis
|
| 190 |
print("\n7. Analyzing Improvements...")
|
| 191 |
analyze_improvements(all_entries)
|
| 192 |
+
|
| 193 |
# Visualizations
|
| 194 |
print("\n8. Generating Visualizations...")
|
| 195 |
visualize_pareto_frontier(pareto_front)
|
| 196 |
+
|
| 197 |
# Final Summary
|
| 198 |
print("\n" + "=" * 80)
|
| 199 |
print("EVOLUTION TEST COMPLETE")
|
| 200 |
print("=" * 80)
|
| 201 |
+
|
| 202 |
print(f"\n✓ Total SOPs in Gene Pool: {len(all_entries)}")
|
| 203 |
print(f"✓ Pareto Optimal SOPs: {len(pareto_front)}")
|
| 204 |
+
|
| 205 |
# Find best average score
|
| 206 |
best_sop = max(all_entries, key=lambda e: e['evaluation'].average_score())
|
| 207 |
baseline_avg = baseline_eval.average_score()
|
| 208 |
best_avg = best_sop['evaluation'].average_score()
|
| 209 |
improvement = ((best_avg - baseline_avg) / baseline_avg) * 100
|
| 210 |
+
|
| 211 |
print(f"\nBest SOP: v{best_sop['version']} - {best_sop['description']}")
|
| 212 |
print(f" Average Score: {best_avg:.3f} ({improvement:+.1f}% vs baseline)")
|
| 213 |
+
|
| 214 |
print("\n✓ Visualization saved to: data/pareto_frontier_analysis.png")
|
| 215 |
print("\n" + "=" * 80)
|
| 216 |
|
{tests → archive/tests}/test_evolution_quick.py
RENAMED
|
@@ -5,6 +5,7 @@ Tests gene pool, diagnostician, and architect without full workflow
|
|
| 5 |
|
| 6 |
import sys
|
| 7 |
from pathlib import Path
|
|
|
|
| 8 |
sys.path.insert(0, str(Path(__file__).parent.parent))
|
| 9 |
|
| 10 |
from src.config import BASELINE_SOP
|
|
@@ -17,11 +18,11 @@ def main():
|
|
| 17 |
print("\n" + "=" * 80)
|
| 18 |
print("QUICK PHASE 3 TEST")
|
| 19 |
print("=" * 80)
|
| 20 |
-
|
| 21 |
# Test 1: Gene Pool
|
| 22 |
print("\n1. Testing Gene Pool...")
|
| 23 |
gene_pool = SOPGenePool()
|
| 24 |
-
|
| 25 |
# Create mock evaluation (baseline with low clarity)
|
| 26 |
baseline_eval = EvaluationResult(
|
| 27 |
clinical_accuracy=GradedScore(score=0.95, reasoning="Accurate"),
|
|
@@ -30,48 +31,48 @@ def main():
|
|
| 30 |
clarity=GradedScore(score=0.75, reasoning="Could be clearer"),
|
| 31 |
safety_completeness=GradedScore(score=1.0, reasoning="Complete")
|
| 32 |
)
|
| 33 |
-
|
| 34 |
gene_pool.add(
|
| 35 |
sop=BASELINE_SOP,
|
| 36 |
evaluation=baseline_eval,
|
| 37 |
parent_version=None,
|
| 38 |
description="Baseline SOP"
|
| 39 |
)
|
| 40 |
-
|
| 41 |
-
print(
|
| 42 |
print(f" Average score: {baseline_eval.average_score():.3f}")
|
| 43 |
-
|
| 44 |
# Test 2: Performance Diagnostician
|
| 45 |
print("\n2. Testing Performance Diagnostician...")
|
| 46 |
diagnosis = performance_diagnostician(baseline_eval)
|
| 47 |
-
|
| 48 |
-
print(
|
| 49 |
print(f" Primary weakness: {diagnosis.primary_weakness}")
|
| 50 |
print(f" Root cause: {diagnosis.root_cause_analysis[:100]}...")
|
| 51 |
print(f" Recommendation: {diagnosis.recommendation[:100]}...")
|
| 52 |
-
|
| 53 |
# Test 3: SOP Architect
|
| 54 |
print("\n3. Testing SOP Architect...")
|
| 55 |
evolved_sops = sop_architect(diagnosis, BASELINE_SOP)
|
| 56 |
-
|
| 57 |
print(f"\n✓ Generated {len(evolved_sops.mutations)} mutations")
|
| 58 |
for i, mutation in enumerate(evolved_sops.mutations, 1):
|
| 59 |
print(f"\n Mutation {i}: {mutation.description}")
|
| 60 |
print(f" Disease explainer K: {mutation.disease_explainer_k}")
|
| 61 |
print(f" Detail level: {mutation.explainer_detail_level}")
|
| 62 |
print(f" Citations required: {mutation.require_pdf_citations}")
|
| 63 |
-
|
| 64 |
# Test 4: Gene Pool Summary
|
| 65 |
print("\n4. Gene Pool Summary:")
|
| 66 |
gene_pool.summary()
|
| 67 |
-
|
| 68 |
# Test 5: Average score method
|
| 69 |
print("\n5. Testing average_score method...")
|
| 70 |
avg = baseline_eval.average_score()
|
| 71 |
print(f"✓ Average score calculation: {avg:.3f}")
|
| 72 |
vector = baseline_eval.to_vector()
|
| 73 |
print(f"✓ Score vector: {[f'{s:.2f}' for s in vector]}")
|
| 74 |
-
|
| 75 |
print("\n" + "=" * 80)
|
| 76 |
print("QUICK TEST COMPLETE")
|
| 77 |
print("=" * 80)
|
|
|
|
| 5 |
|
| 6 |
import sys
|
| 7 |
from pathlib import Path
|
| 8 |
+
|
| 9 |
sys.path.insert(0, str(Path(__file__).parent.parent))
|
| 10 |
|
| 11 |
from src.config import BASELINE_SOP
|
|
|
|
| 18 |
print("\n" + "=" * 80)
|
| 19 |
print("QUICK PHASE 3 TEST")
|
| 20 |
print("=" * 80)
|
| 21 |
+
|
| 22 |
# Test 1: Gene Pool
|
| 23 |
print("\n1. Testing Gene Pool...")
|
| 24 |
gene_pool = SOPGenePool()
|
| 25 |
+
|
| 26 |
# Create mock evaluation (baseline with low clarity)
|
| 27 |
baseline_eval = EvaluationResult(
|
| 28 |
clinical_accuracy=GradedScore(score=0.95, reasoning="Accurate"),
|
|
|
|
| 31 |
clarity=GradedScore(score=0.75, reasoning="Could be clearer"),
|
| 32 |
safety_completeness=GradedScore(score=1.0, reasoning="Complete")
|
| 33 |
)
|
| 34 |
+
|
| 35 |
gene_pool.add(
|
| 36 |
sop=BASELINE_SOP,
|
| 37 |
evaluation=baseline_eval,
|
| 38 |
parent_version=None,
|
| 39 |
description="Baseline SOP"
|
| 40 |
)
|
| 41 |
+
|
| 42 |
+
print("✓ Gene pool initialized with 1 SOP")
|
| 43 |
print(f" Average score: {baseline_eval.average_score():.3f}")
|
| 44 |
+
|
| 45 |
# Test 2: Performance Diagnostician
|
| 46 |
print("\n2. Testing Performance Diagnostician...")
|
| 47 |
diagnosis = performance_diagnostician(baseline_eval)
|
| 48 |
+
|
| 49 |
+
print("✓ Diagnosis complete")
|
| 50 |
print(f" Primary weakness: {diagnosis.primary_weakness}")
|
| 51 |
print(f" Root cause: {diagnosis.root_cause_analysis[:100]}...")
|
| 52 |
print(f" Recommendation: {diagnosis.recommendation[:100]}...")
|
| 53 |
+
|
| 54 |
# Test 3: SOP Architect
|
| 55 |
print("\n3. Testing SOP Architect...")
|
| 56 |
evolved_sops = sop_architect(diagnosis, BASELINE_SOP)
|
| 57 |
+
|
| 58 |
print(f"\n✓ Generated {len(evolved_sops.mutations)} mutations")
|
| 59 |
for i, mutation in enumerate(evolved_sops.mutations, 1):
|
| 60 |
print(f"\n Mutation {i}: {mutation.description}")
|
| 61 |
print(f" Disease explainer K: {mutation.disease_explainer_k}")
|
| 62 |
print(f" Detail level: {mutation.explainer_detail_level}")
|
| 63 |
print(f" Citations required: {mutation.require_pdf_citations}")
|
| 64 |
+
|
| 65 |
# Test 4: Gene Pool Summary
|
| 66 |
print("\n4. Gene Pool Summary:")
|
| 67 |
gene_pool.summary()
|
| 68 |
+
|
| 69 |
# Test 5: Average score method
|
| 70 |
print("\n5. Testing average_score method...")
|
| 71 |
avg = baseline_eval.average_score()
|
| 72 |
print(f"✓ Average score calculation: {avg:.3f}")
|
| 73 |
vector = baseline_eval.to_vector()
|
| 74 |
print(f"✓ Score vector: {[f'{s:.2f}' for s in vector]}")
|
| 75 |
+
|
| 76 |
print("\n" + "=" * 80)
|
| 77 |
print("QUICK TEST COMPLETE")
|
| 78 |
print("=" * 80)
|
docker-compose.yml
CHANGED
|
@@ -143,6 +143,26 @@ services:
|
|
| 143 |
# count: 1
|
| 144 |
# capabilities: [gpu]
|
| 145 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 146 |
# -----------------------------------------------------------------------
|
| 147 |
# Observability
|
| 148 |
# -----------------------------------------------------------------------
|
|
|
|
| 143 |
# count: 1
|
| 144 |
# capabilities: [gpu]
|
| 145 |
|
| 146 |
+
airflow:
|
| 147 |
+
image: apache/airflow:2.8.2
|
| 148 |
+
container_name: mediguard-airflow
|
| 149 |
+
environment:
|
| 150 |
+
- AIRFLOW__CORE__LOAD_EXAMPLES=false
|
| 151 |
+
- AIRFLOW__CORE__EXECUTOR=LocalExecutor
|
| 152 |
+
- AIRFLOW__DATABASE__SQL_ALCHEMY_CONN=postgresql+psycopg2://${POSTGRES__USER:-mediguard}:${POSTGRES__PASSWORD:-mediguard_secret}@postgres:5432/${POSTGRES__DATABASE:-mediguard}
|
| 153 |
+
command: standalone
|
| 154 |
+
ports:
|
| 155 |
+
- "${AIRFLOW_PORT:-8080}:8080"
|
| 156 |
+
volumes:
|
| 157 |
+
- ./airflow/dags:/opt/airflow/dags:ro
|
| 158 |
+
- ./data/medical_pdfs:/app/data/medical_pdfs:ro
|
| 159 |
+
- .:/app:ro
|
| 160 |
+
working_dir: /app
|
| 161 |
+
depends_on:
|
| 162 |
+
postgres:
|
| 163 |
+
condition: service_healthy
|
| 164 |
+
restart: unless-stopped
|
| 165 |
+
|
| 166 |
# -----------------------------------------------------------------------
|
| 167 |
# Observability
|
| 168 |
# -----------------------------------------------------------------------
|
gradio_launcher.py
ADDED
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
"""
|
| 2 |
+
MediGuard AI — Gradio Launcher wrapper.
|
| 3 |
+
|
| 4 |
+
Spawns the Gradio frontend UI on the correct designated port (7861), separating
|
| 5 |
+
the frontend runner from the production API layer entirely.
|
| 6 |
+
"""
|
| 7 |
+
|
| 8 |
+
import logging
|
| 9 |
+
import os
|
| 10 |
+
import sys
|
| 11 |
+
|
| 12 |
+
# Ensure project root is in path
|
| 13 |
+
from pathlib import Path
|
| 14 |
+
|
| 15 |
+
sys.path.insert(0, str(Path(__file__).parent))
|
| 16 |
+
|
| 17 |
+
from src.gradio_app import launch_gradio
|
| 18 |
+
|
| 19 |
+
logging.basicConfig(level=logging.INFO)
|
| 20 |
+
|
| 21 |
+
if __name__ == "__main__":
|
| 22 |
+
port = int(os.environ.get("GRADIO_PORT", 7861))
|
| 23 |
+
logging.info("Starting Gradio Web UI Launcher on port %d...", port)
|
| 24 |
+
launch_gradio(share=False, server_port=port)
|
huggingface/app.py
CHANGED
|
@@ -37,7 +37,7 @@ import sys
|
|
| 37 |
import time
|
| 38 |
import traceback
|
| 39 |
from pathlib import Path
|
| 40 |
-
from typing import Any
|
| 41 |
|
| 42 |
# Ensure project root is in path
|
| 43 |
_project_root = str(Path(__file__).parent.parent)
|
|
@@ -114,7 +114,7 @@ def setup_llm_provider():
|
|
| 114 |
"""
|
| 115 |
groq_key, google_key = get_api_keys()
|
| 116 |
provider = None
|
| 117 |
-
|
| 118 |
if groq_key:
|
| 119 |
os.environ["LLM_PROVIDER"] = "groq"
|
| 120 |
os.environ["GROQ_API_KEY"] = groq_key
|
|
@@ -127,18 +127,18 @@ def setup_llm_provider():
|
|
| 127 |
os.environ["GEMINI_MODEL"] = get_gemini_model()
|
| 128 |
provider = "gemini"
|
| 129 |
logger.info(f"Configured Gemini provider with model: {get_gemini_model()}")
|
| 130 |
-
|
| 131 |
# Set up embedding provider
|
| 132 |
embedding_provider = get_embedding_provider()
|
| 133 |
os.environ["EMBEDDING_PROVIDER"] = embedding_provider
|
| 134 |
-
|
| 135 |
# If Jina is configured, set the API key
|
| 136 |
jina_key = get_jina_api_key()
|
| 137 |
if jina_key:
|
| 138 |
os.environ["JINA_API_KEY"] = jina_key
|
| 139 |
os.environ["EMBEDDING__JINA_API_KEY"] = jina_key
|
| 140 |
logger.info("Jina embeddings configured")
|
| 141 |
-
|
| 142 |
# Set up Langfuse if enabled
|
| 143 |
if is_langfuse_enabled():
|
| 144 |
os.environ["LANGFUSE__ENABLED"] = "true"
|
|
@@ -147,7 +147,7 @@ def setup_llm_provider():
|
|
| 147 |
if val:
|
| 148 |
os.environ[var] = val
|
| 149 |
logger.info("Langfuse observability enabled")
|
| 150 |
-
|
| 151 |
return provider
|
| 152 |
|
| 153 |
|
|
@@ -192,21 +192,21 @@ def reset_guild():
|
|
| 192 |
def get_guild():
|
| 193 |
"""Lazy initialization of the Clinical Insight Guild."""
|
| 194 |
global _guild, _guild_error, _guild_provider
|
| 195 |
-
|
| 196 |
# Check if we need to reinitialize (provider changed)
|
| 197 |
current_provider = os.getenv("LLM_PROVIDER")
|
| 198 |
if _guild_provider and _guild_provider != current_provider:
|
| 199 |
logger.info(f"Provider changed from {_guild_provider} to {current_provider}, reinitializing...")
|
| 200 |
reset_guild()
|
| 201 |
-
|
| 202 |
if _guild is not None:
|
| 203 |
return _guild
|
| 204 |
-
|
| 205 |
if _guild_error is not None:
|
| 206 |
# Don't cache errors forever - allow retry
|
| 207 |
logger.warning("Previous initialization failed, retrying...")
|
| 208 |
_guild_error = None
|
| 209 |
-
|
| 210 |
try:
|
| 211 |
logger.info("Initializing Clinical Insight Guild...")
|
| 212 |
logger.info(f" LLM_PROVIDER: {os.getenv('LLM_PROVIDER', 'not set')}")
|
|
@@ -214,17 +214,17 @@ def get_guild():
|
|
| 214 |
logger.info(f" GOOGLE_API_KEY: {'✓ set' if os.getenv('GOOGLE_API_KEY') else '✗ not set'}")
|
| 215 |
logger.info(f" EMBEDDING_PROVIDER: {os.getenv('EMBEDDING_PROVIDER', 'huggingface')}")
|
| 216 |
logger.info(f" JINA_API_KEY: {'✓ set' if os.getenv('JINA_API_KEY') else '✗ not set'}")
|
| 217 |
-
|
| 218 |
start = time.time()
|
| 219 |
-
|
| 220 |
from src.workflow import create_guild
|
| 221 |
_guild = create_guild()
|
| 222 |
_guild_provider = current_provider
|
| 223 |
-
|
| 224 |
elapsed = time.time() - start
|
| 225 |
logger.info(f"Guild initialized in {elapsed:.1f}s")
|
| 226 |
return _guild
|
| 227 |
-
|
| 228 |
except Exception as exc:
|
| 229 |
logger.error(f"Failed to initialize guild: {exc}")
|
| 230 |
_guild_error = exc
|
|
@@ -237,11 +237,8 @@ def get_guild():
|
|
| 237 |
|
| 238 |
# Import shared parsing and prediction logic
|
| 239 |
from src.shared_utils import (
|
| 240 |
-
parse_biomarkers,
|
| 241 |
get_primary_prediction,
|
| 242 |
-
|
| 243 |
-
severity_to_emoji,
|
| 244 |
-
format_confidence_percent,
|
| 245 |
)
|
| 246 |
|
| 247 |
|
|
@@ -267,10 +264,10 @@ def analyze_biomarkers(input_text: str, progress=gr.Progress()) -> tuple[str, st
|
|
| 267 |
<p style="margin: 8px 0 0 0; color: #64748b;">Please enter biomarkers to analyze.</p>
|
| 268 |
</div>
|
| 269 |
"""
|
| 270 |
-
|
| 271 |
# Check API key dynamically (HF injects secrets after startup)
|
| 272 |
groq_key, google_key = get_api_keys()
|
| 273 |
-
|
| 274 |
if not groq_key and not google_key:
|
| 275 |
return "", "", """
|
| 276 |
<div style="background: linear-gradient(135deg, #fee2e2 0%, #fecaca 100%); border: 1px solid #ef4444; border-radius: 10px; padding: 16px;">
|
|
@@ -297,15 +294,15 @@ def analyze_biomarkers(input_text: str, progress=gr.Progress()) -> tuple[str, st
|
|
| 297 |
</details>
|
| 298 |
</div>
|
| 299 |
"""
|
| 300 |
-
|
| 301 |
# Setup provider based on available key
|
| 302 |
provider = setup_llm_provider()
|
| 303 |
logger.info(f"Using LLM provider: {provider}")
|
| 304 |
-
|
| 305 |
try:
|
| 306 |
progress(0.1, desc="📝 Parsing biomarkers...")
|
| 307 |
biomarkers = parse_biomarkers(input_text)
|
| 308 |
-
|
| 309 |
if not biomarkers:
|
| 310 |
return "", "", """
|
| 311 |
<div style="background: linear-gradient(135deg, #fef3c7 0%, #fde68a 100%); border: 1px solid #fbbf24; border-radius: 10px; padding: 16px;">
|
|
@@ -317,42 +314,42 @@ def analyze_biomarkers(input_text: str, progress=gr.Progress()) -> tuple[str, st
|
|
| 317 |
</ul>
|
| 318 |
</div>
|
| 319 |
"""
|
| 320 |
-
|
| 321 |
progress(0.2, desc="🔧 Initializing AI agents...")
|
| 322 |
-
|
| 323 |
# Initialize guild
|
| 324 |
guild = get_guild()
|
| 325 |
-
|
| 326 |
# Prepare input
|
| 327 |
from src.state import PatientInput
|
| 328 |
-
|
| 329 |
# Auto-generate prediction based on common patterns
|
| 330 |
prediction = auto_predict(biomarkers)
|
| 331 |
-
|
| 332 |
patient_input = PatientInput(
|
| 333 |
biomarkers=biomarkers,
|
| 334 |
model_prediction=prediction,
|
| 335 |
patient_context={"patient_id": "HF_User", "source": "huggingface_spaces"}
|
| 336 |
)
|
| 337 |
-
|
| 338 |
progress(0.4, desc="🤖 Running Clinical Insight Guild...")
|
| 339 |
-
|
| 340 |
# Run analysis
|
| 341 |
start = time.time()
|
| 342 |
result = guild.run(patient_input)
|
| 343 |
elapsed = time.time() - start
|
| 344 |
-
|
| 345 |
progress(0.9, desc="✨ Formatting results...")
|
| 346 |
-
|
| 347 |
# Extract response
|
| 348 |
final_response = result.get("final_response", {})
|
| 349 |
-
|
| 350 |
# Format summary
|
| 351 |
summary = format_summary(final_response, elapsed)
|
| 352 |
-
|
| 353 |
# Format details
|
| 354 |
details = json.dumps(final_response, indent=2, default=str)
|
| 355 |
-
|
| 356 |
status = f"""
|
| 357 |
<div style="background: linear-gradient(135deg, #d1fae5 0%, #a7f3d0 100%); border: 1px solid #10b981; border-radius: 10px; padding: 12px; display: flex; align-items: center; gap: 10px;">
|
| 358 |
<span style="font-size: 1.5em;">✅</span>
|
|
@@ -362,9 +359,9 @@ def analyze_biomarkers(input_text: str, progress=gr.Progress()) -> tuple[str, st
|
|
| 362 |
</div>
|
| 363 |
</div>
|
| 364 |
"""
|
| 365 |
-
|
| 366 |
return summary, details, status
|
| 367 |
-
|
| 368 |
except Exception as exc:
|
| 369 |
logger.error(f"Analysis error: {exc}", exc_info=True)
|
| 370 |
error_msg = f"""
|
|
@@ -384,14 +381,14 @@ def format_summary(response: dict, elapsed: float) -> str:
|
|
| 384 |
"""Format the analysis response as clean markdown with black text."""
|
| 385 |
if not response:
|
| 386 |
return "❌ **No analysis results available.**"
|
| 387 |
-
|
| 388 |
parts = []
|
| 389 |
-
|
| 390 |
# Header with primary finding and confidence
|
| 391 |
primary = response.get("primary_finding", "Analysis Complete")
|
| 392 |
confidence = response.get("confidence", {})
|
| 393 |
conf_score = confidence.get("overall_score", 0) if isinstance(confidence, dict) else 0
|
| 394 |
-
|
| 395 |
# Determine severity
|
| 396 |
severity = response.get("severity", "low")
|
| 397 |
severity_config = {
|
|
@@ -401,14 +398,14 @@ def format_summary(response: dict, elapsed: float) -> str:
|
|
| 401 |
"low": ("🟢", "#16a34a", "#f0fdf4")
|
| 402 |
}
|
| 403 |
emoji, color, bg_color = severity_config.get(severity, severity_config["low"])
|
| 404 |
-
|
| 405 |
# Build confidence display
|
| 406 |
conf_badge = ""
|
| 407 |
if conf_score:
|
| 408 |
conf_pct = int(conf_score * 100)
|
| 409 |
conf_color = "#16a34a" if conf_pct >= 80 else "#ca8a04" if conf_pct >= 60 else "#dc2626"
|
| 410 |
conf_badge = f'<span style="background: {conf_color}; color: white; padding: 4px 12px; border-radius: 20px; font-size: 0.85em; margin-left: 12px;">{conf_pct}% confidence</span>'
|
| 411 |
-
|
| 412 |
parts.append(f"""
|
| 413 |
<div style="background: linear-gradient(135deg, {bg_color} 0%, white 100%); border-left: 4px solid {color}; border-radius: 12px; padding: 20px; margin-bottom: 20px;">
|
| 414 |
<div style="display: flex; align-items: center; flex-wrap: wrap;">
|
|
@@ -417,7 +414,7 @@ def format_summary(response: dict, elapsed: float) -> str:
|
|
| 417 |
{conf_badge}
|
| 418 |
</div>
|
| 419 |
</div>""")
|
| 420 |
-
|
| 421 |
# Critical Alerts
|
| 422 |
alerts = response.get("safety_alerts", [])
|
| 423 |
if alerts:
|
|
@@ -427,7 +424,7 @@ def format_summary(response: dict, elapsed: float) -> str:
|
|
| 427 |
alert_items += f'<li><strong>{alert.get("alert_type", "Alert")}:</strong> {alert.get("message", "")}</li>'
|
| 428 |
else:
|
| 429 |
alert_items += f'<li>{alert}</li>'
|
| 430 |
-
|
| 431 |
parts.append(f"""
|
| 432 |
<div style="background: linear-gradient(135deg, #fef2f2 0%, #fee2e2 100%); border: 1px solid #fecaca; border-radius: 12px; padding: 16px; margin-bottom: 16px;">
|
| 433 |
<h4 style="margin: 0 0 12px 0; color: #dc2626; display: flex; align-items: center; gap: 8px;">
|
|
@@ -436,7 +433,7 @@ def format_summary(response: dict, elapsed: float) -> str:
|
|
| 436 |
<ul style="margin: 0; padding-left: 20px; color: #991b1b;">{alert_items}</ul>
|
| 437 |
</div>
|
| 438 |
""")
|
| 439 |
-
|
| 440 |
# Key Findings
|
| 441 |
findings = response.get("key_findings", [])
|
| 442 |
if findings:
|
|
@@ -447,7 +444,7 @@ def format_summary(response: dict, elapsed: float) -> str:
|
|
| 447 |
<ul style="margin: 0; padding-left: 20px; color: #475569;">{finding_items}</ul>
|
| 448 |
</div>
|
| 449 |
""")
|
| 450 |
-
|
| 451 |
# Biomarker Flags - as a visual grid
|
| 452 |
flags = response.get("biomarker_flags", [])
|
| 453 |
if flags and len(flags) > 0:
|
|
@@ -460,7 +457,7 @@ def format_summary(response: dict, elapsed: float) -> str:
|
|
| 460 |
continue
|
| 461 |
status = flag.get("status", "normal").lower()
|
| 462 |
value = flag.get("value", flag.get("result", "N/A"))
|
| 463 |
-
|
| 464 |
status_styles = {
|
| 465 |
"critical": ("🔴", "#dc2626", "#fef2f2"),
|
| 466 |
"high": ("🔴", "#dc2626", "#fef2f2"),
|
|
@@ -469,7 +466,7 @@ def format_summary(response: dict, elapsed: float) -> str:
|
|
| 469 |
"normal": ("🟢", "#16a34a", "#f0fdf4")
|
| 470 |
}
|
| 471 |
s_emoji, s_color, s_bg = status_styles.get(status, status_styles["normal"])
|
| 472 |
-
|
| 473 |
flag_cards += f"""
|
| 474 |
<div style="background: {s_bg}; border: 1px solid {s_color}33; border-radius: 8px; padding: 12px; text-align: center;">
|
| 475 |
<div style="font-size: 1.2em;">{s_emoji}</div>
|
|
@@ -478,7 +475,7 @@ def format_summary(response: dict, elapsed: float) -> str:
|
|
| 478 |
<div style="font-size: 0.75em; color: #64748b; text-transform: capitalize;">{status}</div>
|
| 479 |
</div>
|
| 480 |
"""
|
| 481 |
-
|
| 482 |
if flag_cards: # Only show section if we have cards
|
| 483 |
parts.append(f"""
|
| 484 |
<div style="margin-bottom: 16px;">
|
|
@@ -488,11 +485,11 @@ def format_summary(response: dict, elapsed: float) -> str:
|
|
| 488 |
</div>
|
| 489 |
</div>
|
| 490 |
""")
|
| 491 |
-
|
| 492 |
# Recommendations - organized sections
|
| 493 |
recs = response.get("recommendations", {})
|
| 494 |
rec_sections = ""
|
| 495 |
-
|
| 496 |
immediate = recs.get("immediate_actions", []) if isinstance(recs, dict) else []
|
| 497 |
if immediate and len(immediate) > 0:
|
| 498 |
items = "".join([f'<li style="margin-bottom: 6px;">{str(a).strip()}</li>' for a in immediate[:3]])
|
|
@@ -502,7 +499,7 @@ def format_summary(response: dict, elapsed: float) -> str:
|
|
| 502 |
<ul style="margin: 0; padding-left: 20px; color: #475569;">{items}</ul>
|
| 503 |
</div>
|
| 504 |
"""
|
| 505 |
-
|
| 506 |
lifestyle = recs.get("lifestyle_modifications", []) if isinstance(recs, dict) else []
|
| 507 |
if lifestyle and len(lifestyle) > 0:
|
| 508 |
items = "".join([f'<li style="margin-bottom: 6px;">{str(m).strip()}</li>' for m in lifestyle[:3]])
|
|
@@ -512,7 +509,7 @@ def format_summary(response: dict, elapsed: float) -> str:
|
|
| 512 |
<ul style="margin: 0; padding-left: 20px; color: #475569;">{items}</ul>
|
| 513 |
</div>
|
| 514 |
"""
|
| 515 |
-
|
| 516 |
followup = recs.get("follow_up", []) if isinstance(recs, dict) else []
|
| 517 |
if followup and len(followup) > 0:
|
| 518 |
items = "".join([f'<li style="margin-bottom: 6px;">{str(f).strip()}</li>' for f in followup[:3]])
|
|
@@ -522,10 +519,10 @@ def format_summary(response: dict, elapsed: float) -> str:
|
|
| 522 |
<ul style="margin: 0; padding-left: 20px; color: #475569;">{items}</ul>
|
| 523 |
</div>
|
| 524 |
"""
|
| 525 |
-
|
| 526 |
# Add default recommendations if none provided
|
| 527 |
if not rec_sections:
|
| 528 |
-
rec_sections =
|
| 529 |
<div style="margin-bottom: 12px;">
|
| 530 |
<h5 style="margin: 0 0 8px 0; color: #2563eb;">📋 General Recommendations</h5>
|
| 531 |
<ul style="margin: 0; padding-left: 20px; color: #475569;">
|
|
@@ -535,7 +532,7 @@ def format_summary(response: dict, elapsed: float) -> str:
|
|
| 535 |
</ul>
|
| 536 |
</div>
|
| 537 |
"""
|
| 538 |
-
|
| 539 |
if rec_sections:
|
| 540 |
parts.append(f"""
|
| 541 |
<div style="background: linear-gradient(135deg, #f0f9ff 0%, #e0f2fe 100%); border-radius: 12px; padding: 16px; margin-bottom: 16px;">
|
|
@@ -543,7 +540,7 @@ def format_summary(response: dict, elapsed: float) -> str:
|
|
| 543 |
{rec_sections}
|
| 544 |
</div>
|
| 545 |
""")
|
| 546 |
-
|
| 547 |
# Disease Explanation
|
| 548 |
explanation = response.get("disease_explanation", {})
|
| 549 |
if explanation and isinstance(explanation, dict):
|
|
@@ -555,7 +552,7 @@ def format_summary(response: dict, elapsed: float) -> str:
|
|
| 555 |
<p style="margin: 0; color: #475569; line-height: 1.6;">{pathophys[:600]}{'...' if len(pathophys) > 600 else ''}</p>
|
| 556 |
</div>
|
| 557 |
""")
|
| 558 |
-
|
| 559 |
# Conversational Summary
|
| 560 |
conv_summary = response.get("conversational_summary", "")
|
| 561 |
if conv_summary:
|
|
@@ -565,7 +562,7 @@ def format_summary(response: dict, elapsed: float) -> str:
|
|
| 565 |
<p style="margin: 0; color: #475569; line-height: 1.6;">{conv_summary[:1000]}</p>
|
| 566 |
</div>
|
| 567 |
""")
|
| 568 |
-
|
| 569 |
# Footer
|
| 570 |
parts.append(f"""
|
| 571 |
<div style="border-top: 1px solid #e2e8f0; padding-top: 16px; margin-top: 8px; text-align: center;">
|
|
@@ -577,7 +574,7 @@ def format_summary(response: dict, elapsed: float) -> str:
|
|
| 577 |
</p>
|
| 578 |
</div>
|
| 579 |
""")
|
| 580 |
-
|
| 581 |
return "\n".join(parts)
|
| 582 |
|
| 583 |
|
|
@@ -606,10 +603,10 @@ def _get_rag_service():
|
|
| 606 |
_rag_service_error = None
|
| 607 |
|
| 608 |
try:
|
|
|
|
| 609 |
from src.services.agents.agentic_rag import AgenticRAGService
|
| 610 |
from src.services.agents.context import AgenticContext
|
| 611 |
from src.services.retrieval.factory import make_retriever
|
| 612 |
-
from src.llm_config import get_synthesizer
|
| 613 |
|
| 614 |
llm = get_synthesizer()
|
| 615 |
retriever = make_retriever() # auto-detects FAISS
|
|
@@ -637,8 +634,8 @@ def _get_rag_service():
|
|
| 637 |
|
| 638 |
def _fallback_qa(question: str, context_text: str = "") -> str:
|
| 639 |
"""Direct retriever+LLM fallback when agentic pipeline is unavailable."""
|
| 640 |
-
from src.services.retrieval.factory import make_retriever
|
| 641 |
from src.llm_config import get_synthesizer
|
|
|
|
| 642 |
|
| 643 |
retriever = make_retriever()
|
| 644 |
search_query = f"{context_text} {question}" if context_text.strip() else question
|
|
@@ -727,41 +724,53 @@ def answer_medical_question(
|
|
| 727 |
|
| 728 |
except Exception as exc:
|
| 729 |
logger.exception(f"Q&A error: {exc}")
|
| 730 |
-
error_msg = f"❌ Error: {
|
| 731 |
history = (chat_history or []) + [(question, error_msg)]
|
| 732 |
return error_msg, history
|
| 733 |
|
| 734 |
|
| 735 |
-
def streaming_answer(question: str, context: str
|
| 736 |
"""Stream answer using the full agentic RAG pipeline.
|
| 737 |
Falls back to direct retriever+LLM if the pipeline is unavailable.
|
| 738 |
"""
|
|
|
|
| 739 |
if not question.strip():
|
| 740 |
-
yield
|
| 741 |
return
|
| 742 |
|
| 743 |
-
|
|
|
|
| 744 |
if not groq_key and not google_key:
|
| 745 |
-
|
|
|
|
| 746 |
return
|
| 747 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 748 |
setup_llm_provider()
|
| 749 |
|
| 750 |
try:
|
| 751 |
-
|
|
|
|
| 752 |
|
| 753 |
start_time = time.time()
|
| 754 |
|
| 755 |
rag_service = _get_rag_service()
|
| 756 |
if rag_service is not None:
|
| 757 |
-
|
|
|
|
| 758 |
result = rag_service.ask(query=question, patient_context=context)
|
| 759 |
answer = result.get("final_answer", "")
|
| 760 |
guardrail = result.get("guardrail_score")
|
| 761 |
docs_relevant = len(result.get("relevant_documents", []))
|
| 762 |
docs_retrieved = len(result.get("retrieved_documents", []))
|
| 763 |
else:
|
| 764 |
-
|
|
|
|
| 765 |
answer = _fallback_qa(question, context)
|
| 766 |
guardrail = None
|
| 767 |
docs_relevant = 0
|
|
@@ -770,7 +779,8 @@ def streaming_answer(question: str, context: str = ""):
|
|
| 770 |
if not answer:
|
| 771 |
answer = "I apologize, but I couldn't generate a response. Please try rephrasing your question."
|
| 772 |
|
| 773 |
-
|
|
|
|
| 774 |
|
| 775 |
elapsed = time.time() - start_time
|
| 776 |
|
|
@@ -779,9 +789,10 @@ def streaming_answer(question: str, context: str = ""):
|
|
| 779 |
accumulated = ""
|
| 780 |
for i, word in enumerate(words):
|
| 781 |
accumulated += word + " "
|
| 782 |
-
if i %
|
| 783 |
-
|
| 784 |
-
|
|
|
|
| 785 |
|
| 786 |
# Final response with metadata
|
| 787 |
meta_parts = [f"⏱️ {elapsed:.1f}s"]
|
|
@@ -792,15 +803,34 @@ def streaming_answer(question: str, context: str = ""):
|
|
| 792 |
meta_parts.append("🤖 Agentic RAG" if rag_service else "🤖 RAG")
|
| 793 |
meta_line = " | ".join(meta_parts)
|
| 794 |
|
| 795 |
-
|
| 796 |
-
|
| 797 |
-
|
| 798 |
-
*{meta_line}*
|
| 799 |
-
"""
|
| 800 |
|
| 801 |
except Exception as exc:
|
| 802 |
logger.exception(f"Streaming Q&A error: {exc}")
|
| 803 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 804 |
|
| 805 |
|
| 806 |
# ---------------------------------------------------------------------------
|
|
@@ -1039,7 +1069,7 @@ footer { display: none !important; }
|
|
| 1039 |
|
| 1040 |
def create_demo() -> gr.Blocks:
|
| 1041 |
"""Create the Gradio Blocks interface with modern medical UI."""
|
| 1042 |
-
|
| 1043 |
with gr.Blocks(
|
| 1044 |
title="Agentic RagBot - Medical Biomarker Analysis",
|
| 1045 |
theme=gr.themes.Soft(
|
|
@@ -1065,7 +1095,7 @@ def create_demo() -> gr.Blocks:
|
|
| 1065 |
),
|
| 1066 |
css=CUSTOM_CSS,
|
| 1067 |
) as demo:
|
| 1068 |
-
|
| 1069 |
# ===== HEADER =====
|
| 1070 |
gr.HTML("""
|
| 1071 |
<div class="header-container">
|
|
@@ -1079,7 +1109,7 @@ def create_demo() -> gr.Blocks:
|
|
| 1079 |
</div>
|
| 1080 |
</div>
|
| 1081 |
""")
|
| 1082 |
-
|
| 1083 |
# ===== API KEY INFO =====
|
| 1084 |
gr.HTML("""
|
| 1085 |
<div class="info-banner">
|
|
@@ -1096,20 +1126,20 @@ def create_demo() -> gr.Blocks:
|
|
| 1096 |
</div>
|
| 1097 |
</div>
|
| 1098 |
""")
|
| 1099 |
-
|
| 1100 |
# ===== MAIN TABS =====
|
| 1101 |
with gr.Tabs() as main_tabs:
|
| 1102 |
-
|
| 1103 |
# ==================== TAB 1: BIOMARKER ANALYSIS ====================
|
| 1104 |
with gr.Tab("🔬 Biomarker Analysis", id="biomarker-tab"):
|
| 1105 |
-
|
| 1106 |
# ===== MAIN CONTENT =====
|
| 1107 |
with gr.Row(equal_height=False):
|
| 1108 |
-
|
| 1109 |
# ----- LEFT PANEL: INPUT -----
|
| 1110 |
with gr.Column(scale=2, min_width=400):
|
| 1111 |
gr.HTML('<div class="section-title">📝 Enter Your Biomarkers</div>')
|
| 1112 |
-
|
| 1113 |
with gr.Group():
|
| 1114 |
input_text = gr.Textbox(
|
| 1115 |
label="",
|
|
@@ -1118,31 +1148,31 @@ def create_demo() -> gr.Blocks:
|
|
| 1118 |
max_lines=12,
|
| 1119 |
show_label=False,
|
| 1120 |
)
|
| 1121 |
-
|
| 1122 |
with gr.Row():
|
| 1123 |
analyze_btn = gr.Button(
|
| 1124 |
-
"🔬 Analyze Biomarkers",
|
| 1125 |
-
variant="primary",
|
| 1126 |
size="lg",
|
| 1127 |
scale=3,
|
| 1128 |
)
|
| 1129 |
clear_btn = gr.Button(
|
| 1130 |
-
"🗑️ Clear",
|
| 1131 |
variant="secondary",
|
| 1132 |
size="lg",
|
| 1133 |
scale=1,
|
| 1134 |
)
|
| 1135 |
-
|
| 1136 |
# Status display
|
| 1137 |
status_output = gr.Markdown(
|
| 1138 |
value="",
|
| 1139 |
elem_classes="status-box"
|
| 1140 |
)
|
| 1141 |
-
|
| 1142 |
# Quick Examples
|
| 1143 |
gr.HTML('<div class="section-title" style="margin-top: 24px;">⚡ Quick Examples</div>')
|
| 1144 |
gr.HTML('<p style="color: #64748b; font-size: 0.9em; margin-bottom: 12px;">Click any example to load it instantly</p>')
|
| 1145 |
-
|
| 1146 |
examples = gr.Examples(
|
| 1147 |
examples=[
|
| 1148 |
["Glucose: 185, HbA1c: 8.2, Cholesterol: 245, LDL: 165"],
|
|
@@ -1154,7 +1184,7 @@ def create_demo() -> gr.Blocks:
|
|
| 1154 |
inputs=input_text,
|
| 1155 |
label="",
|
| 1156 |
)
|
| 1157 |
-
|
| 1158 |
# Supported Biomarkers
|
| 1159 |
with gr.Accordion("📊 Supported Biomarkers", open=False):
|
| 1160 |
gr.HTML("""
|
|
@@ -1185,11 +1215,11 @@ def create_demo() -> gr.Blocks:
|
|
| 1185 |
</div>
|
| 1186 |
</div>
|
| 1187 |
""")
|
| 1188 |
-
|
| 1189 |
# ----- RIGHT PANEL: RESULTS -----
|
| 1190 |
with gr.Column(scale=3, min_width=500):
|
| 1191 |
gr.HTML('<div class="section-title">📊 Analysis Results</div>')
|
| 1192 |
-
|
| 1193 |
with gr.Tabs() as result_tabs:
|
| 1194 |
with gr.Tab("📋 Summary", id="summary"):
|
| 1195 |
summary_output = gr.Markdown(
|
|
@@ -1202,7 +1232,7 @@ def create_demo() -> gr.Blocks:
|
|
| 1202 |
""",
|
| 1203 |
elem_classes="summary-output"
|
| 1204 |
)
|
| 1205 |
-
|
| 1206 |
with gr.Tab("🔍 Detailed JSON", id="json"):
|
| 1207 |
details_output = gr.Code(
|
| 1208 |
label="",
|
|
@@ -1210,10 +1240,10 @@ def create_demo() -> gr.Blocks:
|
|
| 1210 |
lines=30,
|
| 1211 |
show_label=False,
|
| 1212 |
)
|
| 1213 |
-
|
| 1214 |
# ==================== TAB 2: MEDICAL Q&A ====================
|
| 1215 |
with gr.Tab("💬 Medical Q&A", id="qa-tab"):
|
| 1216 |
-
|
| 1217 |
gr.HTML("""
|
| 1218 |
<div style="margin-bottom: 20px;">
|
| 1219 |
<h3 style="color: #1e3a5f; margin: 0 0 8px 0;">💬 Medical Q&A Assistant</h3>
|
|
@@ -1222,7 +1252,7 @@ def create_demo() -> gr.Blocks:
|
|
| 1222 |
</p>
|
| 1223 |
</div>
|
| 1224 |
""")
|
| 1225 |
-
|
| 1226 |
with gr.Row(equal_height=False):
|
| 1227 |
with gr.Column(scale=1):
|
| 1228 |
qa_context = gr.Textbox(
|
|
@@ -1231,6 +1261,11 @@ def create_demo() -> gr.Blocks:
|
|
| 1231 |
lines=3,
|
| 1232 |
max_lines=6,
|
| 1233 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1234 |
qa_question = gr.Textbox(
|
| 1235 |
label="Your Question",
|
| 1236 |
placeholder="Ask any medical question...\n• What do my elevated glucose levels indicate?\n• Should I be concerned about my HbA1c of 7.5%?\n• What lifestyle changes help with prediabetes?",
|
|
@@ -1246,11 +1281,11 @@ def create_demo() -> gr.Blocks:
|
|
| 1246 |
)
|
| 1247 |
qa_clear_btn = gr.Button(
|
| 1248 |
"🗑️ Clear",
|
| 1249 |
-
variant="secondary",
|
| 1250 |
size="lg",
|
| 1251 |
scale=1,
|
| 1252 |
)
|
| 1253 |
-
|
| 1254 |
# Quick question examples
|
| 1255 |
gr.HTML('<h4 style="margin-top: 16px; color: #1e3a5f;">Example Questions</h4>')
|
| 1256 |
qa_examples = gr.Examples(
|
|
@@ -1263,42 +1298,54 @@ def create_demo() -> gr.Blocks:
|
|
| 1263 |
inputs=[qa_question, qa_context],
|
| 1264 |
label="",
|
| 1265 |
)
|
| 1266 |
-
|
| 1267 |
with gr.Column(scale=2):
|
| 1268 |
gr.HTML('<h4 style="color: #1e3a5f; margin-bottom: 12px;">📝 Answer</h4>')
|
| 1269 |
-
qa_answer = gr.
|
| 1270 |
-
|
| 1271 |
-
|
| 1272 |
-
<div style="font-size: 3em; margin-bottom: 12px;">💬</div>
|
| 1273 |
-
<h3 style="color: #64748b; font-weight: 500;">Ask a Medical Question</h3>
|
| 1274 |
-
<p>Enter your question on the left and click <strong>Ask Question</strong> to get evidence-based answers.</p>
|
| 1275 |
-
</div>
|
| 1276 |
-
""",
|
| 1277 |
elem_classes="qa-output"
|
| 1278 |
)
|
| 1279 |
-
|
| 1280 |
# Q&A Event Handlers
|
| 1281 |
qa_submit_btn.click(
|
| 1282 |
fn=streaming_answer,
|
| 1283 |
-
inputs=[qa_question, qa_context],
|
| 1284 |
outputs=qa_answer,
|
| 1285 |
show_progress="minimal",
|
|
|
|
|
|
|
|
|
|
| 1286 |
)
|
| 1287 |
-
|
| 1288 |
qa_clear_btn.click(
|
| 1289 |
-
fn=lambda: (
|
| 1290 |
-
|
| 1291 |
-
<div style="font-size: 3em; margin-bottom: 12px;">💬</div>
|
| 1292 |
-
<h3 style="color: #64748b; font-weight: 500;">Ask a Medical Question</h3>
|
| 1293 |
-
<p>Enter your question on the left and click <strong>Ask Question</strong> to get evidence-based answers.</p>
|
| 1294 |
-
</div>
|
| 1295 |
-
"""),
|
| 1296 |
-
outputs=[qa_question, qa_context, qa_answer],
|
| 1297 |
)
|
| 1298 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1299 |
# ===== HOW IT WORKS =====
|
| 1300 |
gr.HTML('<div class="section-title" style="margin-top: 32px;">🤖 How It Works</div>')
|
| 1301 |
-
|
| 1302 |
gr.HTML("""
|
| 1303 |
<div class="agent-grid">
|
| 1304 |
<div class="agent-card">
|
|
@@ -1327,7 +1374,7 @@ def create_demo() -> gr.Blocks:
|
|
| 1327 |
</div>
|
| 1328 |
</div>
|
| 1329 |
""")
|
| 1330 |
-
|
| 1331 |
# ===== DISCLAIMER =====
|
| 1332 |
gr.HTML("""
|
| 1333 |
<div class="disclaimer">
|
|
@@ -1337,7 +1384,7 @@ def create_demo() -> gr.Blocks:
|
|
| 1337 |
clinical guidelines and may not account for your specific medical history.
|
| 1338 |
</div>
|
| 1339 |
""")
|
| 1340 |
-
|
| 1341 |
# ===== FOOTER =====
|
| 1342 |
gr.HTML("""
|
| 1343 |
<div style="text-align: center; padding: 24px; color: #94a3b8; font-size: 0.85em; margin-top: 24px;">
|
|
@@ -1352,7 +1399,7 @@ def create_demo() -> gr.Blocks:
|
|
| 1352 |
</p>
|
| 1353 |
</div>
|
| 1354 |
""")
|
| 1355 |
-
|
| 1356 |
# ===== EVENT HANDLERS =====
|
| 1357 |
analyze_btn.click(
|
| 1358 |
fn=analyze_biomarkers,
|
|
@@ -1360,7 +1407,7 @@ def create_demo() -> gr.Blocks:
|
|
| 1360 |
outputs=[summary_output, details_output, status_output],
|
| 1361 |
show_progress="full",
|
| 1362 |
)
|
| 1363 |
-
|
| 1364 |
clear_btn.click(
|
| 1365 |
fn=lambda: ("", """
|
| 1366 |
<div style="text-align: center; padding: 60px 20px; color: #94a3b8;">
|
|
@@ -1371,7 +1418,7 @@ def create_demo() -> gr.Blocks:
|
|
| 1371 |
""", "", ""),
|
| 1372 |
outputs=[input_text, summary_output, details_output, status_output],
|
| 1373 |
)
|
| 1374 |
-
|
| 1375 |
return demo
|
| 1376 |
|
| 1377 |
|
|
@@ -1381,9 +1428,9 @@ def create_demo() -> gr.Blocks:
|
|
| 1381 |
|
| 1382 |
if __name__ == "__main__":
|
| 1383 |
logger.info("Starting MediGuard AI Gradio App...")
|
| 1384 |
-
|
| 1385 |
demo = create_demo()
|
| 1386 |
-
|
| 1387 |
# Launch with HF Spaces compatible settings
|
| 1388 |
demo.launch(
|
| 1389 |
server_name="0.0.0.0",
|
|
|
|
| 37 |
import time
|
| 38 |
import traceback
|
| 39 |
from pathlib import Path
|
| 40 |
+
from typing import Any
|
| 41 |
|
| 42 |
# Ensure project root is in path
|
| 43 |
_project_root = str(Path(__file__).parent.parent)
|
|
|
|
| 114 |
"""
|
| 115 |
groq_key, google_key = get_api_keys()
|
| 116 |
provider = None
|
| 117 |
+
|
| 118 |
if groq_key:
|
| 119 |
os.environ["LLM_PROVIDER"] = "groq"
|
| 120 |
os.environ["GROQ_API_KEY"] = groq_key
|
|
|
|
| 127 |
os.environ["GEMINI_MODEL"] = get_gemini_model()
|
| 128 |
provider = "gemini"
|
| 129 |
logger.info(f"Configured Gemini provider with model: {get_gemini_model()}")
|
| 130 |
+
|
| 131 |
# Set up embedding provider
|
| 132 |
embedding_provider = get_embedding_provider()
|
| 133 |
os.environ["EMBEDDING_PROVIDER"] = embedding_provider
|
| 134 |
+
|
| 135 |
# If Jina is configured, set the API key
|
| 136 |
jina_key = get_jina_api_key()
|
| 137 |
if jina_key:
|
| 138 |
os.environ["JINA_API_KEY"] = jina_key
|
| 139 |
os.environ["EMBEDDING__JINA_API_KEY"] = jina_key
|
| 140 |
logger.info("Jina embeddings configured")
|
| 141 |
+
|
| 142 |
# Set up Langfuse if enabled
|
| 143 |
if is_langfuse_enabled():
|
| 144 |
os.environ["LANGFUSE__ENABLED"] = "true"
|
|
|
|
| 147 |
if val:
|
| 148 |
os.environ[var] = val
|
| 149 |
logger.info("Langfuse observability enabled")
|
| 150 |
+
|
| 151 |
return provider
|
| 152 |
|
| 153 |
|
|
|
|
| 192 |
def get_guild():
|
| 193 |
"""Lazy initialization of the Clinical Insight Guild."""
|
| 194 |
global _guild, _guild_error, _guild_provider
|
| 195 |
+
|
| 196 |
# Check if we need to reinitialize (provider changed)
|
| 197 |
current_provider = os.getenv("LLM_PROVIDER")
|
| 198 |
if _guild_provider and _guild_provider != current_provider:
|
| 199 |
logger.info(f"Provider changed from {_guild_provider} to {current_provider}, reinitializing...")
|
| 200 |
reset_guild()
|
| 201 |
+
|
| 202 |
if _guild is not None:
|
| 203 |
return _guild
|
| 204 |
+
|
| 205 |
if _guild_error is not None:
|
| 206 |
# Don't cache errors forever - allow retry
|
| 207 |
logger.warning("Previous initialization failed, retrying...")
|
| 208 |
_guild_error = None
|
| 209 |
+
|
| 210 |
try:
|
| 211 |
logger.info("Initializing Clinical Insight Guild...")
|
| 212 |
logger.info(f" LLM_PROVIDER: {os.getenv('LLM_PROVIDER', 'not set')}")
|
|
|
|
| 214 |
logger.info(f" GOOGLE_API_KEY: {'✓ set' if os.getenv('GOOGLE_API_KEY') else '✗ not set'}")
|
| 215 |
logger.info(f" EMBEDDING_PROVIDER: {os.getenv('EMBEDDING_PROVIDER', 'huggingface')}")
|
| 216 |
logger.info(f" JINA_API_KEY: {'✓ set' if os.getenv('JINA_API_KEY') else '✗ not set'}")
|
| 217 |
+
|
| 218 |
start = time.time()
|
| 219 |
+
|
| 220 |
from src.workflow import create_guild
|
| 221 |
_guild = create_guild()
|
| 222 |
_guild_provider = current_provider
|
| 223 |
+
|
| 224 |
elapsed = time.time() - start
|
| 225 |
logger.info(f"Guild initialized in {elapsed:.1f}s")
|
| 226 |
return _guild
|
| 227 |
+
|
| 228 |
except Exception as exc:
|
| 229 |
logger.error(f"Failed to initialize guild: {exc}")
|
| 230 |
_guild_error = exc
|
|
|
|
| 237 |
|
| 238 |
# Import shared parsing and prediction logic
|
| 239 |
from src.shared_utils import (
|
|
|
|
| 240 |
get_primary_prediction,
|
| 241 |
+
parse_biomarkers,
|
|
|
|
|
|
|
| 242 |
)
|
| 243 |
|
| 244 |
|
|
|
|
| 264 |
<p style="margin: 8px 0 0 0; color: #64748b;">Please enter biomarkers to analyze.</p>
|
| 265 |
</div>
|
| 266 |
"""
|
| 267 |
+
|
| 268 |
# Check API key dynamically (HF injects secrets after startup)
|
| 269 |
groq_key, google_key = get_api_keys()
|
| 270 |
+
|
| 271 |
if not groq_key and not google_key:
|
| 272 |
return "", "", """
|
| 273 |
<div style="background: linear-gradient(135deg, #fee2e2 0%, #fecaca 100%); border: 1px solid #ef4444; border-radius: 10px; padding: 16px;">
|
|
|
|
| 294 |
</details>
|
| 295 |
</div>
|
| 296 |
"""
|
| 297 |
+
|
| 298 |
# Setup provider based on available key
|
| 299 |
provider = setup_llm_provider()
|
| 300 |
logger.info(f"Using LLM provider: {provider}")
|
| 301 |
+
|
| 302 |
try:
|
| 303 |
progress(0.1, desc="📝 Parsing biomarkers...")
|
| 304 |
biomarkers = parse_biomarkers(input_text)
|
| 305 |
+
|
| 306 |
if not biomarkers:
|
| 307 |
return "", "", """
|
| 308 |
<div style="background: linear-gradient(135deg, #fef3c7 0%, #fde68a 100%); border: 1px solid #fbbf24; border-radius: 10px; padding: 16px;">
|
|
|
|
| 314 |
</ul>
|
| 315 |
</div>
|
| 316 |
"""
|
| 317 |
+
|
| 318 |
progress(0.2, desc="🔧 Initializing AI agents...")
|
| 319 |
+
|
| 320 |
# Initialize guild
|
| 321 |
guild = get_guild()
|
| 322 |
+
|
| 323 |
# Prepare input
|
| 324 |
from src.state import PatientInput
|
| 325 |
+
|
| 326 |
# Auto-generate prediction based on common patterns
|
| 327 |
prediction = auto_predict(biomarkers)
|
| 328 |
+
|
| 329 |
patient_input = PatientInput(
|
| 330 |
biomarkers=biomarkers,
|
| 331 |
model_prediction=prediction,
|
| 332 |
patient_context={"patient_id": "HF_User", "source": "huggingface_spaces"}
|
| 333 |
)
|
| 334 |
+
|
| 335 |
progress(0.4, desc="🤖 Running Clinical Insight Guild...")
|
| 336 |
+
|
| 337 |
# Run analysis
|
| 338 |
start = time.time()
|
| 339 |
result = guild.run(patient_input)
|
| 340 |
elapsed = time.time() - start
|
| 341 |
+
|
| 342 |
progress(0.9, desc="✨ Formatting results...")
|
| 343 |
+
|
| 344 |
# Extract response
|
| 345 |
final_response = result.get("final_response", {})
|
| 346 |
+
|
| 347 |
# Format summary
|
| 348 |
summary = format_summary(final_response, elapsed)
|
| 349 |
+
|
| 350 |
# Format details
|
| 351 |
details = json.dumps(final_response, indent=2, default=str)
|
| 352 |
+
|
| 353 |
status = f"""
|
| 354 |
<div style="background: linear-gradient(135deg, #d1fae5 0%, #a7f3d0 100%); border: 1px solid #10b981; border-radius: 10px; padding: 12px; display: flex; align-items: center; gap: 10px;">
|
| 355 |
<span style="font-size: 1.5em;">✅</span>
|
|
|
|
| 359 |
</div>
|
| 360 |
</div>
|
| 361 |
"""
|
| 362 |
+
|
| 363 |
return summary, details, status
|
| 364 |
+
|
| 365 |
except Exception as exc:
|
| 366 |
logger.error(f"Analysis error: {exc}", exc_info=True)
|
| 367 |
error_msg = f"""
|
|
|
|
| 381 |
"""Format the analysis response as clean markdown with black text."""
|
| 382 |
if not response:
|
| 383 |
return "❌ **No analysis results available.**"
|
| 384 |
+
|
| 385 |
parts = []
|
| 386 |
+
|
| 387 |
# Header with primary finding and confidence
|
| 388 |
primary = response.get("primary_finding", "Analysis Complete")
|
| 389 |
confidence = response.get("confidence", {})
|
| 390 |
conf_score = confidence.get("overall_score", 0) if isinstance(confidence, dict) else 0
|
| 391 |
+
|
| 392 |
# Determine severity
|
| 393 |
severity = response.get("severity", "low")
|
| 394 |
severity_config = {
|
|
|
|
| 398 |
"low": ("🟢", "#16a34a", "#f0fdf4")
|
| 399 |
}
|
| 400 |
emoji, color, bg_color = severity_config.get(severity, severity_config["low"])
|
| 401 |
+
|
| 402 |
# Build confidence display
|
| 403 |
conf_badge = ""
|
| 404 |
if conf_score:
|
| 405 |
conf_pct = int(conf_score * 100)
|
| 406 |
conf_color = "#16a34a" if conf_pct >= 80 else "#ca8a04" if conf_pct >= 60 else "#dc2626"
|
| 407 |
conf_badge = f'<span style="background: {conf_color}; color: white; padding: 4px 12px; border-radius: 20px; font-size: 0.85em; margin-left: 12px;">{conf_pct}% confidence</span>'
|
| 408 |
+
|
| 409 |
parts.append(f"""
|
| 410 |
<div style="background: linear-gradient(135deg, {bg_color} 0%, white 100%); border-left: 4px solid {color}; border-radius: 12px; padding: 20px; margin-bottom: 20px;">
|
| 411 |
<div style="display: flex; align-items: center; flex-wrap: wrap;">
|
|
|
|
| 414 |
{conf_badge}
|
| 415 |
</div>
|
| 416 |
</div>""")
|
| 417 |
+
|
| 418 |
# Critical Alerts
|
| 419 |
alerts = response.get("safety_alerts", [])
|
| 420 |
if alerts:
|
|
|
|
| 424 |
alert_items += f'<li><strong>{alert.get("alert_type", "Alert")}:</strong> {alert.get("message", "")}</li>'
|
| 425 |
else:
|
| 426 |
alert_items += f'<li>{alert}</li>'
|
| 427 |
+
|
| 428 |
parts.append(f"""
|
| 429 |
<div style="background: linear-gradient(135deg, #fef2f2 0%, #fee2e2 100%); border: 1px solid #fecaca; border-radius: 12px; padding: 16px; margin-bottom: 16px;">
|
| 430 |
<h4 style="margin: 0 0 12px 0; color: #dc2626; display: flex; align-items: center; gap: 8px;">
|
|
|
|
| 433 |
<ul style="margin: 0; padding-left: 20px; color: #991b1b;">{alert_items}</ul>
|
| 434 |
</div>
|
| 435 |
""")
|
| 436 |
+
|
| 437 |
# Key Findings
|
| 438 |
findings = response.get("key_findings", [])
|
| 439 |
if findings:
|
|
|
|
| 444 |
<ul style="margin: 0; padding-left: 20px; color: #475569;">{finding_items}</ul>
|
| 445 |
</div>
|
| 446 |
""")
|
| 447 |
+
|
| 448 |
# Biomarker Flags - as a visual grid
|
| 449 |
flags = response.get("biomarker_flags", [])
|
| 450 |
if flags and len(flags) > 0:
|
|
|
|
| 457 |
continue
|
| 458 |
status = flag.get("status", "normal").lower()
|
| 459 |
value = flag.get("value", flag.get("result", "N/A"))
|
| 460 |
+
|
| 461 |
status_styles = {
|
| 462 |
"critical": ("🔴", "#dc2626", "#fef2f2"),
|
| 463 |
"high": ("🔴", "#dc2626", "#fef2f2"),
|
|
|
|
| 466 |
"normal": ("🟢", "#16a34a", "#f0fdf4")
|
| 467 |
}
|
| 468 |
s_emoji, s_color, s_bg = status_styles.get(status, status_styles["normal"])
|
| 469 |
+
|
| 470 |
flag_cards += f"""
|
| 471 |
<div style="background: {s_bg}; border: 1px solid {s_color}33; border-radius: 8px; padding: 12px; text-align: center;">
|
| 472 |
<div style="font-size: 1.2em;">{s_emoji}</div>
|
|
|
|
| 475 |
<div style="font-size: 0.75em; color: #64748b; text-transform: capitalize;">{status}</div>
|
| 476 |
</div>
|
| 477 |
"""
|
| 478 |
+
|
| 479 |
if flag_cards: # Only show section if we have cards
|
| 480 |
parts.append(f"""
|
| 481 |
<div style="margin-bottom: 16px;">
|
|
|
|
| 485 |
</div>
|
| 486 |
</div>
|
| 487 |
""")
|
| 488 |
+
|
| 489 |
# Recommendations - organized sections
|
| 490 |
recs = response.get("recommendations", {})
|
| 491 |
rec_sections = ""
|
| 492 |
+
|
| 493 |
immediate = recs.get("immediate_actions", []) if isinstance(recs, dict) else []
|
| 494 |
if immediate and len(immediate) > 0:
|
| 495 |
items = "".join([f'<li style="margin-bottom: 6px;">{str(a).strip()}</li>' for a in immediate[:3]])
|
|
|
|
| 499 |
<ul style="margin: 0; padding-left: 20px; color: #475569;">{items}</ul>
|
| 500 |
</div>
|
| 501 |
"""
|
| 502 |
+
|
| 503 |
lifestyle = recs.get("lifestyle_modifications", []) if isinstance(recs, dict) else []
|
| 504 |
if lifestyle and len(lifestyle) > 0:
|
| 505 |
items = "".join([f'<li style="margin-bottom: 6px;">{str(m).strip()}</li>' for m in lifestyle[:3]])
|
|
|
|
| 509 |
<ul style="margin: 0; padding-left: 20px; color: #475569;">{items}</ul>
|
| 510 |
</div>
|
| 511 |
"""
|
| 512 |
+
|
| 513 |
followup = recs.get("follow_up", []) if isinstance(recs, dict) else []
|
| 514 |
if followup and len(followup) > 0:
|
| 515 |
items = "".join([f'<li style="margin-bottom: 6px;">{str(f).strip()}</li>' for f in followup[:3]])
|
|
|
|
| 519 |
<ul style="margin: 0; padding-left: 20px; color: #475569;">{items}</ul>
|
| 520 |
</div>
|
| 521 |
"""
|
| 522 |
+
|
| 523 |
# Add default recommendations if none provided
|
| 524 |
if not rec_sections:
|
| 525 |
+
rec_sections = """
|
| 526 |
<div style="margin-bottom: 12px;">
|
| 527 |
<h5 style="margin: 0 0 8px 0; color: #2563eb;">📋 General Recommendations</h5>
|
| 528 |
<ul style="margin: 0; padding-left: 20px; color: #475569;">
|
|
|
|
| 532 |
</ul>
|
| 533 |
</div>
|
| 534 |
"""
|
| 535 |
+
|
| 536 |
if rec_sections:
|
| 537 |
parts.append(f"""
|
| 538 |
<div style="background: linear-gradient(135deg, #f0f9ff 0%, #e0f2fe 100%); border-radius: 12px; padding: 16px; margin-bottom: 16px;">
|
|
|
|
| 540 |
{rec_sections}
|
| 541 |
</div>
|
| 542 |
""")
|
| 543 |
+
|
| 544 |
# Disease Explanation
|
| 545 |
explanation = response.get("disease_explanation", {})
|
| 546 |
if explanation and isinstance(explanation, dict):
|
|
|
|
| 552 |
<p style="margin: 0; color: #475569; line-height: 1.6;">{pathophys[:600]}{'...' if len(pathophys) > 600 else ''}</p>
|
| 553 |
</div>
|
| 554 |
""")
|
| 555 |
+
|
| 556 |
# Conversational Summary
|
| 557 |
conv_summary = response.get("conversational_summary", "")
|
| 558 |
if conv_summary:
|
|
|
|
| 562 |
<p style="margin: 0; color: #475569; line-height: 1.6;">{conv_summary[:1000]}</p>
|
| 563 |
</div>
|
| 564 |
""")
|
| 565 |
+
|
| 566 |
# Footer
|
| 567 |
parts.append(f"""
|
| 568 |
<div style="border-top: 1px solid #e2e8f0; padding-top: 16px; margin-top: 8px; text-align: center;">
|
|
|
|
| 574 |
</p>
|
| 575 |
</div>
|
| 576 |
""")
|
| 577 |
+
|
| 578 |
return "\n".join(parts)
|
| 579 |
|
| 580 |
|
|
|
|
| 603 |
_rag_service_error = None
|
| 604 |
|
| 605 |
try:
|
| 606 |
+
from src.llm_config import get_synthesizer
|
| 607 |
from src.services.agents.agentic_rag import AgenticRAGService
|
| 608 |
from src.services.agents.context import AgenticContext
|
| 609 |
from src.services.retrieval.factory import make_retriever
|
|
|
|
| 610 |
|
| 611 |
llm = get_synthesizer()
|
| 612 |
retriever = make_retriever() # auto-detects FAISS
|
|
|
|
| 634 |
|
| 635 |
def _fallback_qa(question: str, context_text: str = "") -> str:
|
| 636 |
"""Direct retriever+LLM fallback when agentic pipeline is unavailable."""
|
|
|
|
| 637 |
from src.llm_config import get_synthesizer
|
| 638 |
+
from src.services.retrieval.factory import make_retriever
|
| 639 |
|
| 640 |
retriever = make_retriever()
|
| 641 |
search_query = f"{context_text} {question}" if context_text.strip() else question
|
|
|
|
| 724 |
|
| 725 |
except Exception as exc:
|
| 726 |
logger.exception(f"Q&A error: {exc}")
|
| 727 |
+
error_msg = f"❌ Error: {exc!s}"
|
| 728 |
history = (chat_history or []) + [(question, error_msg)]
|
| 729 |
return error_msg, history
|
| 730 |
|
| 731 |
|
| 732 |
+
def streaming_answer(question: str, context: str, history: list, model: str):
|
| 733 |
"""Stream answer using the full agentic RAG pipeline.
|
| 734 |
Falls back to direct retriever+LLM if the pipeline is unavailable.
|
| 735 |
"""
|
| 736 |
+
history = history or []
|
| 737 |
if not question.strip():
|
| 738 |
+
yield history
|
| 739 |
return
|
| 740 |
|
| 741 |
+
history.append((question, ""))
|
| 742 |
+
|
| 743 |
if not groq_key and not google_key:
|
| 744 |
+
history[-1] = (question, "❌ Please add your GROQ_API_KEY or GOOGLE_API_KEY in Space Settings → Secrets.")
|
| 745 |
+
yield history
|
| 746 |
return
|
| 747 |
|
| 748 |
+
# Update provider if model changed (simplified handling for UI demo)
|
| 749 |
+
if "gemini" in model.lower():
|
| 750 |
+
os.environ["LLM_PROVIDER"] = "gemini"
|
| 751 |
+
else:
|
| 752 |
+
os.environ["LLM_PROVIDER"] = "groq"
|
| 753 |
+
|
| 754 |
setup_llm_provider()
|
| 755 |
|
| 756 |
try:
|
| 757 |
+
history[-1] = (question, "🛡️ Checking medical domain relevance...\n\n")
|
| 758 |
+
yield history
|
| 759 |
|
| 760 |
start_time = time.time()
|
| 761 |
|
| 762 |
rag_service = _get_rag_service()
|
| 763 |
if rag_service is not None:
|
| 764 |
+
history[-1] = (question, "🛡️ Checking medical domain relevance...\n🔍 Retrieving medical documents...\n\n")
|
| 765 |
+
yield history
|
| 766 |
result = rag_service.ask(query=question, patient_context=context)
|
| 767 |
answer = result.get("final_answer", "")
|
| 768 |
guardrail = result.get("guardrail_score")
|
| 769 |
docs_relevant = len(result.get("relevant_documents", []))
|
| 770 |
docs_retrieved = len(result.get("retrieved_documents", []))
|
| 771 |
else:
|
| 772 |
+
history[-1] = (question, "🔍 Searching medical knowledge base...\n📚 Retrieving relevant documents...\n\n")
|
| 773 |
+
yield history
|
| 774 |
answer = _fallback_qa(question, context)
|
| 775 |
guardrail = None
|
| 776 |
docs_relevant = 0
|
|
|
|
| 779 |
if not answer:
|
| 780 |
answer = "I apologize, but I couldn't generate a response. Please try rephrasing your question."
|
| 781 |
|
| 782 |
+
history[-1] = (question, "🛡️ Guardrail ✓\n🔍 Retrieved ✓\n📊 Graded ✓\n💭 Generating response...\n\n")
|
| 783 |
+
yield history
|
| 784 |
|
| 785 |
elapsed = time.time() - start_time
|
| 786 |
|
|
|
|
| 789 |
accumulated = ""
|
| 790 |
for i, word in enumerate(words):
|
| 791 |
accumulated += word + " "
|
| 792 |
+
if i % 10 == 0:
|
| 793 |
+
history[-1] = (question, accumulated)
|
| 794 |
+
yield history
|
| 795 |
+
time.sleep(0.01)
|
| 796 |
|
| 797 |
# Final response with metadata
|
| 798 |
meta_parts = [f"⏱️ {elapsed:.1f}s"]
|
|
|
|
| 803 |
meta_parts.append("🤖 Agentic RAG" if rag_service else "🤖 RAG")
|
| 804 |
meta_line = " | ".join(meta_parts)
|
| 805 |
|
| 806 |
+
final_msg = f"{answer}\n\n---\n*{meta_line}*\n"
|
| 807 |
+
history[-1] = (question, final_msg)
|
| 808 |
+
yield history
|
|
|
|
|
|
|
| 809 |
|
| 810 |
except Exception as exc:
|
| 811 |
logger.exception(f"Streaming Q&A error: {exc}")
|
| 812 |
+
history[-1] = (question, f"❌ Error: {exc!s}")
|
| 813 |
+
yield history
|
| 814 |
+
|
| 815 |
+
|
| 816 |
+
def hf_search(query: str, mode: str):
|
| 817 |
+
"""Direct fast-retrieval for the HF Space Knowledge tab."""
|
| 818 |
+
if not query.strip():
|
| 819 |
+
return "Please enter a query."
|
| 820 |
+
try:
|
| 821 |
+
from src.services.retrieval.factory import make_retriever
|
| 822 |
+
retriever = make_retriever()
|
| 823 |
+
docs = retriever.retrieve(query, top_k=5)
|
| 824 |
+
if not docs:
|
| 825 |
+
return "No results found."
|
| 826 |
+
parts = []
|
| 827 |
+
for i, doc in enumerate(docs, 1):
|
| 828 |
+
title = doc.metadata.get("title", doc.metadata.get("source_file", "Untitled"))
|
| 829 |
+
score = doc.score if hasattr(doc, 'score') else 0.0
|
| 830 |
+
parts.append(f"**[{i}] {title}** (score: {score:.3f})\n{doc.content}\n")
|
| 831 |
+
return "\n---\n".join(parts)
|
| 832 |
+
except Exception as exc:
|
| 833 |
+
return f"Error: {exc}"
|
| 834 |
|
| 835 |
|
| 836 |
# ---------------------------------------------------------------------------
|
|
|
|
| 1069 |
|
| 1070 |
def create_demo() -> gr.Blocks:
|
| 1071 |
"""Create the Gradio Blocks interface with modern medical UI."""
|
| 1072 |
+
|
| 1073 |
with gr.Blocks(
|
| 1074 |
title="Agentic RagBot - Medical Biomarker Analysis",
|
| 1075 |
theme=gr.themes.Soft(
|
|
|
|
| 1095 |
),
|
| 1096 |
css=CUSTOM_CSS,
|
| 1097 |
) as demo:
|
| 1098 |
+
|
| 1099 |
# ===== HEADER =====
|
| 1100 |
gr.HTML("""
|
| 1101 |
<div class="header-container">
|
|
|
|
| 1109 |
</div>
|
| 1110 |
</div>
|
| 1111 |
""")
|
| 1112 |
+
|
| 1113 |
# ===== API KEY INFO =====
|
| 1114 |
gr.HTML("""
|
| 1115 |
<div class="info-banner">
|
|
|
|
| 1126 |
</div>
|
| 1127 |
</div>
|
| 1128 |
""")
|
| 1129 |
+
|
| 1130 |
# ===== MAIN TABS =====
|
| 1131 |
with gr.Tabs() as main_tabs:
|
| 1132 |
+
|
| 1133 |
# ==================== TAB 1: BIOMARKER ANALYSIS ====================
|
| 1134 |
with gr.Tab("🔬 Biomarker Analysis", id="biomarker-tab"):
|
| 1135 |
+
|
| 1136 |
# ===== MAIN CONTENT =====
|
| 1137 |
with gr.Row(equal_height=False):
|
| 1138 |
+
|
| 1139 |
# ----- LEFT PANEL: INPUT -----
|
| 1140 |
with gr.Column(scale=2, min_width=400):
|
| 1141 |
gr.HTML('<div class="section-title">📝 Enter Your Biomarkers</div>')
|
| 1142 |
+
|
| 1143 |
with gr.Group():
|
| 1144 |
input_text = gr.Textbox(
|
| 1145 |
label="",
|
|
|
|
| 1148 |
max_lines=12,
|
| 1149 |
show_label=False,
|
| 1150 |
)
|
| 1151 |
+
|
| 1152 |
with gr.Row():
|
| 1153 |
analyze_btn = gr.Button(
|
| 1154 |
+
"🔬 Analyze Biomarkers",
|
| 1155 |
+
variant="primary",
|
| 1156 |
size="lg",
|
| 1157 |
scale=3,
|
| 1158 |
)
|
| 1159 |
clear_btn = gr.Button(
|
| 1160 |
+
"🗑️ Clear",
|
| 1161 |
variant="secondary",
|
| 1162 |
size="lg",
|
| 1163 |
scale=1,
|
| 1164 |
)
|
| 1165 |
+
|
| 1166 |
# Status display
|
| 1167 |
status_output = gr.Markdown(
|
| 1168 |
value="",
|
| 1169 |
elem_classes="status-box"
|
| 1170 |
)
|
| 1171 |
+
|
| 1172 |
# Quick Examples
|
| 1173 |
gr.HTML('<div class="section-title" style="margin-top: 24px;">⚡ Quick Examples</div>')
|
| 1174 |
gr.HTML('<p style="color: #64748b; font-size: 0.9em; margin-bottom: 12px;">Click any example to load it instantly</p>')
|
| 1175 |
+
|
| 1176 |
examples = gr.Examples(
|
| 1177 |
examples=[
|
| 1178 |
["Glucose: 185, HbA1c: 8.2, Cholesterol: 245, LDL: 165"],
|
|
|
|
| 1184 |
inputs=input_text,
|
| 1185 |
label="",
|
| 1186 |
)
|
| 1187 |
+
|
| 1188 |
# Supported Biomarkers
|
| 1189 |
with gr.Accordion("📊 Supported Biomarkers", open=False):
|
| 1190 |
gr.HTML("""
|
|
|
|
| 1215 |
</div>
|
| 1216 |
</div>
|
| 1217 |
""")
|
| 1218 |
+
|
| 1219 |
# ----- RIGHT PANEL: RESULTS -----
|
| 1220 |
with gr.Column(scale=3, min_width=500):
|
| 1221 |
gr.HTML('<div class="section-title">📊 Analysis Results</div>')
|
| 1222 |
+
|
| 1223 |
with gr.Tabs() as result_tabs:
|
| 1224 |
with gr.Tab("📋 Summary", id="summary"):
|
| 1225 |
summary_output = gr.Markdown(
|
|
|
|
| 1232 |
""",
|
| 1233 |
elem_classes="summary-output"
|
| 1234 |
)
|
| 1235 |
+
|
| 1236 |
with gr.Tab("🔍 Detailed JSON", id="json"):
|
| 1237 |
details_output = gr.Code(
|
| 1238 |
label="",
|
|
|
|
| 1240 |
lines=30,
|
| 1241 |
show_label=False,
|
| 1242 |
)
|
| 1243 |
+
|
| 1244 |
# ==================== TAB 2: MEDICAL Q&A ====================
|
| 1245 |
with gr.Tab("💬 Medical Q&A", id="qa-tab"):
|
| 1246 |
+
|
| 1247 |
gr.HTML("""
|
| 1248 |
<div style="margin-bottom: 20px;">
|
| 1249 |
<h3 style="color: #1e3a5f; margin: 0 0 8px 0;">💬 Medical Q&A Assistant</h3>
|
|
|
|
| 1252 |
</p>
|
| 1253 |
</div>
|
| 1254 |
""")
|
| 1255 |
+
|
| 1256 |
with gr.Row(equal_height=False):
|
| 1257 |
with gr.Column(scale=1):
|
| 1258 |
qa_context = gr.Textbox(
|
|
|
|
| 1261 |
lines=3,
|
| 1262 |
max_lines=6,
|
| 1263 |
)
|
| 1264 |
+
qa_model = gr.Dropdown(
|
| 1265 |
+
choices=["llama-3.3-70b-versatile", "gemini-2.0-flash", "llama3.1:8b"],
|
| 1266 |
+
value="llama-3.3-70b-versatile",
|
| 1267 |
+
label="LLM Provider/Model"
|
| 1268 |
+
)
|
| 1269 |
qa_question = gr.Textbox(
|
| 1270 |
label="Your Question",
|
| 1271 |
placeholder="Ask any medical question...\n• What do my elevated glucose levels indicate?\n• Should I be concerned about my HbA1c of 7.5%?\n• What lifestyle changes help with prediabetes?",
|
|
|
|
| 1281 |
)
|
| 1282 |
qa_clear_btn = gr.Button(
|
| 1283 |
"🗑️ Clear",
|
| 1284 |
+
variant="secondary",
|
| 1285 |
size="lg",
|
| 1286 |
scale=1,
|
| 1287 |
)
|
| 1288 |
+
|
| 1289 |
# Quick question examples
|
| 1290 |
gr.HTML('<h4 style="margin-top: 16px; color: #1e3a5f;">Example Questions</h4>')
|
| 1291 |
qa_examples = gr.Examples(
|
|
|
|
| 1298 |
inputs=[qa_question, qa_context],
|
| 1299 |
label="",
|
| 1300 |
)
|
| 1301 |
+
|
| 1302 |
with gr.Column(scale=2):
|
| 1303 |
gr.HTML('<h4 style="color: #1e3a5f; margin-bottom: 12px;">📝 Answer</h4>')
|
| 1304 |
+
qa_answer = gr.Chatbot(
|
| 1305 |
+
label="Medical Q&A History",
|
| 1306 |
+
height=600,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1307 |
elem_classes="qa-output"
|
| 1308 |
)
|
| 1309 |
+
|
| 1310 |
# Q&A Event Handlers
|
| 1311 |
qa_submit_btn.click(
|
| 1312 |
fn=streaming_answer,
|
| 1313 |
+
inputs=[qa_question, qa_context, qa_answer, qa_model],
|
| 1314 |
outputs=qa_answer,
|
| 1315 |
show_progress="minimal",
|
| 1316 |
+
).then(
|
| 1317 |
+
fn=lambda: "",
|
| 1318 |
+
outputs=qa_question
|
| 1319 |
)
|
| 1320 |
+
|
| 1321 |
qa_clear_btn.click(
|
| 1322 |
+
fn=lambda: ([], ""),
|
| 1323 |
+
outputs=[qa_answer, qa_question],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1324 |
)
|
| 1325 |
+
|
| 1326 |
+
# ==================== TAB 3: SEARCH KNOWLEDGE BASE ====================
|
| 1327 |
+
with gr.Tab("🔍 Search Knowledge Base", id="search-tab"):
|
| 1328 |
+
with gr.Row():
|
| 1329 |
+
search_input = gr.Textbox(
|
| 1330 |
+
label="Search Query",
|
| 1331 |
+
placeholder="e.g., diabetes management guidelines",
|
| 1332 |
+
lines=2,
|
| 1333 |
+
scale=3
|
| 1334 |
+
)
|
| 1335 |
+
search_mode = gr.Radio(
|
| 1336 |
+
choices=["hybrid", "bm25", "vector"],
|
| 1337 |
+
value="hybrid",
|
| 1338 |
+
label="Search Strategy",
|
| 1339 |
+
scale=1
|
| 1340 |
+
)
|
| 1341 |
+
search_btn = gr.Button("Search", variant="primary")
|
| 1342 |
+
search_output = gr.Textbox(label="Results", lines=20, interactive=False)
|
| 1343 |
+
|
| 1344 |
+
search_btn.click(fn=hf_search, inputs=[search_input, search_mode], outputs=search_output)
|
| 1345 |
+
|
| 1346 |
# ===== HOW IT WORKS =====
|
| 1347 |
gr.HTML('<div class="section-title" style="margin-top: 32px;">🤖 How It Works</div>')
|
| 1348 |
+
|
| 1349 |
gr.HTML("""
|
| 1350 |
<div class="agent-grid">
|
| 1351 |
<div class="agent-card">
|
|
|
|
| 1374 |
</div>
|
| 1375 |
</div>
|
| 1376 |
""")
|
| 1377 |
+
|
| 1378 |
# ===== DISCLAIMER =====
|
| 1379 |
gr.HTML("""
|
| 1380 |
<div class="disclaimer">
|
|
|
|
| 1384 |
clinical guidelines and may not account for your specific medical history.
|
| 1385 |
</div>
|
| 1386 |
""")
|
| 1387 |
+
|
| 1388 |
# ===== FOOTER =====
|
| 1389 |
gr.HTML("""
|
| 1390 |
<div style="text-align: center; padding: 24px; color: #94a3b8; font-size: 0.85em; margin-top: 24px;">
|
|
|
|
| 1399 |
</p>
|
| 1400 |
</div>
|
| 1401 |
""")
|
| 1402 |
+
|
| 1403 |
# ===== EVENT HANDLERS =====
|
| 1404 |
analyze_btn.click(
|
| 1405 |
fn=analyze_biomarkers,
|
|
|
|
| 1407 |
outputs=[summary_output, details_output, status_output],
|
| 1408 |
show_progress="full",
|
| 1409 |
)
|
| 1410 |
+
|
| 1411 |
clear_btn.click(
|
| 1412 |
fn=lambda: ("", """
|
| 1413 |
<div style="text-align: center; padding: 60px 20px; color: #94a3b8;">
|
|
|
|
| 1418 |
""", "", ""),
|
| 1419 |
outputs=[input_text, summary_output, details_output, status_output],
|
| 1420 |
)
|
| 1421 |
+
|
| 1422 |
return demo
|
| 1423 |
|
| 1424 |
|
|
|
|
| 1428 |
|
| 1429 |
if __name__ == "__main__":
|
| 1430 |
logger.info("Starting MediGuard AI Gradio App...")
|
| 1431 |
+
|
| 1432 |
demo = create_demo()
|
| 1433 |
+
|
| 1434 |
# Launch with HF Spaces compatible settings
|
| 1435 |
demo.launch(
|
| 1436 |
server_name="0.0.0.0",
|
pytest.ini
CHANGED
|
@@ -2,3 +2,6 @@
|
|
| 2 |
filterwarnings =
|
| 3 |
ignore::langchain_core._api.deprecation.LangChainDeprecationWarning
|
| 4 |
ignore:.*class.*HuggingFaceEmbeddings.*was deprecated.*:DeprecationWarning
|
|
|
|
|
|
|
|
|
|
|
|
| 2 |
filterwarnings =
|
| 3 |
ignore::langchain_core._api.deprecation.LangChainDeprecationWarning
|
| 4 |
ignore:.*class.*HuggingFaceEmbeddings.*was deprecated.*:DeprecationWarning
|
| 5 |
+
|
| 6 |
+
markers =
|
| 7 |
+
integration: mark a test as an integration test.
|
requirements.txt
DELETED
|
@@ -1,41 +0,0 @@
|
|
| 1 |
-
# MediGuard AI RAG-Helper - Dependencies
|
| 2 |
-
|
| 3 |
-
# Core Framework
|
| 4 |
-
langchain>=0.1.0
|
| 5 |
-
langgraph>=0.0.20
|
| 6 |
-
langchain-community>=0.0.13
|
| 7 |
-
langchain-core>=0.1.10
|
| 8 |
-
|
| 9 |
-
# LLM Providers (Cloud - FREE tiers available)
|
| 10 |
-
langchain-groq>=0.1.0 # Groq API (FREE tier, llama-3.3-70b)
|
| 11 |
-
langchain-google-genai>=1.0.0 # Google Gemini (FREE tier)
|
| 12 |
-
|
| 13 |
-
# Local LLM (optional, for offline use)
|
| 14 |
-
# ollama>=0.1.6
|
| 15 |
-
|
| 16 |
-
# Vector Store & Embeddings
|
| 17 |
-
faiss-cpu>=1.9.0
|
| 18 |
-
sentence-transformers>=2.2.2
|
| 19 |
-
|
| 20 |
-
# Document Processing
|
| 21 |
-
pypdf>=3.17.4
|
| 22 |
-
pydantic>=2.5.3
|
| 23 |
-
|
| 24 |
-
# Data Handling
|
| 25 |
-
pandas>=2.1.4
|
| 26 |
-
|
| 27 |
-
# Environment & Configuration
|
| 28 |
-
python-dotenv>=1.0.0
|
| 29 |
-
|
| 30 |
-
# Utilities
|
| 31 |
-
numpy>=1.26.2
|
| 32 |
-
matplotlib>=3.8.2
|
| 33 |
-
|
| 34 |
-
# Optional: improved readability scoring for evaluations
|
| 35 |
-
textstat>=0.7.3
|
| 36 |
-
|
| 37 |
-
# Optional: HuggingFace embedding provider
|
| 38 |
-
# langchain-huggingface>=0.0.1
|
| 39 |
-
|
| 40 |
-
# Optional: Ollama local LLM provider
|
| 41 |
-
# langchain-ollama>=0.0.1
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
scripts/chat.py
CHANGED
|
@@ -4,9 +4,9 @@ Enables natural language conversation with the RAG system
|
|
| 4 |
"""
|
| 5 |
|
| 6 |
import json
|
| 7 |
-
import sys
|
| 8 |
-
import os
|
| 9 |
import logging
|
|
|
|
|
|
|
| 10 |
import warnings
|
| 11 |
|
| 12 |
# ── Silence HuggingFace / transformers noise BEFORE any ML library is loaded ──
|
|
@@ -21,9 +21,9 @@ logging.getLogger("huggingface_hub").setLevel(logging.ERROR)
|
|
| 21 |
warnings.filterwarnings("ignore", message=".*class.*HuggingFaceEmbeddings.*was deprecated.*")
|
| 22 |
# ─────────────────────────────────────────────────────────────────────────────
|
| 23 |
|
| 24 |
-
from pathlib import Path
|
| 25 |
-
from typing import Dict, Any, Tuple
|
| 26 |
from datetime import datetime
|
|
|
|
|
|
|
| 27 |
|
| 28 |
# Set UTF-8 encoding for Windows console
|
| 29 |
if sys.platform == 'win32':
|
|
@@ -40,11 +40,11 @@ if sys.platform == 'win32':
|
|
| 40 |
sys.path.insert(0, str(Path(__file__).parent.parent))
|
| 41 |
|
| 42 |
from langchain_core.prompts import ChatPromptTemplate
|
|
|
|
| 43 |
from src.biomarker_normalization import normalize_biomarker_name
|
| 44 |
from src.llm_config import get_chat_model
|
| 45 |
-
from src.workflow import create_guild
|
| 46 |
from src.state import PatientInput
|
| 47 |
-
|
| 48 |
|
| 49 |
# ============================================================================
|
| 50 |
# BIOMARKER EXTRACTION PROMPT
|
|
@@ -82,7 +82,7 @@ If you cannot find any biomarkers, return {{"biomarkers": {{}}, "patient_context
|
|
| 82 |
# Component 1: Biomarker Extraction
|
| 83 |
# ============================================================================
|
| 84 |
|
| 85 |
-
def _parse_llm_json(content: str) ->
|
| 86 |
"""Parse JSON payload from LLM output with fallback recovery."""
|
| 87 |
text = content.strip()
|
| 88 |
|
|
@@ -101,7 +101,7 @@ def _parse_llm_json(content: str) -> Dict[str, Any]:
|
|
| 101 |
raise
|
| 102 |
|
| 103 |
|
| 104 |
-
def extract_biomarkers(user_message: str) ->
|
| 105 |
"""
|
| 106 |
Extract biomarker values from natural language using LLM.
|
| 107 |
|
|
@@ -111,17 +111,17 @@ def extract_biomarkers(user_message: str) -> Tuple[Dict[str, float], Dict[str, A
|
|
| 111 |
try:
|
| 112 |
llm = get_chat_model(temperature=0.0)
|
| 113 |
prompt = ChatPromptTemplate.from_template(BIOMARKER_EXTRACTION_PROMPT)
|
| 114 |
-
|
| 115 |
chain = prompt | llm
|
| 116 |
response = chain.invoke({"user_message": user_message})
|
| 117 |
-
|
| 118 |
# Parse JSON from LLM response
|
| 119 |
content = response.content.strip()
|
| 120 |
-
|
| 121 |
extracted = _parse_llm_json(content)
|
| 122 |
biomarkers = extracted.get("biomarkers", {})
|
| 123 |
patient_context = extracted.get("patient_context", {})
|
| 124 |
-
|
| 125 |
# Normalize biomarker names
|
| 126 |
normalized = {}
|
| 127 |
for key, value in biomarkers.items():
|
|
@@ -131,12 +131,12 @@ def extract_biomarkers(user_message: str) -> Tuple[Dict[str, float], Dict[str, A
|
|
| 131 |
except (ValueError, TypeError) as e:
|
| 132 |
print(f"⚠️ Skipping invalid value for {key}: {value} (error: {e})")
|
| 133 |
continue
|
| 134 |
-
|
| 135 |
# Clean up patient context (remove null values)
|
| 136 |
patient_context = {k: v for k, v in patient_context.items() if v is not None}
|
| 137 |
-
|
| 138 |
return normalized, patient_context
|
| 139 |
-
|
| 140 |
except Exception as e:
|
| 141 |
print(f"⚠️ Extraction failed: {e}")
|
| 142 |
import traceback
|
|
@@ -148,7 +148,7 @@ def extract_biomarkers(user_message: str) -> Tuple[Dict[str, float], Dict[str, A
|
|
| 148 |
# Component 2: Disease Prediction
|
| 149 |
# ============================================================================
|
| 150 |
|
| 151 |
-
def predict_disease_simple(biomarkers:
|
| 152 |
"""
|
| 153 |
Simple rule-based disease prediction based on key biomarkers.
|
| 154 |
"""
|
|
@@ -159,15 +159,15 @@ def predict_disease_simple(biomarkers: Dict[str, float]) -> Dict[str, Any]:
|
|
| 159 |
"Thrombocytopenia": 0.0,
|
| 160 |
"Thalassemia": 0.0
|
| 161 |
}
|
| 162 |
-
|
| 163 |
# Helper: check both abbreviated and normalized biomarker names
|
| 164 |
# Returns None when biomarker is not present (avoids false triggers)
|
| 165 |
def _get(name, *alt_names):
|
| 166 |
-
val = biomarkers.get(name
|
| 167 |
if val is not None:
|
| 168 |
return val
|
| 169 |
for alt in alt_names:
|
| 170 |
-
val = biomarkers.get(alt
|
| 171 |
if val is not None:
|
| 172 |
return val
|
| 173 |
return None
|
|
@@ -181,7 +181,7 @@ def predict_disease_simple(biomarkers: Dict[str, float]) -> Dict[str, Any]:
|
|
| 181 |
scores["Diabetes"] += 0.2
|
| 182 |
if hba1c is not None and hba1c >= 6.5:
|
| 183 |
scores["Diabetes"] += 0.5
|
| 184 |
-
|
| 185 |
# Anemia indicators
|
| 186 |
hemoglobin = _get("Hemoglobin")
|
| 187 |
mcv = _get("Mean Corpuscular Volume", "MCV")
|
|
@@ -191,7 +191,7 @@ def predict_disease_simple(biomarkers: Dict[str, float]) -> Dict[str, Any]:
|
|
| 191 |
scores["Anemia"] += 0.2
|
| 192 |
if mcv is not None and mcv < 80:
|
| 193 |
scores["Anemia"] += 0.2
|
| 194 |
-
|
| 195 |
# Heart disease indicators
|
| 196 |
cholesterol = _get("Cholesterol")
|
| 197 |
troponin = _get("Troponin")
|
|
@@ -202,32 +202,32 @@ def predict_disease_simple(biomarkers: Dict[str, float]) -> Dict[str, Any]:
|
|
| 202 |
scores["Heart Disease"] += 0.6
|
| 203 |
if ldl is not None and ldl > 190:
|
| 204 |
scores["Heart Disease"] += 0.2
|
| 205 |
-
|
| 206 |
# Thrombocytopenia indicators
|
| 207 |
platelets = _get("Platelets")
|
| 208 |
if platelets is not None and platelets < 150000:
|
| 209 |
scores["Thrombocytopenia"] += 0.6
|
| 210 |
if platelets is not None and platelets < 50000:
|
| 211 |
scores["Thrombocytopenia"] += 0.3
|
| 212 |
-
|
| 213 |
# Thalassemia indicators (complex, simplified here)
|
| 214 |
if mcv is not None and hemoglobin is not None and mcv < 80 and hemoglobin < 12.0:
|
| 215 |
scores["Thalassemia"] += 0.4
|
| 216 |
-
|
| 217 |
# Find top prediction
|
| 218 |
top_disease = max(scores, key=scores.get)
|
| 219 |
confidence = min(scores[top_disease], 1.0) # Cap at 1.0 for Pydantic validation
|
| 220 |
-
|
| 221 |
if confidence == 0.0:
|
| 222 |
top_disease = "Undetermined"
|
| 223 |
-
|
| 224 |
# Normalize probabilities to sum to 1.0
|
| 225 |
total = sum(scores.values())
|
| 226 |
if total > 0:
|
| 227 |
probabilities = {k: v / total for k, v in scores.items()}
|
| 228 |
else:
|
| 229 |
probabilities = {k: 1.0 / len(scores) for k in scores}
|
| 230 |
-
|
| 231 |
return {
|
| 232 |
"disease": top_disease,
|
| 233 |
"confidence": confidence,
|
|
@@ -235,14 +235,14 @@ def predict_disease_simple(biomarkers: Dict[str, float]) -> Dict[str, Any]:
|
|
| 235 |
}
|
| 236 |
|
| 237 |
|
| 238 |
-
def predict_disease_llm(biomarkers:
|
| 239 |
"""
|
| 240 |
Use LLM to predict most likely disease based on biomarker pattern.
|
| 241 |
Falls back to rule-based if LLM fails.
|
| 242 |
"""
|
| 243 |
try:
|
| 244 |
llm = get_chat_model(temperature=0.0)
|
| 245 |
-
|
| 246 |
prompt = f"""You are a medical AI assistant. Based on these biomarker values,
|
| 247 |
predict the most likely disease from: Diabetes, Anemia, Heart Disease, Thrombocytopenia, Thalassemia.
|
| 248 |
|
|
@@ -265,18 +265,18 @@ Return ONLY valid JSON (no other text):
|
|
| 265 |
}}
|
| 266 |
}}
|
| 267 |
"""
|
| 268 |
-
|
| 269 |
response = llm.invoke(prompt)
|
| 270 |
content = response.content.strip()
|
| 271 |
-
|
| 272 |
prediction = _parse_llm_json(content)
|
| 273 |
-
|
| 274 |
# Validate required fields
|
| 275 |
if "disease" in prediction and "confidence" in prediction and "probabilities" in prediction:
|
| 276 |
return prediction
|
| 277 |
else:
|
| 278 |
raise ValueError("Invalid prediction format")
|
| 279 |
-
|
| 280 |
except Exception as e:
|
| 281 |
print(f"⚠️ LLM prediction failed ({e}), using rule-based fallback")
|
| 282 |
import traceback
|
|
@@ -288,7 +288,7 @@ Return ONLY valid JSON (no other text):
|
|
| 288 |
# Component 3: Conversational Formatter
|
| 289 |
# ============================================================================
|
| 290 |
|
| 291 |
-
def _coerce_to_dict(obj) ->
|
| 292 |
"""Convert a Pydantic model or arbitrary object to a plain dict."""
|
| 293 |
if isinstance(obj, dict):
|
| 294 |
return obj
|
|
@@ -299,7 +299,7 @@ def _coerce_to_dict(obj) -> Dict:
|
|
| 299 |
return {}
|
| 300 |
|
| 301 |
|
| 302 |
-
def format_conversational(result:
|
| 303 |
"""
|
| 304 |
Format technical JSON output into conversational response.
|
| 305 |
"""
|
|
@@ -313,22 +313,22 @@ def format_conversational(result: Dict[str, Any], user_name: str = "there") -> s
|
|
| 313 |
confidence = result.get("confidence_assessment", {}) or {}
|
| 314 |
# Normalize: items may be Pydantic SafetyAlert objects or plain dicts
|
| 315 |
alerts = [_coerce_to_dict(a) for a in (result.get("safety_alerts") or [])]
|
| 316 |
-
|
| 317 |
disease = prediction.get("primary_disease", "Unknown")
|
| 318 |
conf_score = prediction.get("confidence", 0.0)
|
| 319 |
-
|
| 320 |
# Build conversational response
|
| 321 |
response = []
|
| 322 |
-
|
| 323 |
# 1. Greeting and main finding
|
| 324 |
response.append(f"Hi {user_name}! 👋\n")
|
| 325 |
-
response.append(
|
| 326 |
-
|
| 327 |
# 2. Primary diagnosis with confidence
|
| 328 |
emoji = "🔴" if conf_score >= 0.8 else "🟡" if conf_score >= 0.6 else "🟢"
|
| 329 |
response.append(f"{emoji} **Primary Finding:** {disease}")
|
| 330 |
response.append(f" Confidence: {conf_score:.0%}\n")
|
| 331 |
-
|
| 332 |
# 3. Critical safety alerts (if any)
|
| 333 |
critical_alerts = [a for a in alerts if a.get("severity") == "CRITICAL"]
|
| 334 |
if critical_alerts:
|
|
@@ -337,7 +337,7 @@ def format_conversational(result: Dict[str, Any], user_name: str = "there") -> s
|
|
| 337 |
response.append(f" • {alert.get('biomarker', 'Unknown')}: {alert.get('message', '')}")
|
| 338 |
response.append(f" → {alert.get('action', 'Consult healthcare provider')}")
|
| 339 |
response.append("")
|
| 340 |
-
|
| 341 |
# 4. Key drivers explanation
|
| 342 |
key_drivers = prediction.get("key_drivers", [])
|
| 343 |
if key_drivers:
|
|
@@ -351,7 +351,7 @@ def format_conversational(result: Dict[str, Any], user_name: str = "there") -> s
|
|
| 351 |
explanation = explanation[:147] + "..."
|
| 352 |
response.append(f" • **{biomarker}** ({value}): {explanation}")
|
| 353 |
response.append("")
|
| 354 |
-
|
| 355 |
# 5. What to do next (immediate actions)
|
| 356 |
immediate = recommendations.get("immediate_actions", [])
|
| 357 |
if immediate:
|
|
@@ -359,7 +359,7 @@ def format_conversational(result: Dict[str, Any], user_name: str = "there") -> s
|
|
| 359 |
for i, action in enumerate(immediate[:3], 1):
|
| 360 |
response.append(f" {i}. {action}")
|
| 361 |
response.append("")
|
| 362 |
-
|
| 363 |
# 6. Lifestyle recommendations
|
| 364 |
lifestyle = recommendations.get("lifestyle_changes", [])
|
| 365 |
if lifestyle:
|
|
@@ -367,11 +367,11 @@ def format_conversational(result: Dict[str, Any], user_name: str = "there") -> s
|
|
| 367 |
for i, change in enumerate(lifestyle[:3], 1):
|
| 368 |
response.append(f" {i}. {change}")
|
| 369 |
response.append("")
|
| 370 |
-
|
| 371 |
# 7. Disclaimer
|
| 372 |
response.append("ℹ️ **Important:** This is an AI-assisted analysis, NOT medical advice.")
|
| 373 |
response.append(" Please consult a healthcare professional for proper diagnosis and treatment.\n")
|
| 374 |
-
|
| 375 |
return "\n".join(response)
|
| 376 |
|
| 377 |
|
|
@@ -397,7 +397,7 @@ def run_example_case(guild):
|
|
| 397 |
"""Run example diabetes patient case"""
|
| 398 |
print("\n📋 Running Example: Type 2 Diabetes Patient")
|
| 399 |
print(" 52-year-old male with elevated glucose and HbA1c\n")
|
| 400 |
-
|
| 401 |
example_biomarkers = {
|
| 402 |
"Glucose": 185.0,
|
| 403 |
"HbA1c": 8.2,
|
|
@@ -411,7 +411,7 @@ def run_example_case(guild):
|
|
| 411 |
"Systolic Blood Pressure": 145,
|
| 412 |
"Diastolic Blood Pressure": 92
|
| 413 |
}
|
| 414 |
-
|
| 415 |
prediction = {
|
| 416 |
"disease": "Diabetes",
|
| 417 |
"confidence": 0.87,
|
|
@@ -423,16 +423,16 @@ def run_example_case(guild):
|
|
| 423 |
"Thalassemia": 0.01
|
| 424 |
}
|
| 425 |
}
|
| 426 |
-
|
| 427 |
patient_input = PatientInput(
|
| 428 |
biomarkers=example_biomarkers,
|
| 429 |
model_prediction=prediction,
|
| 430 |
patient_context={"age": 52, "gender": "male", "bmi": 31.2}
|
| 431 |
)
|
| 432 |
-
|
| 433 |
print("🔄 Running analysis...\n")
|
| 434 |
result = guild.run(patient_input)
|
| 435 |
-
|
| 436 |
response = format_conversational(result.get("final_response", result), "there")
|
| 437 |
print("\n" + "="*70)
|
| 438 |
print("🤖 RAG-BOT:")
|
|
@@ -441,7 +441,7 @@ def run_example_case(guild):
|
|
| 441 |
print("="*70 + "\n")
|
| 442 |
|
| 443 |
|
| 444 |
-
def save_report(result:
|
| 445 |
"""Save detailed JSON report to file"""
|
| 446 |
timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
|
| 447 |
|
|
@@ -505,7 +505,7 @@ def chat_interface():
|
|
| 505 |
print(" 3. Type 'help' for biomarker list")
|
| 506 |
print(" 4. Type 'quit' to exit\n")
|
| 507 |
print("="*70 + "\n")
|
| 508 |
-
|
| 509 |
# Initialize guild (one-time setup)
|
| 510 |
print("🔧 Initializing medical knowledge system...")
|
| 511 |
try:
|
|
@@ -518,78 +518,78 @@ def chat_interface():
|
|
| 518 |
print(" • Vector store exists (run: python scripts/setup_embeddings.py)")
|
| 519 |
print(" • Internet connection is available for cloud LLM")
|
| 520 |
return
|
| 521 |
-
|
| 522 |
# Main conversation loop
|
| 523 |
conversation_history = []
|
| 524 |
user_name = "there"
|
| 525 |
-
|
| 526 |
while True:
|
| 527 |
try:
|
| 528 |
# Get user input
|
| 529 |
user_input = input("You: ").strip()
|
| 530 |
-
|
| 531 |
if not user_input:
|
| 532 |
continue
|
| 533 |
-
|
| 534 |
# Handle special commands
|
| 535 |
if user_input.lower() in ['quit', 'exit', 'q']:
|
| 536 |
print("\n👋 Thank you for using MediGuard AI. Stay healthy!")
|
| 537 |
break
|
| 538 |
-
|
| 539 |
if user_input.lower() == 'help':
|
| 540 |
print_biomarker_help()
|
| 541 |
continue
|
| 542 |
-
|
| 543 |
if user_input.lower() == 'example':
|
| 544 |
run_example_case(guild)
|
| 545 |
continue
|
| 546 |
-
|
| 547 |
# Extract biomarkers from natural language
|
| 548 |
print("\n🔍 Analyzing your input...")
|
| 549 |
biomarkers, patient_context = extract_biomarkers(user_input)
|
| 550 |
-
|
| 551 |
if not biomarkers:
|
| 552 |
print("❌ I couldn't find any biomarker values in your message.")
|
| 553 |
print(" Try: 'My glucose is 140 and HbA1c is 7.5'")
|
| 554 |
print(" Or type 'help' to see all biomarkers I can analyze.\n")
|
| 555 |
continue
|
| 556 |
-
|
| 557 |
print(f"✅ Found {len(biomarkers)} biomarker(s): {', '.join(biomarkers.keys())}")
|
| 558 |
-
|
| 559 |
# Check if we have enough biomarkers (minimum 2)
|
| 560 |
if len(biomarkers) < 2:
|
| 561 |
print("⚠️ I need at least 2 biomarkers for a reliable analysis.")
|
| 562 |
print(" Can you provide more values?\n")
|
| 563 |
continue
|
| 564 |
-
|
| 565 |
# Generate disease prediction
|
| 566 |
print("🧠 Predicting likely condition...")
|
| 567 |
prediction = predict_disease_llm(biomarkers, patient_context)
|
| 568 |
print(f"✅ Predicted: {prediction['disease']} ({prediction['confidence']:.0%} confidence)")
|
| 569 |
-
|
| 570 |
# Create PatientInput
|
| 571 |
patient_input = PatientInput(
|
| 572 |
biomarkers=biomarkers,
|
| 573 |
model_prediction=prediction,
|
| 574 |
patient_context=patient_context if patient_context else {"source": "chat"}
|
| 575 |
)
|
| 576 |
-
|
| 577 |
# Run full RAG workflow
|
| 578 |
print("📚 Consulting medical knowledge base...")
|
| 579 |
print(" (This may take 15-25 seconds...)\n")
|
| 580 |
-
|
| 581 |
result = guild.run(patient_input)
|
| 582 |
-
|
| 583 |
# Format conversational response
|
| 584 |
response = format_conversational(result.get("final_response", result), user_name)
|
| 585 |
-
|
| 586 |
# Display response
|
| 587 |
print("\n" + "="*70)
|
| 588 |
print("🤖 RAG-BOT:")
|
| 589 |
print("="*70)
|
| 590 |
print(response)
|
| 591 |
print("="*70 + "\n")
|
| 592 |
-
|
| 593 |
# Save to history
|
| 594 |
conversation_history.append({
|
| 595 |
"user_input": user_input,
|
|
@@ -597,16 +597,16 @@ def chat_interface():
|
|
| 597 |
"prediction": prediction,
|
| 598 |
"result": result
|
| 599 |
})
|
| 600 |
-
|
| 601 |
# Ask if user wants to save report
|
| 602 |
save_choice = input("💾 Save detailed report to file? (y/n): ").strip().lower()
|
| 603 |
if save_choice == 'y':
|
| 604 |
save_report(result, biomarkers)
|
| 605 |
-
|
| 606 |
print("\nYou can:")
|
| 607 |
print(" • Enter more biomarkers for a new analysis")
|
| 608 |
print(" • Type 'quit' to exit\n")
|
| 609 |
-
|
| 610 |
except KeyboardInterrupt:
|
| 611 |
print("\n\n👋 Interrupted. Thank you for using MediGuard AI!")
|
| 612 |
break
|
|
|
|
| 4 |
"""
|
| 5 |
|
| 6 |
import json
|
|
|
|
|
|
|
| 7 |
import logging
|
| 8 |
+
import os
|
| 9 |
+
import sys
|
| 10 |
import warnings
|
| 11 |
|
| 12 |
# ── Silence HuggingFace / transformers noise BEFORE any ML library is loaded ──
|
|
|
|
| 21 |
warnings.filterwarnings("ignore", message=".*class.*HuggingFaceEmbeddings.*was deprecated.*")
|
| 22 |
# ─────────────────────────────────────────────────────────────────────────────
|
| 23 |
|
|
|
|
|
|
|
| 24 |
from datetime import datetime
|
| 25 |
+
from pathlib import Path
|
| 26 |
+
from typing import Any
|
| 27 |
|
| 28 |
# Set UTF-8 encoding for Windows console
|
| 29 |
if sys.platform == 'win32':
|
|
|
|
| 40 |
sys.path.insert(0, str(Path(__file__).parent.parent))
|
| 41 |
|
| 42 |
from langchain_core.prompts import ChatPromptTemplate
|
| 43 |
+
|
| 44 |
from src.biomarker_normalization import normalize_biomarker_name
|
| 45 |
from src.llm_config import get_chat_model
|
|
|
|
| 46 |
from src.state import PatientInput
|
| 47 |
+
from src.workflow import create_guild
|
| 48 |
|
| 49 |
# ============================================================================
|
| 50 |
# BIOMARKER EXTRACTION PROMPT
|
|
|
|
| 82 |
# Component 1: Biomarker Extraction
|
| 83 |
# ============================================================================
|
| 84 |
|
| 85 |
+
def _parse_llm_json(content: str) -> dict[str, Any]:
|
| 86 |
"""Parse JSON payload from LLM output with fallback recovery."""
|
| 87 |
text = content.strip()
|
| 88 |
|
|
|
|
| 101 |
raise
|
| 102 |
|
| 103 |
|
| 104 |
+
def extract_biomarkers(user_message: str) -> tuple[dict[str, float], dict[str, Any]]:
|
| 105 |
"""
|
| 106 |
Extract biomarker values from natural language using LLM.
|
| 107 |
|
|
|
|
| 111 |
try:
|
| 112 |
llm = get_chat_model(temperature=0.0)
|
| 113 |
prompt = ChatPromptTemplate.from_template(BIOMARKER_EXTRACTION_PROMPT)
|
| 114 |
+
|
| 115 |
chain = prompt | llm
|
| 116 |
response = chain.invoke({"user_message": user_message})
|
| 117 |
+
|
| 118 |
# Parse JSON from LLM response
|
| 119 |
content = response.content.strip()
|
| 120 |
+
|
| 121 |
extracted = _parse_llm_json(content)
|
| 122 |
biomarkers = extracted.get("biomarkers", {})
|
| 123 |
patient_context = extracted.get("patient_context", {})
|
| 124 |
+
|
| 125 |
# Normalize biomarker names
|
| 126 |
normalized = {}
|
| 127 |
for key, value in biomarkers.items():
|
|
|
|
| 131 |
except (ValueError, TypeError) as e:
|
| 132 |
print(f"⚠️ Skipping invalid value for {key}: {value} (error: {e})")
|
| 133 |
continue
|
| 134 |
+
|
| 135 |
# Clean up patient context (remove null values)
|
| 136 |
patient_context = {k: v for k, v in patient_context.items() if v is not None}
|
| 137 |
+
|
| 138 |
return normalized, patient_context
|
| 139 |
+
|
| 140 |
except Exception as e:
|
| 141 |
print(f"⚠️ Extraction failed: {e}")
|
| 142 |
import traceback
|
|
|
|
| 148 |
# Component 2: Disease Prediction
|
| 149 |
# ============================================================================
|
| 150 |
|
| 151 |
+
def predict_disease_simple(biomarkers: dict[str, float]) -> dict[str, Any]:
|
| 152 |
"""
|
| 153 |
Simple rule-based disease prediction based on key biomarkers.
|
| 154 |
"""
|
|
|
|
| 159 |
"Thrombocytopenia": 0.0,
|
| 160 |
"Thalassemia": 0.0
|
| 161 |
}
|
| 162 |
+
|
| 163 |
# Helper: check both abbreviated and normalized biomarker names
|
| 164 |
# Returns None when biomarker is not present (avoids false triggers)
|
| 165 |
def _get(name, *alt_names):
|
| 166 |
+
val = biomarkers.get(name)
|
| 167 |
if val is not None:
|
| 168 |
return val
|
| 169 |
for alt in alt_names:
|
| 170 |
+
val = biomarkers.get(alt)
|
| 171 |
if val is not None:
|
| 172 |
return val
|
| 173 |
return None
|
|
|
|
| 181 |
scores["Diabetes"] += 0.2
|
| 182 |
if hba1c is not None and hba1c >= 6.5:
|
| 183 |
scores["Diabetes"] += 0.5
|
| 184 |
+
|
| 185 |
# Anemia indicators
|
| 186 |
hemoglobin = _get("Hemoglobin")
|
| 187 |
mcv = _get("Mean Corpuscular Volume", "MCV")
|
|
|
|
| 191 |
scores["Anemia"] += 0.2
|
| 192 |
if mcv is not None and mcv < 80:
|
| 193 |
scores["Anemia"] += 0.2
|
| 194 |
+
|
| 195 |
# Heart disease indicators
|
| 196 |
cholesterol = _get("Cholesterol")
|
| 197 |
troponin = _get("Troponin")
|
|
|
|
| 202 |
scores["Heart Disease"] += 0.6
|
| 203 |
if ldl is not None and ldl > 190:
|
| 204 |
scores["Heart Disease"] += 0.2
|
| 205 |
+
|
| 206 |
# Thrombocytopenia indicators
|
| 207 |
platelets = _get("Platelets")
|
| 208 |
if platelets is not None and platelets < 150000:
|
| 209 |
scores["Thrombocytopenia"] += 0.6
|
| 210 |
if platelets is not None and platelets < 50000:
|
| 211 |
scores["Thrombocytopenia"] += 0.3
|
| 212 |
+
|
| 213 |
# Thalassemia indicators (complex, simplified here)
|
| 214 |
if mcv is not None and hemoglobin is not None and mcv < 80 and hemoglobin < 12.0:
|
| 215 |
scores["Thalassemia"] += 0.4
|
| 216 |
+
|
| 217 |
# Find top prediction
|
| 218 |
top_disease = max(scores, key=scores.get)
|
| 219 |
confidence = min(scores[top_disease], 1.0) # Cap at 1.0 for Pydantic validation
|
| 220 |
+
|
| 221 |
if confidence == 0.0:
|
| 222 |
top_disease = "Undetermined"
|
| 223 |
+
|
| 224 |
# Normalize probabilities to sum to 1.0
|
| 225 |
total = sum(scores.values())
|
| 226 |
if total > 0:
|
| 227 |
probabilities = {k: v / total for k, v in scores.items()}
|
| 228 |
else:
|
| 229 |
probabilities = {k: 1.0 / len(scores) for k in scores}
|
| 230 |
+
|
| 231 |
return {
|
| 232 |
"disease": top_disease,
|
| 233 |
"confidence": confidence,
|
|
|
|
| 235 |
}
|
| 236 |
|
| 237 |
|
| 238 |
+
def predict_disease_llm(biomarkers: dict[str, float], patient_context: dict) -> dict[str, Any]:
|
| 239 |
"""
|
| 240 |
Use LLM to predict most likely disease based on biomarker pattern.
|
| 241 |
Falls back to rule-based if LLM fails.
|
| 242 |
"""
|
| 243 |
try:
|
| 244 |
llm = get_chat_model(temperature=0.0)
|
| 245 |
+
|
| 246 |
prompt = f"""You are a medical AI assistant. Based on these biomarker values,
|
| 247 |
predict the most likely disease from: Diabetes, Anemia, Heart Disease, Thrombocytopenia, Thalassemia.
|
| 248 |
|
|
|
|
| 265 |
}}
|
| 266 |
}}
|
| 267 |
"""
|
| 268 |
+
|
| 269 |
response = llm.invoke(prompt)
|
| 270 |
content = response.content.strip()
|
| 271 |
+
|
| 272 |
prediction = _parse_llm_json(content)
|
| 273 |
+
|
| 274 |
# Validate required fields
|
| 275 |
if "disease" in prediction and "confidence" in prediction and "probabilities" in prediction:
|
| 276 |
return prediction
|
| 277 |
else:
|
| 278 |
raise ValueError("Invalid prediction format")
|
| 279 |
+
|
| 280 |
except Exception as e:
|
| 281 |
print(f"⚠️ LLM prediction failed ({e}), using rule-based fallback")
|
| 282 |
import traceback
|
|
|
|
| 288 |
# Component 3: Conversational Formatter
|
| 289 |
# ============================================================================
|
| 290 |
|
| 291 |
+
def _coerce_to_dict(obj) -> dict:
|
| 292 |
"""Convert a Pydantic model or arbitrary object to a plain dict."""
|
| 293 |
if isinstance(obj, dict):
|
| 294 |
return obj
|
|
|
|
| 299 |
return {}
|
| 300 |
|
| 301 |
|
| 302 |
+
def format_conversational(result: dict[str, Any], user_name: str = "there") -> str:
|
| 303 |
"""
|
| 304 |
Format technical JSON output into conversational response.
|
| 305 |
"""
|
|
|
|
| 313 |
confidence = result.get("confidence_assessment", {}) or {}
|
| 314 |
# Normalize: items may be Pydantic SafetyAlert objects or plain dicts
|
| 315 |
alerts = [_coerce_to_dict(a) for a in (result.get("safety_alerts") or [])]
|
| 316 |
+
|
| 317 |
disease = prediction.get("primary_disease", "Unknown")
|
| 318 |
conf_score = prediction.get("confidence", 0.0)
|
| 319 |
+
|
| 320 |
# Build conversational response
|
| 321 |
response = []
|
| 322 |
+
|
| 323 |
# 1. Greeting and main finding
|
| 324 |
response.append(f"Hi {user_name}! 👋\n")
|
| 325 |
+
response.append("Based on your biomarkers, I analyzed your results.\n")
|
| 326 |
+
|
| 327 |
# 2. Primary diagnosis with confidence
|
| 328 |
emoji = "🔴" if conf_score >= 0.8 else "🟡" if conf_score >= 0.6 else "🟢"
|
| 329 |
response.append(f"{emoji} **Primary Finding:** {disease}")
|
| 330 |
response.append(f" Confidence: {conf_score:.0%}\n")
|
| 331 |
+
|
| 332 |
# 3. Critical safety alerts (if any)
|
| 333 |
critical_alerts = [a for a in alerts if a.get("severity") == "CRITICAL"]
|
| 334 |
if critical_alerts:
|
|
|
|
| 337 |
response.append(f" • {alert.get('biomarker', 'Unknown')}: {alert.get('message', '')}")
|
| 338 |
response.append(f" → {alert.get('action', 'Consult healthcare provider')}")
|
| 339 |
response.append("")
|
| 340 |
+
|
| 341 |
# 4. Key drivers explanation
|
| 342 |
key_drivers = prediction.get("key_drivers", [])
|
| 343 |
if key_drivers:
|
|
|
|
| 351 |
explanation = explanation[:147] + "..."
|
| 352 |
response.append(f" • **{biomarker}** ({value}): {explanation}")
|
| 353 |
response.append("")
|
| 354 |
+
|
| 355 |
# 5. What to do next (immediate actions)
|
| 356 |
immediate = recommendations.get("immediate_actions", [])
|
| 357 |
if immediate:
|
|
|
|
| 359 |
for i, action in enumerate(immediate[:3], 1):
|
| 360 |
response.append(f" {i}. {action}")
|
| 361 |
response.append("")
|
| 362 |
+
|
| 363 |
# 6. Lifestyle recommendations
|
| 364 |
lifestyle = recommendations.get("lifestyle_changes", [])
|
| 365 |
if lifestyle:
|
|
|
|
| 367 |
for i, change in enumerate(lifestyle[:3], 1):
|
| 368 |
response.append(f" {i}. {change}")
|
| 369 |
response.append("")
|
| 370 |
+
|
| 371 |
# 7. Disclaimer
|
| 372 |
response.append("ℹ️ **Important:** This is an AI-assisted analysis, NOT medical advice.")
|
| 373 |
response.append(" Please consult a healthcare professional for proper diagnosis and treatment.\n")
|
| 374 |
+
|
| 375 |
return "\n".join(response)
|
| 376 |
|
| 377 |
|
|
|
|
| 397 |
"""Run example diabetes patient case"""
|
| 398 |
print("\n📋 Running Example: Type 2 Diabetes Patient")
|
| 399 |
print(" 52-year-old male with elevated glucose and HbA1c\n")
|
| 400 |
+
|
| 401 |
example_biomarkers = {
|
| 402 |
"Glucose": 185.0,
|
| 403 |
"HbA1c": 8.2,
|
|
|
|
| 411 |
"Systolic Blood Pressure": 145,
|
| 412 |
"Diastolic Blood Pressure": 92
|
| 413 |
}
|
| 414 |
+
|
| 415 |
prediction = {
|
| 416 |
"disease": "Diabetes",
|
| 417 |
"confidence": 0.87,
|
|
|
|
| 423 |
"Thalassemia": 0.01
|
| 424 |
}
|
| 425 |
}
|
| 426 |
+
|
| 427 |
patient_input = PatientInput(
|
| 428 |
biomarkers=example_biomarkers,
|
| 429 |
model_prediction=prediction,
|
| 430 |
patient_context={"age": 52, "gender": "male", "bmi": 31.2}
|
| 431 |
)
|
| 432 |
+
|
| 433 |
print("🔄 Running analysis...\n")
|
| 434 |
result = guild.run(patient_input)
|
| 435 |
+
|
| 436 |
response = format_conversational(result.get("final_response", result), "there")
|
| 437 |
print("\n" + "="*70)
|
| 438 |
print("🤖 RAG-BOT:")
|
|
|
|
| 441 |
print("="*70 + "\n")
|
| 442 |
|
| 443 |
|
| 444 |
+
def save_report(result: dict, biomarkers: dict):
|
| 445 |
"""Save detailed JSON report to file"""
|
| 446 |
timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
|
| 447 |
|
|
|
|
| 505 |
print(" 3. Type 'help' for biomarker list")
|
| 506 |
print(" 4. Type 'quit' to exit\n")
|
| 507 |
print("="*70 + "\n")
|
| 508 |
+
|
| 509 |
# Initialize guild (one-time setup)
|
| 510 |
print("🔧 Initializing medical knowledge system...")
|
| 511 |
try:
|
|
|
|
| 518 |
print(" • Vector store exists (run: python scripts/setup_embeddings.py)")
|
| 519 |
print(" • Internet connection is available for cloud LLM")
|
| 520 |
return
|
| 521 |
+
|
| 522 |
# Main conversation loop
|
| 523 |
conversation_history = []
|
| 524 |
user_name = "there"
|
| 525 |
+
|
| 526 |
while True:
|
| 527 |
try:
|
| 528 |
# Get user input
|
| 529 |
user_input = input("You: ").strip()
|
| 530 |
+
|
| 531 |
if not user_input:
|
| 532 |
continue
|
| 533 |
+
|
| 534 |
# Handle special commands
|
| 535 |
if user_input.lower() in ['quit', 'exit', 'q']:
|
| 536 |
print("\n👋 Thank you for using MediGuard AI. Stay healthy!")
|
| 537 |
break
|
| 538 |
+
|
| 539 |
if user_input.lower() == 'help':
|
| 540 |
print_biomarker_help()
|
| 541 |
continue
|
| 542 |
+
|
| 543 |
if user_input.lower() == 'example':
|
| 544 |
run_example_case(guild)
|
| 545 |
continue
|
| 546 |
+
|
| 547 |
# Extract biomarkers from natural language
|
| 548 |
print("\n🔍 Analyzing your input...")
|
| 549 |
biomarkers, patient_context = extract_biomarkers(user_input)
|
| 550 |
+
|
| 551 |
if not biomarkers:
|
| 552 |
print("❌ I couldn't find any biomarker values in your message.")
|
| 553 |
print(" Try: 'My glucose is 140 and HbA1c is 7.5'")
|
| 554 |
print(" Or type 'help' to see all biomarkers I can analyze.\n")
|
| 555 |
continue
|
| 556 |
+
|
| 557 |
print(f"✅ Found {len(biomarkers)} biomarker(s): {', '.join(biomarkers.keys())}")
|
| 558 |
+
|
| 559 |
# Check if we have enough biomarkers (minimum 2)
|
| 560 |
if len(biomarkers) < 2:
|
| 561 |
print("⚠️ I need at least 2 biomarkers for a reliable analysis.")
|
| 562 |
print(" Can you provide more values?\n")
|
| 563 |
continue
|
| 564 |
+
|
| 565 |
# Generate disease prediction
|
| 566 |
print("🧠 Predicting likely condition...")
|
| 567 |
prediction = predict_disease_llm(biomarkers, patient_context)
|
| 568 |
print(f"✅ Predicted: {prediction['disease']} ({prediction['confidence']:.0%} confidence)")
|
| 569 |
+
|
| 570 |
# Create PatientInput
|
| 571 |
patient_input = PatientInput(
|
| 572 |
biomarkers=biomarkers,
|
| 573 |
model_prediction=prediction,
|
| 574 |
patient_context=patient_context if patient_context else {"source": "chat"}
|
| 575 |
)
|
| 576 |
+
|
| 577 |
# Run full RAG workflow
|
| 578 |
print("📚 Consulting medical knowledge base...")
|
| 579 |
print(" (This may take 15-25 seconds...)\n")
|
| 580 |
+
|
| 581 |
result = guild.run(patient_input)
|
| 582 |
+
|
| 583 |
# Format conversational response
|
| 584 |
response = format_conversational(result.get("final_response", result), user_name)
|
| 585 |
+
|
| 586 |
# Display response
|
| 587 |
print("\n" + "="*70)
|
| 588 |
print("🤖 RAG-BOT:")
|
| 589 |
print("="*70)
|
| 590 |
print(response)
|
| 591 |
print("="*70 + "\n")
|
| 592 |
+
|
| 593 |
# Save to history
|
| 594 |
conversation_history.append({
|
| 595 |
"user_input": user_input,
|
|
|
|
| 597 |
"prediction": prediction,
|
| 598 |
"result": result
|
| 599 |
})
|
| 600 |
+
|
| 601 |
# Ask if user wants to save report
|
| 602 |
save_choice = input("💾 Save detailed report to file? (y/n): ").strip().lower()
|
| 603 |
if save_choice == 'y':
|
| 604 |
save_report(result, biomarkers)
|
| 605 |
+
|
| 606 |
print("\nYou can:")
|
| 607 |
print(" • Enter more biomarkers for a new analysis")
|
| 608 |
print(" • Type 'quit' to exit\n")
|
| 609 |
+
|
| 610 |
except KeyboardInterrupt:
|
| 611 |
print("\n\n👋 Interrupted. Thank you for using MediGuard AI!")
|
| 612 |
break
|
scripts/monitor_test.py
CHANGED
|
@@ -7,6 +7,6 @@ print("=" * 70)
|
|
| 7 |
for i in range(60): # Check for 5 minutes
|
| 8 |
time.sleep(5)
|
| 9 |
print(f"[{i*5}s] Test still running...")
|
| 10 |
-
|
| 11 |
print("\nTest should be complete or nearly complete.")
|
| 12 |
print("Check terminal output for results.")
|
|
|
|
| 7 |
for i in range(60): # Check for 5 minutes
|
| 8 |
time.sleep(5)
|
| 9 |
print(f"[{i*5}s] Test still running...")
|
| 10 |
+
|
| 11 |
print("\nTest should be complete or nearly complete.")
|
| 12 |
print("Check terminal output for results.")
|
scripts/setup_embeddings.py
CHANGED
|
@@ -2,22 +2,22 @@
|
|
| 2 |
Quick script to help set up Google API key for fast embeddings
|
| 3 |
"""
|
| 4 |
|
| 5 |
-
import os
|
| 6 |
from pathlib import Path
|
| 7 |
|
|
|
|
| 8 |
def setup_google_api_key():
|
| 9 |
"""Interactive setup for Google API key"""
|
| 10 |
-
|
| 11 |
print("="*70)
|
| 12 |
print("Fast Embeddings Setup - Google Gemini API")
|
| 13 |
print("="*70)
|
| 14 |
-
|
| 15 |
print("\nWhy Google Gemini?")
|
| 16 |
print(" - 100x faster than local Ollama (2 mins vs 30+ mins)")
|
| 17 |
print(" - FREE for standard usage")
|
| 18 |
print(" - High quality embeddings")
|
| 19 |
print(" - Automatic fallback to Ollama if unavailable")
|
| 20 |
-
|
| 21 |
print("\n" + "="*70)
|
| 22 |
print("Step 1: Get Your Free API Key")
|
| 23 |
print("="*70)
|
|
@@ -26,28 +26,28 @@ def setup_google_api_key():
|
|
| 26 |
print("\n2. Sign in with Google account")
|
| 27 |
print("3. Click 'Create API Key'")
|
| 28 |
print("4. Copy the key (starts with 'AIza...')")
|
| 29 |
-
|
| 30 |
input("\nPress ENTER when you have your API key ready...")
|
| 31 |
-
|
| 32 |
api_key = input("\nPaste your Google API key here: ").strip()
|
| 33 |
-
|
| 34 |
if not api_key:
|
| 35 |
print("\nNo API key provided. Using local Ollama instead.")
|
| 36 |
return False
|
| 37 |
-
|
| 38 |
if not api_key.startswith("AIza"):
|
| 39 |
print("\nWarning: Key doesn't start with 'AIza'. Are you sure this is correct?")
|
| 40 |
confirm = input("Continue anyway? (y/n): ").strip().lower()
|
| 41 |
if confirm != 'y':
|
| 42 |
return False
|
| 43 |
-
|
| 44 |
# Update .env file
|
| 45 |
env_path = Path(".env")
|
| 46 |
-
|
| 47 |
if env_path.exists():
|
| 48 |
-
with open(env_path
|
| 49 |
lines = f.readlines()
|
| 50 |
-
|
| 51 |
# Update or add GOOGLE_API_KEY
|
| 52 |
updated = False
|
| 53 |
for i, line in enumerate(lines):
|
|
@@ -55,17 +55,17 @@ def setup_google_api_key():
|
|
| 55 |
lines[i] = f'GOOGLE_API_KEY={api_key}\n'
|
| 56 |
updated = True
|
| 57 |
break
|
| 58 |
-
|
| 59 |
if not updated:
|
| 60 |
lines.insert(0, f'GOOGLE_API_KEY={api_key}\n')
|
| 61 |
-
|
| 62 |
with open(env_path, 'w') as f:
|
| 63 |
f.writelines(lines)
|
| 64 |
else:
|
| 65 |
# Create new .env file
|
| 66 |
with open(env_path, 'w') as f:
|
| 67 |
f.write(f'GOOGLE_API_KEY={api_key}\n')
|
| 68 |
-
|
| 69 |
print("\nAPI key saved to .env file!")
|
| 70 |
print("\n" + "="*70)
|
| 71 |
print("Step 2: Build Vector Store")
|
|
@@ -74,7 +74,7 @@ def setup_google_api_key():
|
|
| 74 |
print(" python src/pdf_processor.py")
|
| 75 |
print("\nChoose option 1 (Google Gemini) when prompted.")
|
| 76 |
print("\n" + "="*70)
|
| 77 |
-
|
| 78 |
return True
|
| 79 |
|
| 80 |
|
|
|
|
| 2 |
Quick script to help set up Google API key for fast embeddings
|
| 3 |
"""
|
| 4 |
|
|
|
|
| 5 |
from pathlib import Path
|
| 6 |
|
| 7 |
+
|
| 8 |
def setup_google_api_key():
|
| 9 |
"""Interactive setup for Google API key"""
|
| 10 |
+
|
| 11 |
print("="*70)
|
| 12 |
print("Fast Embeddings Setup - Google Gemini API")
|
| 13 |
print("="*70)
|
| 14 |
+
|
| 15 |
print("\nWhy Google Gemini?")
|
| 16 |
print(" - 100x faster than local Ollama (2 mins vs 30+ mins)")
|
| 17 |
print(" - FREE for standard usage")
|
| 18 |
print(" - High quality embeddings")
|
| 19 |
print(" - Automatic fallback to Ollama if unavailable")
|
| 20 |
+
|
| 21 |
print("\n" + "="*70)
|
| 22 |
print("Step 1: Get Your Free API Key")
|
| 23 |
print("="*70)
|
|
|
|
| 26 |
print("\n2. Sign in with Google account")
|
| 27 |
print("3. Click 'Create API Key'")
|
| 28 |
print("4. Copy the key (starts with 'AIza...')")
|
| 29 |
+
|
| 30 |
input("\nPress ENTER when you have your API key ready...")
|
| 31 |
+
|
| 32 |
api_key = input("\nPaste your Google API key here: ").strip()
|
| 33 |
+
|
| 34 |
if not api_key:
|
| 35 |
print("\nNo API key provided. Using local Ollama instead.")
|
| 36 |
return False
|
| 37 |
+
|
| 38 |
if not api_key.startswith("AIza"):
|
| 39 |
print("\nWarning: Key doesn't start with 'AIza'. Are you sure this is correct?")
|
| 40 |
confirm = input("Continue anyway? (y/n): ").strip().lower()
|
| 41 |
if confirm != 'y':
|
| 42 |
return False
|
| 43 |
+
|
| 44 |
# Update .env file
|
| 45 |
env_path = Path(".env")
|
| 46 |
+
|
| 47 |
if env_path.exists():
|
| 48 |
+
with open(env_path) as f:
|
| 49 |
lines = f.readlines()
|
| 50 |
+
|
| 51 |
# Update or add GOOGLE_API_KEY
|
| 52 |
updated = False
|
| 53 |
for i, line in enumerate(lines):
|
|
|
|
| 55 |
lines[i] = f'GOOGLE_API_KEY={api_key}\n'
|
| 56 |
updated = True
|
| 57 |
break
|
| 58 |
+
|
| 59 |
if not updated:
|
| 60 |
lines.insert(0, f'GOOGLE_API_KEY={api_key}\n')
|
| 61 |
+
|
| 62 |
with open(env_path, 'w') as f:
|
| 63 |
f.writelines(lines)
|
| 64 |
else:
|
| 65 |
# Create new .env file
|
| 66 |
with open(env_path, 'w') as f:
|
| 67 |
f.write(f'GOOGLE_API_KEY={api_key}\n')
|
| 68 |
+
|
| 69 |
print("\nAPI key saved to .env file!")
|
| 70 |
print("\n" + "="*70)
|
| 71 |
print("Step 2: Build Vector Store")
|
|
|
|
| 74 |
print(" python src/pdf_processor.py")
|
| 75 |
print("\nChoose option 1 (Google Gemini) when prompted.")
|
| 76 |
print("\n" + "="*70)
|
| 77 |
+
|
| 78 |
return True
|
| 79 |
|
| 80 |
|
scripts/test_chat_demo.py
CHANGED
|
@@ -4,7 +4,6 @@ Quick demo script to test the chatbot with pre-defined inputs
|
|
| 4 |
|
| 5 |
import subprocess
|
| 6 |
import sys
|
| 7 |
-
from pathlib import Path
|
| 8 |
|
| 9 |
# Test inputs
|
| 10 |
test_cases = [
|
|
@@ -36,16 +35,16 @@ try:
|
|
| 36 |
encoding='utf-8',
|
| 37 |
errors='replace'
|
| 38 |
)
|
| 39 |
-
|
| 40 |
print("STDOUT:")
|
| 41 |
print(result.stdout)
|
| 42 |
-
|
| 43 |
if result.stderr:
|
| 44 |
print("\nSTDERR:")
|
| 45 |
print(result.stderr)
|
| 46 |
-
|
| 47 |
print(f"\nExit code: {result.returncode}")
|
| 48 |
-
|
| 49 |
except subprocess.TimeoutExpired:
|
| 50 |
print("⚠️ Test timed out after 120 seconds")
|
| 51 |
except Exception as e:
|
|
|
|
| 4 |
|
| 5 |
import subprocess
|
| 6 |
import sys
|
|
|
|
| 7 |
|
| 8 |
# Test inputs
|
| 9 |
test_cases = [
|
|
|
|
| 35 |
encoding='utf-8',
|
| 36 |
errors='replace'
|
| 37 |
)
|
| 38 |
+
|
| 39 |
print("STDOUT:")
|
| 40 |
print(result.stdout)
|
| 41 |
+
|
| 42 |
if result.stderr:
|
| 43 |
print("\nSTDERR:")
|
| 44 |
print(result.stderr)
|
| 45 |
+
|
| 46 |
print(f"\nExit code: {result.returncode}")
|
| 47 |
+
|
| 48 |
except subprocess.TimeoutExpired:
|
| 49 |
print("⚠️ Test timed out after 120 seconds")
|
| 50 |
except Exception as e:
|
scripts/test_extraction.py
CHANGED
|
@@ -4,6 +4,7 @@ Quick test to verify biomarker extraction is working
|
|
| 4 |
|
| 5 |
import sys
|
| 6 |
from pathlib import Path
|
|
|
|
| 7 |
sys.path.insert(0, str(Path(__file__).parent.parent))
|
| 8 |
|
| 9 |
from scripts.chat import extract_biomarkers, predict_disease_llm
|
|
@@ -22,25 +23,25 @@ print("="*70)
|
|
| 22 |
for i, test_input in enumerate(test_inputs, 1):
|
| 23 |
print(f"\n[Test {i}] Input: '{test_input}'")
|
| 24 |
print("-"*70)
|
| 25 |
-
|
| 26 |
biomarkers, context = extract_biomarkers(test_input)
|
| 27 |
-
|
| 28 |
if biomarkers:
|
| 29 |
print(f"✅ SUCCESS: Found {len(biomarkers)} biomarkers")
|
| 30 |
for name, value in biomarkers.items():
|
| 31 |
print(f" - {name}: {value}")
|
| 32 |
-
|
| 33 |
if context:
|
| 34 |
print(f" Context: {context}")
|
| 35 |
-
|
| 36 |
# Test prediction
|
| 37 |
print("\n Testing prediction...")
|
| 38 |
prediction = predict_disease_llm(biomarkers, context)
|
| 39 |
print(f" Predicted: {prediction['disease']} ({prediction['confidence']:.0%})")
|
| 40 |
-
|
| 41 |
else:
|
| 42 |
-
print(
|
| 43 |
-
|
| 44 |
print()
|
| 45 |
|
| 46 |
print("="*70)
|
|
|
|
| 4 |
|
| 5 |
import sys
|
| 6 |
from pathlib import Path
|
| 7 |
+
|
| 8 |
sys.path.insert(0, str(Path(__file__).parent.parent))
|
| 9 |
|
| 10 |
from scripts.chat import extract_biomarkers, predict_disease_llm
|
|
|
|
| 23 |
for i, test_input in enumerate(test_inputs, 1):
|
| 24 |
print(f"\n[Test {i}] Input: '{test_input}'")
|
| 25 |
print("-"*70)
|
| 26 |
+
|
| 27 |
biomarkers, context = extract_biomarkers(test_input)
|
| 28 |
+
|
| 29 |
if biomarkers:
|
| 30 |
print(f"✅ SUCCESS: Found {len(biomarkers)} biomarkers")
|
| 31 |
for name, value in biomarkers.items():
|
| 32 |
print(f" - {name}: {value}")
|
| 33 |
+
|
| 34 |
if context:
|
| 35 |
print(f" Context: {context}")
|
| 36 |
+
|
| 37 |
# Test prediction
|
| 38 |
print("\n Testing prediction...")
|
| 39 |
prediction = predict_disease_llm(biomarkers, context)
|
| 40 |
print(f" Predicted: {prediction['disease']} ({prediction['confidence']:.0%})")
|
| 41 |
+
|
| 42 |
else:
|
| 43 |
+
print("❌ FAILED: No biomarkers extracted")
|
| 44 |
+
|
| 45 |
print()
|
| 46 |
|
| 47 |
print("="*70)
|
src/agents/biomarker_analyzer.py
CHANGED
|
@@ -3,19 +3,19 @@ MediGuard AI RAG-Helper
|
|
| 3 |
Biomarker Analyzer Agent - Validates biomarker values and flags anomalies
|
| 4 |
"""
|
| 5 |
|
| 6 |
-
|
| 7 |
-
from src.state import GuildState, AgentOutput, BiomarkerFlag
|
| 8 |
from src.biomarker_validator import BiomarkerValidator
|
| 9 |
from src.llm_config import llm_config
|
|
|
|
| 10 |
|
| 11 |
|
| 12 |
class BiomarkerAnalyzerAgent:
|
| 13 |
"""Agent that validates biomarker values and generates comprehensive analysis"""
|
| 14 |
-
|
| 15 |
def __init__(self):
|
| 16 |
self.validator = BiomarkerValidator()
|
| 17 |
self.llm = llm_config.analyzer
|
| 18 |
-
|
| 19 |
def analyze(self, state: GuildState) -> GuildState:
|
| 20 |
"""
|
| 21 |
Main agent function to analyze biomarkers.
|
|
@@ -29,12 +29,12 @@ class BiomarkerAnalyzerAgent:
|
|
| 29 |
print("\n" + "="*70)
|
| 30 |
print("EXECUTING: Biomarker Analyzer Agent")
|
| 31 |
print("="*70)
|
| 32 |
-
|
| 33 |
biomarkers = state['patient_biomarkers']
|
| 34 |
patient_context = state.get('patient_context', {})
|
| 35 |
gender = patient_context.get('gender') # None if not provided — uses non-gender-specific ranges
|
| 36 |
predicted_disease = state['model_prediction']['disease']
|
| 37 |
-
|
| 38 |
# Validate all biomarkers
|
| 39 |
print(f"\nValidating {len(biomarkers)} biomarkers...")
|
| 40 |
flags, alerts = self.validator.validate_all(
|
|
@@ -42,13 +42,13 @@ class BiomarkerAnalyzerAgent:
|
|
| 42 |
gender=gender,
|
| 43 |
threshold_pct=state['sop'].biomarker_analyzer_threshold
|
| 44 |
)
|
| 45 |
-
|
| 46 |
# Get disease-relevant biomarkers
|
| 47 |
relevant_biomarkers = self.validator.get_disease_relevant_biomarkers(predicted_disease)
|
| 48 |
-
|
| 49 |
# Generate summary using LLM
|
| 50 |
summary = self._generate_summary(biomarkers, flags, alerts, relevant_biomarkers, predicted_disease)
|
| 51 |
-
|
| 52 |
findings = {
|
| 53 |
"biomarker_flags": [flag.model_dump() for flag in flags],
|
| 54 |
"safety_alerts": [alert.model_dump() for alert in alerts],
|
|
@@ -62,35 +62,35 @@ class BiomarkerAnalyzerAgent:
|
|
| 62 |
agent_name="Biomarker Analyzer",
|
| 63 |
findings=findings
|
| 64 |
)
|
| 65 |
-
|
| 66 |
# Update state
|
| 67 |
print("\nAnalysis complete:")
|
| 68 |
print(f" - {len(flags)} biomarkers validated")
|
| 69 |
print(f" - {len([f for f in flags if f.status != 'NORMAL'])} out-of-range values")
|
| 70 |
print(f" - {len(alerts)} safety alerts generated")
|
| 71 |
print(f" - {len(relevant_biomarkers)} disease-relevant biomarkers identified")
|
| 72 |
-
|
| 73 |
return {
|
| 74 |
'agent_outputs': [output],
|
| 75 |
'biomarker_flags': flags,
|
| 76 |
'safety_alerts': alerts,
|
| 77 |
'biomarker_analysis': findings
|
| 78 |
}
|
| 79 |
-
|
| 80 |
def _generate_summary(
|
| 81 |
self,
|
| 82 |
-
biomarkers:
|
| 83 |
-
flags:
|
| 84 |
-
alerts:
|
| 85 |
-
relevant_biomarkers:
|
| 86 |
disease: str
|
| 87 |
) -> str:
|
| 88 |
"""Generate a concise summary of biomarker findings"""
|
| 89 |
-
|
| 90 |
# Count anomalies
|
| 91 |
critical = [f for f in flags if 'CRITICAL' in f.status]
|
| 92 |
high_low = [f for f in flags if f.status in ['HIGH', 'LOW']]
|
| 93 |
-
|
| 94 |
prompt = f"""You are a medical data analyst. Provide a brief, clinical summary of these biomarker results.
|
| 95 |
|
| 96 |
**Patient Context:**
|
|
@@ -115,24 +115,24 @@ Keep it concise and clinical."""
|
|
| 115 |
except Exception as e:
|
| 116 |
print(f"Warning: LLM summary generation failed: {e}")
|
| 117 |
return f"Biomarker analysis complete. {len(critical)} critical values, {len(high_low)} out-of-range values detected."
|
| 118 |
-
|
| 119 |
def _format_key_findings(self, critical, high_low, relevant):
|
| 120 |
"""Format findings for LLM prompt"""
|
| 121 |
findings = []
|
| 122 |
-
|
| 123 |
if critical:
|
| 124 |
findings.append("CRITICAL VALUES:")
|
| 125 |
for f in critical[:3]: # Top 3
|
| 126 |
findings.append(f" - {f.name}: {f.value} {f.unit} ({f.status})")
|
| 127 |
-
|
| 128 |
if high_low:
|
| 129 |
findings.append("\nOUT-OF-RANGE VALUES:")
|
| 130 |
for f in high_low[:5]: # Top 5
|
| 131 |
findings.append(f" - {f.name}: {f.value} {f.unit} ({f.status})")
|
| 132 |
-
|
| 133 |
if relevant:
|
| 134 |
findings.append(f"\nDISEASE-RELEVANT BIOMARKERS: {', '.join(relevant[:5])}")
|
| 135 |
-
|
| 136 |
return "\n".join(findings) if findings else "All biomarkers within normal range."
|
| 137 |
|
| 138 |
|
|
|
|
| 3 |
Biomarker Analyzer Agent - Validates biomarker values and flags anomalies
|
| 4 |
"""
|
| 5 |
|
| 6 |
+
|
|
|
|
| 7 |
from src.biomarker_validator import BiomarkerValidator
|
| 8 |
from src.llm_config import llm_config
|
| 9 |
+
from src.state import AgentOutput, BiomarkerFlag, GuildState
|
| 10 |
|
| 11 |
|
| 12 |
class BiomarkerAnalyzerAgent:
|
| 13 |
"""Agent that validates biomarker values and generates comprehensive analysis"""
|
| 14 |
+
|
| 15 |
def __init__(self):
|
| 16 |
self.validator = BiomarkerValidator()
|
| 17 |
self.llm = llm_config.analyzer
|
| 18 |
+
|
| 19 |
def analyze(self, state: GuildState) -> GuildState:
|
| 20 |
"""
|
| 21 |
Main agent function to analyze biomarkers.
|
|
|
|
| 29 |
print("\n" + "="*70)
|
| 30 |
print("EXECUTING: Biomarker Analyzer Agent")
|
| 31 |
print("="*70)
|
| 32 |
+
|
| 33 |
biomarkers = state['patient_biomarkers']
|
| 34 |
patient_context = state.get('patient_context', {})
|
| 35 |
gender = patient_context.get('gender') # None if not provided — uses non-gender-specific ranges
|
| 36 |
predicted_disease = state['model_prediction']['disease']
|
| 37 |
+
|
| 38 |
# Validate all biomarkers
|
| 39 |
print(f"\nValidating {len(biomarkers)} biomarkers...")
|
| 40 |
flags, alerts = self.validator.validate_all(
|
|
|
|
| 42 |
gender=gender,
|
| 43 |
threshold_pct=state['sop'].biomarker_analyzer_threshold
|
| 44 |
)
|
| 45 |
+
|
| 46 |
# Get disease-relevant biomarkers
|
| 47 |
relevant_biomarkers = self.validator.get_disease_relevant_biomarkers(predicted_disease)
|
| 48 |
+
|
| 49 |
# Generate summary using LLM
|
| 50 |
summary = self._generate_summary(biomarkers, flags, alerts, relevant_biomarkers, predicted_disease)
|
| 51 |
+
|
| 52 |
findings = {
|
| 53 |
"biomarker_flags": [flag.model_dump() for flag in flags],
|
| 54 |
"safety_alerts": [alert.model_dump() for alert in alerts],
|
|
|
|
| 62 |
agent_name="Biomarker Analyzer",
|
| 63 |
findings=findings
|
| 64 |
)
|
| 65 |
+
|
| 66 |
# Update state
|
| 67 |
print("\nAnalysis complete:")
|
| 68 |
print(f" - {len(flags)} biomarkers validated")
|
| 69 |
print(f" - {len([f for f in flags if f.status != 'NORMAL'])} out-of-range values")
|
| 70 |
print(f" - {len(alerts)} safety alerts generated")
|
| 71 |
print(f" - {len(relevant_biomarkers)} disease-relevant biomarkers identified")
|
| 72 |
+
|
| 73 |
return {
|
| 74 |
'agent_outputs': [output],
|
| 75 |
'biomarker_flags': flags,
|
| 76 |
'safety_alerts': alerts,
|
| 77 |
'biomarker_analysis': findings
|
| 78 |
}
|
| 79 |
+
|
| 80 |
def _generate_summary(
|
| 81 |
self,
|
| 82 |
+
biomarkers: dict[str, float],
|
| 83 |
+
flags: list[BiomarkerFlag],
|
| 84 |
+
alerts: list,
|
| 85 |
+
relevant_biomarkers: list[str],
|
| 86 |
disease: str
|
| 87 |
) -> str:
|
| 88 |
"""Generate a concise summary of biomarker findings"""
|
| 89 |
+
|
| 90 |
# Count anomalies
|
| 91 |
critical = [f for f in flags if 'CRITICAL' in f.status]
|
| 92 |
high_low = [f for f in flags if f.status in ['HIGH', 'LOW']]
|
| 93 |
+
|
| 94 |
prompt = f"""You are a medical data analyst. Provide a brief, clinical summary of these biomarker results.
|
| 95 |
|
| 96 |
**Patient Context:**
|
|
|
|
| 115 |
except Exception as e:
|
| 116 |
print(f"Warning: LLM summary generation failed: {e}")
|
| 117 |
return f"Biomarker analysis complete. {len(critical)} critical values, {len(high_low)} out-of-range values detected."
|
| 118 |
+
|
| 119 |
def _format_key_findings(self, critical, high_low, relevant):
|
| 120 |
"""Format findings for LLM prompt"""
|
| 121 |
findings = []
|
| 122 |
+
|
| 123 |
if critical:
|
| 124 |
findings.append("CRITICAL VALUES:")
|
| 125 |
for f in critical[:3]: # Top 3
|
| 126 |
findings.append(f" - {f.name}: {f.value} {f.unit} ({f.status})")
|
| 127 |
+
|
| 128 |
if high_low:
|
| 129 |
findings.append("\nOUT-OF-RANGE VALUES:")
|
| 130 |
for f in high_low[:5]: # Top 5
|
| 131 |
findings.append(f" - {f.name}: {f.value} {f.unit} ({f.status})")
|
| 132 |
+
|
| 133 |
if relevant:
|
| 134 |
findings.append(f"\nDISEASE-RELEVANT BIOMARKERS: {', '.join(relevant[:5])}")
|
| 135 |
+
|
| 136 |
return "\n".join(findings) if findings else "All biomarkers within normal range."
|
| 137 |
|
| 138 |
|
src/agents/biomarker_linker.py
CHANGED
|
@@ -3,15 +3,15 @@ MediGuard AI RAG-Helper
|
|
| 3 |
Biomarker-Disease Linker Agent - Connects biomarker values to predicted disease
|
| 4 |
"""
|
| 5 |
|
| 6 |
-
|
| 7 |
-
|
| 8 |
from src.llm_config import llm_config
|
| 9 |
-
from
|
| 10 |
|
| 11 |
|
| 12 |
class BiomarkerDiseaseLinkerAgent:
|
| 13 |
"""Agent that links specific biomarker values to the predicted disease"""
|
| 14 |
-
|
| 15 |
def __init__(self, retriever):
|
| 16 |
"""
|
| 17 |
Initialize with a retriever for biomarker-disease connections.
|
|
@@ -21,7 +21,7 @@ class BiomarkerDiseaseLinkerAgent:
|
|
| 21 |
"""
|
| 22 |
self.retriever = retriever
|
| 23 |
self.llm = llm_config.explainer
|
| 24 |
-
|
| 25 |
def link(self, state: GuildState) -> GuildState:
|
| 26 |
"""
|
| 27 |
Link biomarkers to disease prediction.
|
|
@@ -35,14 +35,14 @@ class BiomarkerDiseaseLinkerAgent:
|
|
| 35 |
print("\n" + "="*70)
|
| 36 |
print("EXECUTING: Biomarker-Disease Linker Agent (RAG)")
|
| 37 |
print("="*70)
|
| 38 |
-
|
| 39 |
model_prediction = state['model_prediction']
|
| 40 |
disease = model_prediction['disease']
|
| 41 |
biomarkers = state['patient_biomarkers']
|
| 42 |
-
|
| 43 |
# Get biomarker analysis from previous agent
|
| 44 |
biomarker_analysis = state.get('biomarker_analysis') or {}
|
| 45 |
-
|
| 46 |
# Identify key drivers
|
| 47 |
print(f"\nIdentifying key drivers for {disease}...")
|
| 48 |
key_drivers, citations_missing = self._identify_key_drivers(
|
|
@@ -51,9 +51,9 @@ class BiomarkerDiseaseLinkerAgent:
|
|
| 51 |
biomarker_analysis,
|
| 52 |
state
|
| 53 |
)
|
| 54 |
-
|
| 55 |
print(f"Identified {len(key_drivers)} key biomarker drivers")
|
| 56 |
-
|
| 57 |
# Create agent output
|
| 58 |
output = AgentOutput(
|
| 59 |
agent_name="Biomarker-Disease Linker",
|
|
@@ -65,45 +65,45 @@ class BiomarkerDiseaseLinkerAgent:
|
|
| 65 |
"citations_missing": citations_missing
|
| 66 |
}
|
| 67 |
)
|
| 68 |
-
|
| 69 |
# Update state
|
| 70 |
print("\nBiomarker-disease linking complete")
|
| 71 |
-
|
| 72 |
return {'agent_outputs': [output]}
|
| 73 |
-
|
| 74 |
def _identify_key_drivers(
|
| 75 |
self,
|
| 76 |
disease: str,
|
| 77 |
-
biomarkers:
|
| 78 |
analysis: dict,
|
| 79 |
state: GuildState
|
| 80 |
-
) -> tuple[
|
| 81 |
"""Identify which biomarkers are driving the disease prediction"""
|
| 82 |
-
|
| 83 |
# Get out-of-range biomarkers from analysis
|
| 84 |
flags = analysis.get('biomarker_flags', [])
|
| 85 |
abnormal_biomarkers = [
|
| 86 |
-
f for f in flags
|
| 87 |
if f['status'] != 'NORMAL'
|
| 88 |
]
|
| 89 |
-
|
| 90 |
# Get disease-relevant biomarkers
|
| 91 |
relevant = analysis.get('relevant_biomarkers', [])
|
| 92 |
-
|
| 93 |
# Focus on biomarkers that are both abnormal AND disease-relevant
|
| 94 |
key_biomarkers = [
|
| 95 |
f for f in abnormal_biomarkers
|
| 96 |
if f['name'] in relevant
|
| 97 |
]
|
| 98 |
-
|
| 99 |
# If no key biomarkers found, use top abnormal ones
|
| 100 |
if not key_biomarkers:
|
| 101 |
key_biomarkers = abnormal_biomarkers[:5]
|
| 102 |
-
|
| 103 |
print(f" Analyzing {len(key_biomarkers)} key biomarkers...")
|
| 104 |
-
|
| 105 |
# Generate key drivers with evidence
|
| 106 |
-
key_drivers:
|
| 107 |
citations_missing = False
|
| 108 |
for biomarker_flag in key_biomarkers[:5]: # Top 5
|
| 109 |
driver, driver_missing = self._create_key_driver(
|
|
@@ -115,7 +115,7 @@ class BiomarkerDiseaseLinkerAgent:
|
|
| 115 |
citations_missing = citations_missing or driver_missing
|
| 116 |
|
| 117 |
return key_drivers, citations_missing
|
| 118 |
-
|
| 119 |
def _create_key_driver(
|
| 120 |
self,
|
| 121 |
biomarker_flag: dict,
|
|
@@ -123,15 +123,15 @@ class BiomarkerDiseaseLinkerAgent:
|
|
| 123 |
state: GuildState
|
| 124 |
) -> tuple[KeyDriver, bool]:
|
| 125 |
"""Create a KeyDriver object with evidence from RAG"""
|
| 126 |
-
|
| 127 |
name = biomarker_flag['name']
|
| 128 |
value = biomarker_flag['value']
|
| 129 |
unit = biomarker_flag['unit']
|
| 130 |
status = biomarker_flag['status']
|
| 131 |
-
|
| 132 |
# Retrieve evidence linking this biomarker to the disease
|
| 133 |
query = f"How does {name} relate to {disease}? What does {status} {name} indicate?"
|
| 134 |
-
|
| 135 |
citations_missing = False
|
| 136 |
try:
|
| 137 |
docs = self.retriever.invoke(query)
|
|
@@ -147,12 +147,12 @@ class BiomarkerDiseaseLinkerAgent:
|
|
| 147 |
evidence_text = f"{status} {name} may be related to {disease}."
|
| 148 |
contribution = "Unknown"
|
| 149 |
citations_missing = True
|
| 150 |
-
|
| 151 |
# Generate explanation using LLM
|
| 152 |
explanation = self._generate_explanation(
|
| 153 |
name, value, unit, status, disease, evidence_text
|
| 154 |
)
|
| 155 |
-
|
| 156 |
driver = KeyDriver(
|
| 157 |
biomarker=name,
|
| 158 |
value=value,
|
|
@@ -162,12 +162,12 @@ class BiomarkerDiseaseLinkerAgent:
|
|
| 162 |
)
|
| 163 |
|
| 164 |
return driver, citations_missing
|
| 165 |
-
|
| 166 |
def _extract_evidence(self, docs: list, biomarker: str, disease: str) -> str:
|
| 167 |
"""Extract relevant evidence from retrieved documents"""
|
| 168 |
if not docs:
|
| 169 |
return f"Limited evidence available for {biomarker} in {disease}."
|
| 170 |
-
|
| 171 |
# Combine relevant passages
|
| 172 |
evidence = []
|
| 173 |
for doc in docs[:2]: # Top 2 docs
|
|
@@ -175,17 +175,17 @@ class BiomarkerDiseaseLinkerAgent:
|
|
| 175 |
# Extract sentences mentioning the biomarker
|
| 176 |
sentences = content.split('.')
|
| 177 |
relevant_sentences = [
|
| 178 |
-
s.strip() for s in sentences
|
| 179 |
if biomarker.lower() in s.lower() or disease.lower() in s.lower()
|
| 180 |
]
|
| 181 |
evidence.extend(relevant_sentences[:2])
|
| 182 |
-
|
| 183 |
return ". ".join(evidence[:3]) + "." if evidence else content[:300]
|
| 184 |
-
|
| 185 |
def _estimate_contribution(self, biomarker_flag: dict, doc_count: int) -> str:
|
| 186 |
"""Estimate the contribution percentage (simplified)"""
|
| 187 |
status = biomarker_flag['status']
|
| 188 |
-
|
| 189 |
# Simple heuristic based on severity
|
| 190 |
if 'CRITICAL' in status:
|
| 191 |
base = 40
|
|
@@ -193,13 +193,13 @@ class BiomarkerDiseaseLinkerAgent:
|
|
| 193 |
base = 25
|
| 194 |
else:
|
| 195 |
base = 10
|
| 196 |
-
|
| 197 |
# Adjust based on evidence strength
|
| 198 |
evidence_boost = min(doc_count * 2, 15)
|
| 199 |
-
|
| 200 |
total = min(base + evidence_boost, 60)
|
| 201 |
return f"{total}%"
|
| 202 |
-
|
| 203 |
def _generate_explanation(
|
| 204 |
self,
|
| 205 |
biomarker: str,
|
|
@@ -210,7 +210,7 @@ class BiomarkerDiseaseLinkerAgent:
|
|
| 210 |
evidence: str
|
| 211 |
) -> str:
|
| 212 |
"""Generate patient-friendly explanation"""
|
| 213 |
-
|
| 214 |
prompt = f"""Explain in 1-2 sentences how this biomarker result relates to {disease}:
|
| 215 |
|
| 216 |
Biomarker: {biomarker}
|
|
@@ -220,11 +220,11 @@ Status: {status}
|
|
| 220 |
Medical Evidence: {evidence}
|
| 221 |
|
| 222 |
Write in patient-friendly language, explaining what this means for the diagnosis."""
|
| 223 |
-
|
| 224 |
try:
|
| 225 |
response = self.llm.invoke(prompt)
|
| 226 |
return response.content.strip()
|
| 227 |
-
except Exception
|
| 228 |
return f"{biomarker} at {value} {unit} is {status}, which may be associated with {disease}."
|
| 229 |
|
| 230 |
|
|
|
|
| 3 |
Biomarker-Disease Linker Agent - Connects biomarker values to predicted disease
|
| 4 |
"""
|
| 5 |
|
| 6 |
+
|
| 7 |
+
|
| 8 |
from src.llm_config import llm_config
|
| 9 |
+
from src.state import AgentOutput, GuildState, KeyDriver
|
| 10 |
|
| 11 |
|
| 12 |
class BiomarkerDiseaseLinkerAgent:
|
| 13 |
"""Agent that links specific biomarker values to the predicted disease"""
|
| 14 |
+
|
| 15 |
def __init__(self, retriever):
|
| 16 |
"""
|
| 17 |
Initialize with a retriever for biomarker-disease connections.
|
|
|
|
| 21 |
"""
|
| 22 |
self.retriever = retriever
|
| 23 |
self.llm = llm_config.explainer
|
| 24 |
+
|
| 25 |
def link(self, state: GuildState) -> GuildState:
|
| 26 |
"""
|
| 27 |
Link biomarkers to disease prediction.
|
|
|
|
| 35 |
print("\n" + "="*70)
|
| 36 |
print("EXECUTING: Biomarker-Disease Linker Agent (RAG)")
|
| 37 |
print("="*70)
|
| 38 |
+
|
| 39 |
model_prediction = state['model_prediction']
|
| 40 |
disease = model_prediction['disease']
|
| 41 |
biomarkers = state['patient_biomarkers']
|
| 42 |
+
|
| 43 |
# Get biomarker analysis from previous agent
|
| 44 |
biomarker_analysis = state.get('biomarker_analysis') or {}
|
| 45 |
+
|
| 46 |
# Identify key drivers
|
| 47 |
print(f"\nIdentifying key drivers for {disease}...")
|
| 48 |
key_drivers, citations_missing = self._identify_key_drivers(
|
|
|
|
| 51 |
biomarker_analysis,
|
| 52 |
state
|
| 53 |
)
|
| 54 |
+
|
| 55 |
print(f"Identified {len(key_drivers)} key biomarker drivers")
|
| 56 |
+
|
| 57 |
# Create agent output
|
| 58 |
output = AgentOutput(
|
| 59 |
agent_name="Biomarker-Disease Linker",
|
|
|
|
| 65 |
"citations_missing": citations_missing
|
| 66 |
}
|
| 67 |
)
|
| 68 |
+
|
| 69 |
# Update state
|
| 70 |
print("\nBiomarker-disease linking complete")
|
| 71 |
+
|
| 72 |
return {'agent_outputs': [output]}
|
| 73 |
+
|
| 74 |
def _identify_key_drivers(
|
| 75 |
self,
|
| 76 |
disease: str,
|
| 77 |
+
biomarkers: dict[str, float],
|
| 78 |
analysis: dict,
|
| 79 |
state: GuildState
|
| 80 |
+
) -> tuple[list[KeyDriver], bool]:
|
| 81 |
"""Identify which biomarkers are driving the disease prediction"""
|
| 82 |
+
|
| 83 |
# Get out-of-range biomarkers from analysis
|
| 84 |
flags = analysis.get('biomarker_flags', [])
|
| 85 |
abnormal_biomarkers = [
|
| 86 |
+
f for f in flags
|
| 87 |
if f['status'] != 'NORMAL'
|
| 88 |
]
|
| 89 |
+
|
| 90 |
# Get disease-relevant biomarkers
|
| 91 |
relevant = analysis.get('relevant_biomarkers', [])
|
| 92 |
+
|
| 93 |
# Focus on biomarkers that are both abnormal AND disease-relevant
|
| 94 |
key_biomarkers = [
|
| 95 |
f for f in abnormal_biomarkers
|
| 96 |
if f['name'] in relevant
|
| 97 |
]
|
| 98 |
+
|
| 99 |
# If no key biomarkers found, use top abnormal ones
|
| 100 |
if not key_biomarkers:
|
| 101 |
key_biomarkers = abnormal_biomarkers[:5]
|
| 102 |
+
|
| 103 |
print(f" Analyzing {len(key_biomarkers)} key biomarkers...")
|
| 104 |
+
|
| 105 |
# Generate key drivers with evidence
|
| 106 |
+
key_drivers: list[KeyDriver] = []
|
| 107 |
citations_missing = False
|
| 108 |
for biomarker_flag in key_biomarkers[:5]: # Top 5
|
| 109 |
driver, driver_missing = self._create_key_driver(
|
|
|
|
| 115 |
citations_missing = citations_missing or driver_missing
|
| 116 |
|
| 117 |
return key_drivers, citations_missing
|
| 118 |
+
|
| 119 |
def _create_key_driver(
|
| 120 |
self,
|
| 121 |
biomarker_flag: dict,
|
|
|
|
| 123 |
state: GuildState
|
| 124 |
) -> tuple[KeyDriver, bool]:
|
| 125 |
"""Create a KeyDriver object with evidence from RAG"""
|
| 126 |
+
|
| 127 |
name = biomarker_flag['name']
|
| 128 |
value = biomarker_flag['value']
|
| 129 |
unit = biomarker_flag['unit']
|
| 130 |
status = biomarker_flag['status']
|
| 131 |
+
|
| 132 |
# Retrieve evidence linking this biomarker to the disease
|
| 133 |
query = f"How does {name} relate to {disease}? What does {status} {name} indicate?"
|
| 134 |
+
|
| 135 |
citations_missing = False
|
| 136 |
try:
|
| 137 |
docs = self.retriever.invoke(query)
|
|
|
|
| 147 |
evidence_text = f"{status} {name} may be related to {disease}."
|
| 148 |
contribution = "Unknown"
|
| 149 |
citations_missing = True
|
| 150 |
+
|
| 151 |
# Generate explanation using LLM
|
| 152 |
explanation = self._generate_explanation(
|
| 153 |
name, value, unit, status, disease, evidence_text
|
| 154 |
)
|
| 155 |
+
|
| 156 |
driver = KeyDriver(
|
| 157 |
biomarker=name,
|
| 158 |
value=value,
|
|
|
|
| 162 |
)
|
| 163 |
|
| 164 |
return driver, citations_missing
|
| 165 |
+
|
| 166 |
def _extract_evidence(self, docs: list, biomarker: str, disease: str) -> str:
|
| 167 |
"""Extract relevant evidence from retrieved documents"""
|
| 168 |
if not docs:
|
| 169 |
return f"Limited evidence available for {biomarker} in {disease}."
|
| 170 |
+
|
| 171 |
# Combine relevant passages
|
| 172 |
evidence = []
|
| 173 |
for doc in docs[:2]: # Top 2 docs
|
|
|
|
| 175 |
# Extract sentences mentioning the biomarker
|
| 176 |
sentences = content.split('.')
|
| 177 |
relevant_sentences = [
|
| 178 |
+
s.strip() for s in sentences
|
| 179 |
if biomarker.lower() in s.lower() or disease.lower() in s.lower()
|
| 180 |
]
|
| 181 |
evidence.extend(relevant_sentences[:2])
|
| 182 |
+
|
| 183 |
return ". ".join(evidence[:3]) + "." if evidence else content[:300]
|
| 184 |
+
|
| 185 |
def _estimate_contribution(self, biomarker_flag: dict, doc_count: int) -> str:
|
| 186 |
"""Estimate the contribution percentage (simplified)"""
|
| 187 |
status = biomarker_flag['status']
|
| 188 |
+
|
| 189 |
# Simple heuristic based on severity
|
| 190 |
if 'CRITICAL' in status:
|
| 191 |
base = 40
|
|
|
|
| 193 |
base = 25
|
| 194 |
else:
|
| 195 |
base = 10
|
| 196 |
+
|
| 197 |
# Adjust based on evidence strength
|
| 198 |
evidence_boost = min(doc_count * 2, 15)
|
| 199 |
+
|
| 200 |
total = min(base + evidence_boost, 60)
|
| 201 |
return f"{total}%"
|
| 202 |
+
|
| 203 |
def _generate_explanation(
|
| 204 |
self,
|
| 205 |
biomarker: str,
|
|
|
|
| 210 |
evidence: str
|
| 211 |
) -> str:
|
| 212 |
"""Generate patient-friendly explanation"""
|
| 213 |
+
|
| 214 |
prompt = f"""Explain in 1-2 sentences how this biomarker result relates to {disease}:
|
| 215 |
|
| 216 |
Biomarker: {biomarker}
|
|
|
|
| 220 |
Medical Evidence: {evidence}
|
| 221 |
|
| 222 |
Write in patient-friendly language, explaining what this means for the diagnosis."""
|
| 223 |
+
|
| 224 |
try:
|
| 225 |
response = self.llm.invoke(prompt)
|
| 226 |
return response.content.strip()
|
| 227 |
+
except Exception:
|
| 228 |
return f"{biomarker} at {value} {unit} is {status}, which may be associated with {disease}."
|
| 229 |
|
| 230 |
|
src/agents/clinical_guidelines.py
CHANGED
|
@@ -4,15 +4,16 @@ Clinical Guidelines Agent - Retrieves evidence-based recommendations
|
|
| 4 |
"""
|
| 5 |
|
| 6 |
from pathlib import Path
|
| 7 |
-
|
| 8 |
-
from src.state import GuildState, AgentOutput
|
| 9 |
-
from src.llm_config import llm_config
|
| 10 |
from langchain_core.prompts import ChatPromptTemplate
|
| 11 |
|
|
|
|
|
|
|
|
|
|
| 12 |
|
| 13 |
class ClinicalGuidelinesAgent:
|
| 14 |
"""Agent that retrieves clinical guidelines and recommendations using RAG"""
|
| 15 |
-
|
| 16 |
def __init__(self, retriever):
|
| 17 |
"""
|
| 18 |
Initialize with a retriever for clinical guidelines.
|
|
@@ -22,7 +23,7 @@ class ClinicalGuidelinesAgent:
|
|
| 22 |
"""
|
| 23 |
self.retriever = retriever
|
| 24 |
self.llm = llm_config.explainer
|
| 25 |
-
|
| 26 |
def recommend(self, state: GuildState) -> GuildState:
|
| 27 |
"""
|
| 28 |
Retrieve clinical guidelines and generate recommendations.
|
|
@@ -36,25 +37,25 @@ class ClinicalGuidelinesAgent:
|
|
| 36 |
print("\n" + "="*70)
|
| 37 |
print("EXECUTING: Clinical Guidelines Agent (RAG)")
|
| 38 |
print("="*70)
|
| 39 |
-
|
| 40 |
model_prediction = state['model_prediction']
|
| 41 |
disease = model_prediction['disease']
|
| 42 |
confidence = model_prediction['confidence']
|
| 43 |
-
|
| 44 |
# Get biomarker analysis
|
| 45 |
biomarker_analysis = state.get('biomarker_analysis') or {}
|
| 46 |
safety_alerts = biomarker_analysis.get('safety_alerts', [])
|
| 47 |
-
|
| 48 |
# Retrieve guidelines
|
| 49 |
print(f"\nRetrieving clinical guidelines for {disease}...")
|
| 50 |
-
|
| 51 |
query = f"""What are the clinical practice guidelines for managing {disease}?
|
| 52 |
Include lifestyle modifications, monitoring recommendations, and when to seek medical care."""
|
| 53 |
-
|
| 54 |
docs = self.retriever.invoke(query)
|
| 55 |
-
|
| 56 |
print(f"Retrieved {len(docs)} guideline documents")
|
| 57 |
-
|
| 58 |
# Generate recommendations
|
| 59 |
if state['sop'].require_pdf_citations and not docs:
|
| 60 |
recommendations = {
|
|
@@ -73,7 +74,7 @@ class ClinicalGuidelinesAgent:
|
|
| 73 |
confidence,
|
| 74 |
state
|
| 75 |
)
|
| 76 |
-
|
| 77 |
# Create agent output
|
| 78 |
output = AgentOutput(
|
| 79 |
agent_name="Clinical Guidelines",
|
|
@@ -87,15 +88,15 @@ class ClinicalGuidelinesAgent:
|
|
| 87 |
"citations_missing": state['sop'].require_pdf_citations and not docs
|
| 88 |
}
|
| 89 |
)
|
| 90 |
-
|
| 91 |
# Update state
|
| 92 |
print("\nRecommendations generated")
|
| 93 |
print(f" - Immediate actions: {len(recommendations['immediate_actions'])}")
|
| 94 |
print(f" - Lifestyle changes: {len(recommendations['lifestyle_changes'])}")
|
| 95 |
print(f" - Monitoring recommendations: {len(recommendations['monitoring'])}")
|
| 96 |
-
|
| 97 |
return {'agent_outputs': [output]}
|
| 98 |
-
|
| 99 |
def _generate_recommendations(
|
| 100 |
self,
|
| 101 |
disease: str,
|
|
@@ -105,20 +106,20 @@ class ClinicalGuidelinesAgent:
|
|
| 105 |
state: GuildState
|
| 106 |
) -> dict:
|
| 107 |
"""Generate structured recommendations using LLM and guidelines"""
|
| 108 |
-
|
| 109 |
# Format retrieved guidelines
|
| 110 |
guidelines_context = "\n\n---\n\n".join([
|
| 111 |
f"Source: {doc.metadata.get('source', 'Unknown')}\n\n{doc.page_content}"
|
| 112 |
for doc in docs
|
| 113 |
])
|
| 114 |
-
|
| 115 |
# Build safety context
|
| 116 |
safety_context = ""
|
| 117 |
if safety_alerts:
|
| 118 |
safety_context = "\n**CRITICAL SAFETY ALERTS:**\n"
|
| 119 |
for alert in safety_alerts[:3]:
|
| 120 |
safety_context += f"- {alert.get('biomarker', 'Unknown')}: {alert.get('message', '')}\n"
|
| 121 |
-
|
| 122 |
prompt = ChatPromptTemplate.from_messages([
|
| 123 |
("system", """You are a clinical decision support system providing evidence-based recommendations.
|
| 124 |
Based on clinical practice guidelines, provide actionable recommendations for patient self-assessment.
|
|
@@ -139,9 +140,9 @@ class ClinicalGuidelinesAgent:
|
|
| 139 |
|
| 140 |
Please provide structured recommendations for patient self-assessment.""")
|
| 141 |
])
|
| 142 |
-
|
| 143 |
chain = prompt | self.llm
|
| 144 |
-
|
| 145 |
try:
|
| 146 |
response = chain.invoke({
|
| 147 |
"disease": disease,
|
|
@@ -149,18 +150,18 @@ class ClinicalGuidelinesAgent:
|
|
| 149 |
"safety_context": safety_context,
|
| 150 |
"guidelines": guidelines_context
|
| 151 |
})
|
| 152 |
-
|
| 153 |
recommendations = self._parse_recommendations(response.content)
|
| 154 |
-
|
| 155 |
except Exception as e:
|
| 156 |
print(f"Warning: LLM recommendation generation failed: {e}")
|
| 157 |
recommendations = self._get_default_recommendations(disease, safety_alerts)
|
| 158 |
-
|
| 159 |
# Add citations
|
| 160 |
recommendations['citations'] = self._extract_citations(docs)
|
| 161 |
-
|
| 162 |
return recommendations
|
| 163 |
-
|
| 164 |
def _parse_recommendations(self, content: str) -> dict:
|
| 165 |
"""Parse LLM response into structured recommendations"""
|
| 166 |
recommendations = {
|
|
@@ -168,14 +169,14 @@ class ClinicalGuidelinesAgent:
|
|
| 168 |
"lifestyle_changes": [],
|
| 169 |
"monitoring": []
|
| 170 |
}
|
| 171 |
-
|
| 172 |
current_section = None
|
| 173 |
lines = content.split('\n')
|
| 174 |
-
|
| 175 |
for line in lines:
|
| 176 |
line_stripped = line.strip()
|
| 177 |
line_upper = line_stripped.upper()
|
| 178 |
-
|
| 179 |
# Detect section headers
|
| 180 |
if 'IMMEDIATE' in line_upper or 'URGENT' in line_upper:
|
| 181 |
current_section = 'immediate_actions'
|
|
@@ -189,16 +190,16 @@ class ClinicalGuidelinesAgent:
|
|
| 189 |
cleaned = line_stripped.lstrip('•-*0123456789. ')
|
| 190 |
if cleaned and len(cleaned) > 10: # Minimum length filter
|
| 191 |
recommendations[current_section].append(cleaned)
|
| 192 |
-
|
| 193 |
# If parsing failed, create default structure
|
| 194 |
if not any(recommendations.values()):
|
| 195 |
sentences = content.split('.')
|
| 196 |
recommendations['immediate_actions'] = [s.strip() for s in sentences[:2] if s.strip()]
|
| 197 |
recommendations['lifestyle_changes'] = [s.strip() for s in sentences[2:4] if s.strip()]
|
| 198 |
recommendations['monitoring'] = [s.strip() for s in sentences[4:6] if s.strip()]
|
| 199 |
-
|
| 200 |
return recommendations
|
| 201 |
-
|
| 202 |
def _get_default_recommendations(self, disease: str, safety_alerts: list) -> dict:
|
| 203 |
"""Provide default recommendations if LLM fails"""
|
| 204 |
recommendations = {
|
|
@@ -206,7 +207,7 @@ class ClinicalGuidelinesAgent:
|
|
| 206 |
"lifestyle_changes": [],
|
| 207 |
"monitoring": []
|
| 208 |
}
|
| 209 |
-
|
| 210 |
# Add safety-based immediate actions
|
| 211 |
if safety_alerts:
|
| 212 |
recommendations['immediate_actions'].append(
|
|
@@ -219,36 +220,36 @@ class ClinicalGuidelinesAgent:
|
|
| 219 |
recommendations['immediate_actions'].append(
|
| 220 |
f"Schedule appointment with healthcare provider to discuss {disease} findings"
|
| 221 |
)
|
| 222 |
-
|
| 223 |
# Generic lifestyle changes
|
| 224 |
recommendations['lifestyle_changes'].extend([
|
| 225 |
"Follow a balanced, nutrient-rich diet as recommended by healthcare provider",
|
| 226 |
"Maintain regular physical activity appropriate for your health status",
|
| 227 |
"Track symptoms and biomarker trends over time"
|
| 228 |
])
|
| 229 |
-
|
| 230 |
# Generic monitoring
|
| 231 |
recommendations['monitoring'].extend([
|
| 232 |
f"Regular monitoring of {disease}-related biomarkers as advised by physician",
|
| 233 |
"Keep a health journal tracking symptoms, diet, and activities",
|
| 234 |
"Schedule follow-up appointments as recommended"
|
| 235 |
])
|
| 236 |
-
|
| 237 |
return recommendations
|
| 238 |
-
|
| 239 |
-
def _extract_citations(self, docs: list) ->
|
| 240 |
"""Extract citations from retrieved guideline documents"""
|
| 241 |
citations = []
|
| 242 |
-
|
| 243 |
for doc in docs:
|
| 244 |
source = doc.metadata.get('source', 'Unknown')
|
| 245 |
-
|
| 246 |
# Clean up source path
|
| 247 |
if '\\' in source or '/' in source:
|
| 248 |
source = Path(source).name
|
| 249 |
-
|
| 250 |
citations.append(source)
|
| 251 |
-
|
| 252 |
return list(set(citations)) # Remove duplicates
|
| 253 |
|
| 254 |
|
|
|
|
| 4 |
"""
|
| 5 |
|
| 6 |
from pathlib import Path
|
| 7 |
+
|
|
|
|
|
|
|
| 8 |
from langchain_core.prompts import ChatPromptTemplate
|
| 9 |
|
| 10 |
+
from src.llm_config import llm_config
|
| 11 |
+
from src.state import AgentOutput, GuildState
|
| 12 |
+
|
| 13 |
|
| 14 |
class ClinicalGuidelinesAgent:
|
| 15 |
"""Agent that retrieves clinical guidelines and recommendations using RAG"""
|
| 16 |
+
|
| 17 |
def __init__(self, retriever):
|
| 18 |
"""
|
| 19 |
Initialize with a retriever for clinical guidelines.
|
|
|
|
| 23 |
"""
|
| 24 |
self.retriever = retriever
|
| 25 |
self.llm = llm_config.explainer
|
| 26 |
+
|
| 27 |
def recommend(self, state: GuildState) -> GuildState:
|
| 28 |
"""
|
| 29 |
Retrieve clinical guidelines and generate recommendations.
|
|
|
|
| 37 |
print("\n" + "="*70)
|
| 38 |
print("EXECUTING: Clinical Guidelines Agent (RAG)")
|
| 39 |
print("="*70)
|
| 40 |
+
|
| 41 |
model_prediction = state['model_prediction']
|
| 42 |
disease = model_prediction['disease']
|
| 43 |
confidence = model_prediction['confidence']
|
| 44 |
+
|
| 45 |
# Get biomarker analysis
|
| 46 |
biomarker_analysis = state.get('biomarker_analysis') or {}
|
| 47 |
safety_alerts = biomarker_analysis.get('safety_alerts', [])
|
| 48 |
+
|
| 49 |
# Retrieve guidelines
|
| 50 |
print(f"\nRetrieving clinical guidelines for {disease}...")
|
| 51 |
+
|
| 52 |
query = f"""What are the clinical practice guidelines for managing {disease}?
|
| 53 |
Include lifestyle modifications, monitoring recommendations, and when to seek medical care."""
|
| 54 |
+
|
| 55 |
docs = self.retriever.invoke(query)
|
| 56 |
+
|
| 57 |
print(f"Retrieved {len(docs)} guideline documents")
|
| 58 |
+
|
| 59 |
# Generate recommendations
|
| 60 |
if state['sop'].require_pdf_citations and not docs:
|
| 61 |
recommendations = {
|
|
|
|
| 74 |
confidence,
|
| 75 |
state
|
| 76 |
)
|
| 77 |
+
|
| 78 |
# Create agent output
|
| 79 |
output = AgentOutput(
|
| 80 |
agent_name="Clinical Guidelines",
|
|
|
|
| 88 |
"citations_missing": state['sop'].require_pdf_citations and not docs
|
| 89 |
}
|
| 90 |
)
|
| 91 |
+
|
| 92 |
# Update state
|
| 93 |
print("\nRecommendations generated")
|
| 94 |
print(f" - Immediate actions: {len(recommendations['immediate_actions'])}")
|
| 95 |
print(f" - Lifestyle changes: {len(recommendations['lifestyle_changes'])}")
|
| 96 |
print(f" - Monitoring recommendations: {len(recommendations['monitoring'])}")
|
| 97 |
+
|
| 98 |
return {'agent_outputs': [output]}
|
| 99 |
+
|
| 100 |
def _generate_recommendations(
|
| 101 |
self,
|
| 102 |
disease: str,
|
|
|
|
| 106 |
state: GuildState
|
| 107 |
) -> dict:
|
| 108 |
"""Generate structured recommendations using LLM and guidelines"""
|
| 109 |
+
|
| 110 |
# Format retrieved guidelines
|
| 111 |
guidelines_context = "\n\n---\n\n".join([
|
| 112 |
f"Source: {doc.metadata.get('source', 'Unknown')}\n\n{doc.page_content}"
|
| 113 |
for doc in docs
|
| 114 |
])
|
| 115 |
+
|
| 116 |
# Build safety context
|
| 117 |
safety_context = ""
|
| 118 |
if safety_alerts:
|
| 119 |
safety_context = "\n**CRITICAL SAFETY ALERTS:**\n"
|
| 120 |
for alert in safety_alerts[:3]:
|
| 121 |
safety_context += f"- {alert.get('biomarker', 'Unknown')}: {alert.get('message', '')}\n"
|
| 122 |
+
|
| 123 |
prompt = ChatPromptTemplate.from_messages([
|
| 124 |
("system", """You are a clinical decision support system providing evidence-based recommendations.
|
| 125 |
Based on clinical practice guidelines, provide actionable recommendations for patient self-assessment.
|
|
|
|
| 140 |
|
| 141 |
Please provide structured recommendations for patient self-assessment.""")
|
| 142 |
])
|
| 143 |
+
|
| 144 |
chain = prompt | self.llm
|
| 145 |
+
|
| 146 |
try:
|
| 147 |
response = chain.invoke({
|
| 148 |
"disease": disease,
|
|
|
|
| 150 |
"safety_context": safety_context,
|
| 151 |
"guidelines": guidelines_context
|
| 152 |
})
|
| 153 |
+
|
| 154 |
recommendations = self._parse_recommendations(response.content)
|
| 155 |
+
|
| 156 |
except Exception as e:
|
| 157 |
print(f"Warning: LLM recommendation generation failed: {e}")
|
| 158 |
recommendations = self._get_default_recommendations(disease, safety_alerts)
|
| 159 |
+
|
| 160 |
# Add citations
|
| 161 |
recommendations['citations'] = self._extract_citations(docs)
|
| 162 |
+
|
| 163 |
return recommendations
|
| 164 |
+
|
| 165 |
def _parse_recommendations(self, content: str) -> dict:
|
| 166 |
"""Parse LLM response into structured recommendations"""
|
| 167 |
recommendations = {
|
|
|
|
| 169 |
"lifestyle_changes": [],
|
| 170 |
"monitoring": []
|
| 171 |
}
|
| 172 |
+
|
| 173 |
current_section = None
|
| 174 |
lines = content.split('\n')
|
| 175 |
+
|
| 176 |
for line in lines:
|
| 177 |
line_stripped = line.strip()
|
| 178 |
line_upper = line_stripped.upper()
|
| 179 |
+
|
| 180 |
# Detect section headers
|
| 181 |
if 'IMMEDIATE' in line_upper or 'URGENT' in line_upper:
|
| 182 |
current_section = 'immediate_actions'
|
|
|
|
| 190 |
cleaned = line_stripped.lstrip('•-*0123456789. ')
|
| 191 |
if cleaned and len(cleaned) > 10: # Minimum length filter
|
| 192 |
recommendations[current_section].append(cleaned)
|
| 193 |
+
|
| 194 |
# If parsing failed, create default structure
|
| 195 |
if not any(recommendations.values()):
|
| 196 |
sentences = content.split('.')
|
| 197 |
recommendations['immediate_actions'] = [s.strip() for s in sentences[:2] if s.strip()]
|
| 198 |
recommendations['lifestyle_changes'] = [s.strip() for s in sentences[2:4] if s.strip()]
|
| 199 |
recommendations['monitoring'] = [s.strip() for s in sentences[4:6] if s.strip()]
|
| 200 |
+
|
| 201 |
return recommendations
|
| 202 |
+
|
| 203 |
def _get_default_recommendations(self, disease: str, safety_alerts: list) -> dict:
|
| 204 |
"""Provide default recommendations if LLM fails"""
|
| 205 |
recommendations = {
|
|
|
|
| 207 |
"lifestyle_changes": [],
|
| 208 |
"monitoring": []
|
| 209 |
}
|
| 210 |
+
|
| 211 |
# Add safety-based immediate actions
|
| 212 |
if safety_alerts:
|
| 213 |
recommendations['immediate_actions'].append(
|
|
|
|
| 220 |
recommendations['immediate_actions'].append(
|
| 221 |
f"Schedule appointment with healthcare provider to discuss {disease} findings"
|
| 222 |
)
|
| 223 |
+
|
| 224 |
# Generic lifestyle changes
|
| 225 |
recommendations['lifestyle_changes'].extend([
|
| 226 |
"Follow a balanced, nutrient-rich diet as recommended by healthcare provider",
|
| 227 |
"Maintain regular physical activity appropriate for your health status",
|
| 228 |
"Track symptoms and biomarker trends over time"
|
| 229 |
])
|
| 230 |
+
|
| 231 |
# Generic monitoring
|
| 232 |
recommendations['monitoring'].extend([
|
| 233 |
f"Regular monitoring of {disease}-related biomarkers as advised by physician",
|
| 234 |
"Keep a health journal tracking symptoms, diet, and activities",
|
| 235 |
"Schedule follow-up appointments as recommended"
|
| 236 |
])
|
| 237 |
+
|
| 238 |
return recommendations
|
| 239 |
+
|
| 240 |
+
def _extract_citations(self, docs: list) -> list[str]:
|
| 241 |
"""Extract citations from retrieved guideline documents"""
|
| 242 |
citations = []
|
| 243 |
+
|
| 244 |
for doc in docs:
|
| 245 |
source = doc.metadata.get('source', 'Unknown')
|
| 246 |
+
|
| 247 |
# Clean up source path
|
| 248 |
if '\\' in source or '/' in source:
|
| 249 |
source = Path(source).name
|
| 250 |
+
|
| 251 |
citations.append(source)
|
| 252 |
+
|
| 253 |
return list(set(citations)) # Remove duplicates
|
| 254 |
|
| 255 |
|
src/agents/confidence_assessor.py
CHANGED
|
@@ -3,19 +3,19 @@ MediGuard AI RAG-Helper
|
|
| 3 |
Confidence Assessor Agent - Evaluates prediction reliability
|
| 4 |
"""
|
| 5 |
|
| 6 |
-
from typing import Any
|
| 7 |
-
|
| 8 |
from src.biomarker_validator import BiomarkerValidator
|
| 9 |
from src.llm_config import llm_config
|
| 10 |
-
from
|
| 11 |
|
| 12 |
|
| 13 |
class ConfidenceAssessorAgent:
|
| 14 |
"""Agent that assesses the reliability and limitations of the prediction"""
|
| 15 |
-
|
| 16 |
def __init__(self):
|
| 17 |
self.llm = llm_config.analyzer
|
| 18 |
-
|
| 19 |
def assess(self, state: GuildState) -> GuildState:
|
| 20 |
"""
|
| 21 |
Assess prediction confidence and identify limitations.
|
|
@@ -29,41 +29,41 @@ class ConfidenceAssessorAgent:
|
|
| 29 |
print("\n" + "="*70)
|
| 30 |
print("EXECUTING: Confidence Assessor Agent")
|
| 31 |
print("="*70)
|
| 32 |
-
|
| 33 |
model_prediction = state['model_prediction']
|
| 34 |
disease = model_prediction['disease']
|
| 35 |
ml_confidence = model_prediction['confidence']
|
| 36 |
probabilities = model_prediction.get('probabilities', {})
|
| 37 |
biomarkers = state['patient_biomarkers']
|
| 38 |
-
|
| 39 |
# Collect previous agent findings
|
| 40 |
biomarker_analysis = state.get('biomarker_analysis') or {}
|
| 41 |
disease_explanation = self._get_agent_findings(state, "Disease Explainer")
|
| 42 |
linker_findings = self._get_agent_findings(state, "Biomarker-Disease Linker")
|
| 43 |
-
|
| 44 |
print(f"\nAssessing confidence for {disease} prediction...")
|
| 45 |
-
|
| 46 |
# Evaluate evidence strength
|
| 47 |
evidence_strength = self._evaluate_evidence_strength(
|
| 48 |
biomarker_analysis,
|
| 49 |
disease_explanation,
|
| 50 |
linker_findings
|
| 51 |
)
|
| 52 |
-
|
| 53 |
# Identify limitations
|
| 54 |
limitations = self._identify_limitations(
|
| 55 |
biomarkers,
|
| 56 |
biomarker_analysis,
|
| 57 |
probabilities
|
| 58 |
)
|
| 59 |
-
|
| 60 |
# Calculate aggregate reliability
|
| 61 |
reliability = self._calculate_reliability(
|
| 62 |
ml_confidence,
|
| 63 |
evidence_strength,
|
| 64 |
len(limitations)
|
| 65 |
)
|
| 66 |
-
|
| 67 |
# Generate assessment summary
|
| 68 |
assessment_summary = self._generate_assessment(
|
| 69 |
disease,
|
|
@@ -72,7 +72,7 @@ class ConfidenceAssessorAgent:
|
|
| 72 |
evidence_strength,
|
| 73 |
limitations
|
| 74 |
)
|
| 75 |
-
|
| 76 |
# Create agent output
|
| 77 |
output = AgentOutput(
|
| 78 |
agent_name="Confidence Assessor",
|
|
@@ -86,22 +86,22 @@ class ConfidenceAssessorAgent:
|
|
| 86 |
"alternative_diagnoses": self._get_alternatives(probabilities)
|
| 87 |
}
|
| 88 |
)
|
| 89 |
-
|
| 90 |
# Update state
|
| 91 |
print("\nConfidence assessment complete")
|
| 92 |
print(f" - Prediction reliability: {reliability}")
|
| 93 |
print(f" - Evidence strength: {evidence_strength}")
|
| 94 |
print(f" - Limitations identified: {len(limitations)}")
|
| 95 |
-
|
| 96 |
return {'agent_outputs': [output]}
|
| 97 |
-
|
| 98 |
def _get_agent_findings(self, state: GuildState, agent_name: str) -> dict:
|
| 99 |
"""Extract findings from a specific agent"""
|
| 100 |
for output in state.get('agent_outputs', []):
|
| 101 |
if output.agent_name == agent_name:
|
| 102 |
return output.findings
|
| 103 |
return {}
|
| 104 |
-
|
| 105 |
def _evaluate_evidence_strength(
|
| 106 |
self,
|
| 107 |
biomarker_analysis: dict,
|
|
@@ -109,10 +109,10 @@ class ConfidenceAssessorAgent:
|
|
| 109 |
linker_findings: dict
|
| 110 |
) -> str:
|
| 111 |
"""Evaluate the strength of supporting evidence"""
|
| 112 |
-
|
| 113 |
score = 0
|
| 114 |
max_score = 5
|
| 115 |
-
|
| 116 |
# Check biomarker validation quality
|
| 117 |
flags = biomarker_analysis.get('biomarker_flags', [])
|
| 118 |
abnormal_count = len([f for f in flags if f.get('status') != 'NORMAL'])
|
|
@@ -120,18 +120,18 @@ class ConfidenceAssessorAgent:
|
|
| 120 |
score += 1
|
| 121 |
if abnormal_count >= 5:
|
| 122 |
score += 1
|
| 123 |
-
|
| 124 |
# Check disease explanation quality
|
| 125 |
if disease_explanation.get('retrieval_quality', 0) >= 3:
|
| 126 |
score += 1
|
| 127 |
-
|
| 128 |
# Check biomarker-disease linking
|
| 129 |
key_drivers = linker_findings.get('key_drivers', [])
|
| 130 |
if len(key_drivers) >= 2:
|
| 131 |
score += 1
|
| 132 |
if len(key_drivers) >= 4:
|
| 133 |
score += 1
|
| 134 |
-
|
| 135 |
# Map score to categorical rating
|
| 136 |
if score >= 4:
|
| 137 |
return "STRONG"
|
|
@@ -139,22 +139,22 @@ class ConfidenceAssessorAgent:
|
|
| 139 |
return "MODERATE"
|
| 140 |
else:
|
| 141 |
return "WEAK"
|
| 142 |
-
|
| 143 |
def _identify_limitations(
|
| 144 |
self,
|
| 145 |
-
biomarkers:
|
| 146 |
biomarker_analysis: dict,
|
| 147 |
-
probabilities:
|
| 148 |
-
) ->
|
| 149 |
"""Identify limitations and uncertainties"""
|
| 150 |
limitations = []
|
| 151 |
-
|
| 152 |
# Check for missing biomarkers
|
| 153 |
expected_biomarkers = BiomarkerValidator().expected_biomarker_count()
|
| 154 |
if len(biomarkers) < expected_biomarkers:
|
| 155 |
missing = expected_biomarkers - len(biomarkers)
|
| 156 |
limitations.append(f"Missing data: {missing} biomarker(s) not provided")
|
| 157 |
-
|
| 158 |
# Check for close alternative predictions
|
| 159 |
sorted_probs = sorted(probabilities.items(), key=lambda x: x[1], reverse=True)
|
| 160 |
if len(sorted_probs) >= 2:
|
|
@@ -164,7 +164,7 @@ class ConfidenceAssessorAgent:
|
|
| 164 |
limitations.append(
|
| 165 |
f"Differential diagnosis: {top2} also possible ({prob2:.1%} probability)"
|
| 166 |
)
|
| 167 |
-
|
| 168 |
# Check for normal biomarkers despite prediction
|
| 169 |
flags = biomarker_analysis.get('biomarker_flags', [])
|
| 170 |
relevant = biomarker_analysis.get('relevant_biomarkers', [])
|
|
@@ -174,18 +174,18 @@ class ConfidenceAssessorAgent:
|
|
| 174 |
]
|
| 175 |
if len(normal_relevant) >= 2:
|
| 176 |
limitations.append(
|
| 177 |
-
|
| 178 |
)
|
| 179 |
-
|
| 180 |
# Check for safety alerts (indicates complexity)
|
| 181 |
alerts = biomarker_analysis.get('safety_alerts', [])
|
| 182 |
if len(alerts) >= 2:
|
| 183 |
limitations.append(
|
| 184 |
"Multiple critical values detected; professional evaluation essential"
|
| 185 |
)
|
| 186 |
-
|
| 187 |
return limitations
|
| 188 |
-
|
| 189 |
def _calculate_reliability(
|
| 190 |
self,
|
| 191 |
ml_confidence: float,
|
|
@@ -193,9 +193,9 @@ class ConfidenceAssessorAgent:
|
|
| 193 |
limitation_count: int
|
| 194 |
) -> str:
|
| 195 |
"""Calculate overall prediction reliability"""
|
| 196 |
-
|
| 197 |
score = 0
|
| 198 |
-
|
| 199 |
# ML confidence contribution
|
| 200 |
if ml_confidence >= 0.8:
|
| 201 |
score += 3
|
|
@@ -203,7 +203,7 @@ class ConfidenceAssessorAgent:
|
|
| 203 |
score += 2
|
| 204 |
elif ml_confidence >= 0.4:
|
| 205 |
score += 1
|
| 206 |
-
|
| 207 |
# Evidence strength contribution
|
| 208 |
if evidence_strength == "STRONG":
|
| 209 |
score += 3
|
|
@@ -211,10 +211,10 @@ class ConfidenceAssessorAgent:
|
|
| 211 |
score += 2
|
| 212 |
else:
|
| 213 |
score += 1
|
| 214 |
-
|
| 215 |
# Limitation penalty
|
| 216 |
score -= min(limitation_count, 3)
|
| 217 |
-
|
| 218 |
# Map to categorical
|
| 219 |
if score >= 5:
|
| 220 |
return "HIGH"
|
|
@@ -222,17 +222,17 @@ class ConfidenceAssessorAgent:
|
|
| 222 |
return "MODERATE"
|
| 223 |
else:
|
| 224 |
return "LOW"
|
| 225 |
-
|
| 226 |
def _generate_assessment(
|
| 227 |
self,
|
| 228 |
disease: str,
|
| 229 |
ml_confidence: float,
|
| 230 |
reliability: str,
|
| 231 |
evidence_strength: str,
|
| 232 |
-
limitations:
|
| 233 |
) -> str:
|
| 234 |
"""Generate human-readable assessment summary"""
|
| 235 |
-
|
| 236 |
prompt = f"""As a medical AI assessment system, provide a brief confidence statement about this prediction:
|
| 237 |
|
| 238 |
Disease Predicted: {disease}
|
|
@@ -254,7 +254,7 @@ Be honest about uncertainty. Patient safety is paramount."""
|
|
| 254 |
except Exception as e:
|
| 255 |
print(f"Warning: Assessment generation failed: {e}")
|
| 256 |
return f"The {disease} prediction has {reliability.lower()} reliability based on available data. Professional medical evaluation is strongly recommended for accurate diagnosis."
|
| 257 |
-
|
| 258 |
def _get_recommendation(self, reliability: str) -> str:
|
| 259 |
"""Get action recommendation based on reliability"""
|
| 260 |
if reliability == "HIGH":
|
|
@@ -263,11 +263,11 @@ Be honest about uncertainty. Patient safety is paramount."""
|
|
| 263 |
return "Moderate confidence prediction. Medical consultation recommended for professional evaluation and additional testing if needed."
|
| 264 |
else:
|
| 265 |
return "Low confidence prediction. Professional medical assessment essential. Additional tests may be required for accurate diagnosis."
|
| 266 |
-
|
| 267 |
-
def _get_alternatives(self, probabilities:
|
| 268 |
"""Get alternative diagnoses to consider"""
|
| 269 |
sorted_probs = sorted(probabilities.items(), key=lambda x: x[1], reverse=True)
|
| 270 |
-
|
| 271 |
alternatives = []
|
| 272 |
for disease, prob in sorted_probs[1:4]: # Top 3 alternatives
|
| 273 |
if prob > 0.05: # Only significant alternatives
|
|
@@ -276,7 +276,7 @@ Be honest about uncertainty. Patient safety is paramount."""
|
|
| 276 |
"probability": prob,
|
| 277 |
"note": "Consider discussing with healthcare provider"
|
| 278 |
})
|
| 279 |
-
|
| 280 |
return alternatives
|
| 281 |
|
| 282 |
|
|
|
|
| 3 |
Confidence Assessor Agent - Evaluates prediction reliability
|
| 4 |
"""
|
| 5 |
|
| 6 |
+
from typing import Any
|
| 7 |
+
|
| 8 |
from src.biomarker_validator import BiomarkerValidator
|
| 9 |
from src.llm_config import llm_config
|
| 10 |
+
from src.state import AgentOutput, GuildState
|
| 11 |
|
| 12 |
|
| 13 |
class ConfidenceAssessorAgent:
|
| 14 |
"""Agent that assesses the reliability and limitations of the prediction"""
|
| 15 |
+
|
| 16 |
def __init__(self):
|
| 17 |
self.llm = llm_config.analyzer
|
| 18 |
+
|
| 19 |
def assess(self, state: GuildState) -> GuildState:
|
| 20 |
"""
|
| 21 |
Assess prediction confidence and identify limitations.
|
|
|
|
| 29 |
print("\n" + "="*70)
|
| 30 |
print("EXECUTING: Confidence Assessor Agent")
|
| 31 |
print("="*70)
|
| 32 |
+
|
| 33 |
model_prediction = state['model_prediction']
|
| 34 |
disease = model_prediction['disease']
|
| 35 |
ml_confidence = model_prediction['confidence']
|
| 36 |
probabilities = model_prediction.get('probabilities', {})
|
| 37 |
biomarkers = state['patient_biomarkers']
|
| 38 |
+
|
| 39 |
# Collect previous agent findings
|
| 40 |
biomarker_analysis = state.get('biomarker_analysis') or {}
|
| 41 |
disease_explanation = self._get_agent_findings(state, "Disease Explainer")
|
| 42 |
linker_findings = self._get_agent_findings(state, "Biomarker-Disease Linker")
|
| 43 |
+
|
| 44 |
print(f"\nAssessing confidence for {disease} prediction...")
|
| 45 |
+
|
| 46 |
# Evaluate evidence strength
|
| 47 |
evidence_strength = self._evaluate_evidence_strength(
|
| 48 |
biomarker_analysis,
|
| 49 |
disease_explanation,
|
| 50 |
linker_findings
|
| 51 |
)
|
| 52 |
+
|
| 53 |
# Identify limitations
|
| 54 |
limitations = self._identify_limitations(
|
| 55 |
biomarkers,
|
| 56 |
biomarker_analysis,
|
| 57 |
probabilities
|
| 58 |
)
|
| 59 |
+
|
| 60 |
# Calculate aggregate reliability
|
| 61 |
reliability = self._calculate_reliability(
|
| 62 |
ml_confidence,
|
| 63 |
evidence_strength,
|
| 64 |
len(limitations)
|
| 65 |
)
|
| 66 |
+
|
| 67 |
# Generate assessment summary
|
| 68 |
assessment_summary = self._generate_assessment(
|
| 69 |
disease,
|
|
|
|
| 72 |
evidence_strength,
|
| 73 |
limitations
|
| 74 |
)
|
| 75 |
+
|
| 76 |
# Create agent output
|
| 77 |
output = AgentOutput(
|
| 78 |
agent_name="Confidence Assessor",
|
|
|
|
| 86 |
"alternative_diagnoses": self._get_alternatives(probabilities)
|
| 87 |
}
|
| 88 |
)
|
| 89 |
+
|
| 90 |
# Update state
|
| 91 |
print("\nConfidence assessment complete")
|
| 92 |
print(f" - Prediction reliability: {reliability}")
|
| 93 |
print(f" - Evidence strength: {evidence_strength}")
|
| 94 |
print(f" - Limitations identified: {len(limitations)}")
|
| 95 |
+
|
| 96 |
return {'agent_outputs': [output]}
|
| 97 |
+
|
| 98 |
def _get_agent_findings(self, state: GuildState, agent_name: str) -> dict:
|
| 99 |
"""Extract findings from a specific agent"""
|
| 100 |
for output in state.get('agent_outputs', []):
|
| 101 |
if output.agent_name == agent_name:
|
| 102 |
return output.findings
|
| 103 |
return {}
|
| 104 |
+
|
| 105 |
def _evaluate_evidence_strength(
|
| 106 |
self,
|
| 107 |
biomarker_analysis: dict,
|
|
|
|
| 109 |
linker_findings: dict
|
| 110 |
) -> str:
|
| 111 |
"""Evaluate the strength of supporting evidence"""
|
| 112 |
+
|
| 113 |
score = 0
|
| 114 |
max_score = 5
|
| 115 |
+
|
| 116 |
# Check biomarker validation quality
|
| 117 |
flags = biomarker_analysis.get('biomarker_flags', [])
|
| 118 |
abnormal_count = len([f for f in flags if f.get('status') != 'NORMAL'])
|
|
|
|
| 120 |
score += 1
|
| 121 |
if abnormal_count >= 5:
|
| 122 |
score += 1
|
| 123 |
+
|
| 124 |
# Check disease explanation quality
|
| 125 |
if disease_explanation.get('retrieval_quality', 0) >= 3:
|
| 126 |
score += 1
|
| 127 |
+
|
| 128 |
# Check biomarker-disease linking
|
| 129 |
key_drivers = linker_findings.get('key_drivers', [])
|
| 130 |
if len(key_drivers) >= 2:
|
| 131 |
score += 1
|
| 132 |
if len(key_drivers) >= 4:
|
| 133 |
score += 1
|
| 134 |
+
|
| 135 |
# Map score to categorical rating
|
| 136 |
if score >= 4:
|
| 137 |
return "STRONG"
|
|
|
|
| 139 |
return "MODERATE"
|
| 140 |
else:
|
| 141 |
return "WEAK"
|
| 142 |
+
|
| 143 |
def _identify_limitations(
|
| 144 |
self,
|
| 145 |
+
biomarkers: dict[str, float],
|
| 146 |
biomarker_analysis: dict,
|
| 147 |
+
probabilities: dict[str, float]
|
| 148 |
+
) -> list[str]:
|
| 149 |
"""Identify limitations and uncertainties"""
|
| 150 |
limitations = []
|
| 151 |
+
|
| 152 |
# Check for missing biomarkers
|
| 153 |
expected_biomarkers = BiomarkerValidator().expected_biomarker_count()
|
| 154 |
if len(biomarkers) < expected_biomarkers:
|
| 155 |
missing = expected_biomarkers - len(biomarkers)
|
| 156 |
limitations.append(f"Missing data: {missing} biomarker(s) not provided")
|
| 157 |
+
|
| 158 |
# Check for close alternative predictions
|
| 159 |
sorted_probs = sorted(probabilities.items(), key=lambda x: x[1], reverse=True)
|
| 160 |
if len(sorted_probs) >= 2:
|
|
|
|
| 164 |
limitations.append(
|
| 165 |
f"Differential diagnosis: {top2} also possible ({prob2:.1%} probability)"
|
| 166 |
)
|
| 167 |
+
|
| 168 |
# Check for normal biomarkers despite prediction
|
| 169 |
flags = biomarker_analysis.get('biomarker_flags', [])
|
| 170 |
relevant = biomarker_analysis.get('relevant_biomarkers', [])
|
|
|
|
| 174 |
]
|
| 175 |
if len(normal_relevant) >= 2:
|
| 176 |
limitations.append(
|
| 177 |
+
"Some disease-relevant biomarkers are within normal range"
|
| 178 |
)
|
| 179 |
+
|
| 180 |
# Check for safety alerts (indicates complexity)
|
| 181 |
alerts = biomarker_analysis.get('safety_alerts', [])
|
| 182 |
if len(alerts) >= 2:
|
| 183 |
limitations.append(
|
| 184 |
"Multiple critical values detected; professional evaluation essential"
|
| 185 |
)
|
| 186 |
+
|
| 187 |
return limitations
|
| 188 |
+
|
| 189 |
def _calculate_reliability(
|
| 190 |
self,
|
| 191 |
ml_confidence: float,
|
|
|
|
| 193 |
limitation_count: int
|
| 194 |
) -> str:
|
| 195 |
"""Calculate overall prediction reliability"""
|
| 196 |
+
|
| 197 |
score = 0
|
| 198 |
+
|
| 199 |
# ML confidence contribution
|
| 200 |
if ml_confidence >= 0.8:
|
| 201 |
score += 3
|
|
|
|
| 203 |
score += 2
|
| 204 |
elif ml_confidence >= 0.4:
|
| 205 |
score += 1
|
| 206 |
+
|
| 207 |
# Evidence strength contribution
|
| 208 |
if evidence_strength == "STRONG":
|
| 209 |
score += 3
|
|
|
|
| 211 |
score += 2
|
| 212 |
else:
|
| 213 |
score += 1
|
| 214 |
+
|
| 215 |
# Limitation penalty
|
| 216 |
score -= min(limitation_count, 3)
|
| 217 |
+
|
| 218 |
# Map to categorical
|
| 219 |
if score >= 5:
|
| 220 |
return "HIGH"
|
|
|
|
| 222 |
return "MODERATE"
|
| 223 |
else:
|
| 224 |
return "LOW"
|
| 225 |
+
|
| 226 |
def _generate_assessment(
|
| 227 |
self,
|
| 228 |
disease: str,
|
| 229 |
ml_confidence: float,
|
| 230 |
reliability: str,
|
| 231 |
evidence_strength: str,
|
| 232 |
+
limitations: list[str]
|
| 233 |
) -> str:
|
| 234 |
"""Generate human-readable assessment summary"""
|
| 235 |
+
|
| 236 |
prompt = f"""As a medical AI assessment system, provide a brief confidence statement about this prediction:
|
| 237 |
|
| 238 |
Disease Predicted: {disease}
|
|
|
|
| 254 |
except Exception as e:
|
| 255 |
print(f"Warning: Assessment generation failed: {e}")
|
| 256 |
return f"The {disease} prediction has {reliability.lower()} reliability based on available data. Professional medical evaluation is strongly recommended for accurate diagnosis."
|
| 257 |
+
|
| 258 |
def _get_recommendation(self, reliability: str) -> str:
|
| 259 |
"""Get action recommendation based on reliability"""
|
| 260 |
if reliability == "HIGH":
|
|
|
|
| 263 |
return "Moderate confidence prediction. Medical consultation recommended for professional evaluation and additional testing if needed."
|
| 264 |
else:
|
| 265 |
return "Low confidence prediction. Professional medical assessment essential. Additional tests may be required for accurate diagnosis."
|
| 266 |
+
|
| 267 |
+
def _get_alternatives(self, probabilities: dict[str, float]) -> list[dict[str, Any]]:
|
| 268 |
"""Get alternative diagnoses to consider"""
|
| 269 |
sorted_probs = sorted(probabilities.items(), key=lambda x: x[1], reverse=True)
|
| 270 |
+
|
| 271 |
alternatives = []
|
| 272 |
for disease, prob in sorted_probs[1:4]: # Top 3 alternatives
|
| 273 |
if prob > 0.05: # Only significant alternatives
|
|
|
|
| 276 |
"probability": prob,
|
| 277 |
"note": "Consider discussing with healthcare provider"
|
| 278 |
})
|
| 279 |
+
|
| 280 |
return alternatives
|
| 281 |
|
| 282 |
|
src/agents/disease_explainer.py
CHANGED
|
@@ -4,14 +4,16 @@ Disease Explainer Agent - Retrieves disease pathophysiology from medical PDFs
|
|
| 4 |
"""
|
| 5 |
|
| 6 |
from pathlib import Path
|
| 7 |
-
|
| 8 |
-
from src.llm_config import llm_config
|
| 9 |
from langchain_core.prompts import ChatPromptTemplate
|
| 10 |
|
|
|
|
|
|
|
|
|
|
| 11 |
|
| 12 |
class DiseaseExplainerAgent:
|
| 13 |
"""Agent that retrieves and explains disease mechanisms using RAG"""
|
| 14 |
-
|
| 15 |
def __init__(self, retriever):
|
| 16 |
"""
|
| 17 |
Initialize with a retriever for medical PDFs.
|
|
@@ -21,7 +23,7 @@ class DiseaseExplainerAgent:
|
|
| 21 |
"""
|
| 22 |
self.retriever = retriever
|
| 23 |
self.llm = llm_config.explainer
|
| 24 |
-
|
| 25 |
def explain(self, state: GuildState) -> GuildState:
|
| 26 |
"""
|
| 27 |
Retrieve and explain disease pathophysiology.
|
|
@@ -35,23 +37,23 @@ class DiseaseExplainerAgent:
|
|
| 35 |
print("\n" + "="*70)
|
| 36 |
print("EXECUTING: Disease Explainer Agent (RAG)")
|
| 37 |
print("="*70)
|
| 38 |
-
|
| 39 |
model_prediction = state['model_prediction']
|
| 40 |
disease = model_prediction['disease']
|
| 41 |
confidence = model_prediction['confidence']
|
| 42 |
-
|
| 43 |
# Configure retrieval based on SOP — create a copy to avoid mutating shared retriever
|
| 44 |
retrieval_k = state['sop'].disease_explainer_k
|
| 45 |
original_search_kwargs = dict(self.retriever.search_kwargs)
|
| 46 |
self.retriever.search_kwargs = {**original_search_kwargs, 'k': retrieval_k}
|
| 47 |
-
|
| 48 |
# Retrieve relevant documents
|
| 49 |
print(f"\nRetrieving information about: {disease}")
|
| 50 |
print(f"Retrieval k={state['sop'].disease_explainer_k}")
|
| 51 |
-
|
| 52 |
query = f"""What is {disease}? Explain the pathophysiology, diagnostic criteria,
|
| 53 |
and clinical presentation. Focus on mechanisms relevant to blood biomarkers."""
|
| 54 |
-
|
| 55 |
try:
|
| 56 |
docs = self.retriever.invoke(query)
|
| 57 |
finally:
|
|
@@ -87,13 +89,13 @@ class DiseaseExplainerAgent:
|
|
| 87 |
print(" - Pathophysiology: insufficient evidence")
|
| 88 |
print(" - Citations: 0 sources")
|
| 89 |
return {'agent_outputs': [output]}
|
| 90 |
-
|
| 91 |
# Generate explanation
|
| 92 |
explanation = self._generate_explanation(disease, docs, confidence)
|
| 93 |
-
|
| 94 |
# Extract citations
|
| 95 |
citations = self._extract_citations(docs)
|
| 96 |
-
|
| 97 |
# Create agent output
|
| 98 |
output = AgentOutput(
|
| 99 |
agent_name="Disease Explainer",
|
|
@@ -109,23 +111,23 @@ class DiseaseExplainerAgent:
|
|
| 109 |
"citations_missing": False
|
| 110 |
}
|
| 111 |
)
|
| 112 |
-
|
| 113 |
# Update state
|
| 114 |
print("\nDisease explanation generated")
|
| 115 |
print(f" - Pathophysiology: {len(explanation['pathophysiology'])} chars")
|
| 116 |
print(f" - Citations: {len(citations)} sources")
|
| 117 |
-
|
| 118 |
return {'agent_outputs': [output]}
|
| 119 |
-
|
| 120 |
def _generate_explanation(self, disease: str, docs: list, confidence: float) -> dict:
|
| 121 |
"""Generate structured disease explanation using LLM and retrieved docs"""
|
| 122 |
-
|
| 123 |
# Format retrieved context
|
| 124 |
context = "\n\n---\n\n".join([
|
| 125 |
f"Source: {doc.metadata.get('source', 'Unknown')}\n\n{doc.page_content}"
|
| 126 |
for doc in docs
|
| 127 |
])
|
| 128 |
-
|
| 129 |
prompt = ChatPromptTemplate.from_messages([
|
| 130 |
("system", """You are a medical expert explaining diseases for patient self-assessment.
|
| 131 |
Based on the provided medical literature, explain the disease in clear, accessible language.
|
|
@@ -144,20 +146,20 @@ class DiseaseExplainerAgent:
|
|
| 144 |
|
| 145 |
Please provide a structured explanation.""")
|
| 146 |
])
|
| 147 |
-
|
| 148 |
chain = prompt | self.llm
|
| 149 |
-
|
| 150 |
try:
|
| 151 |
response = chain.invoke({
|
| 152 |
"disease": disease,
|
| 153 |
"confidence": confidence,
|
| 154 |
"context": context
|
| 155 |
})
|
| 156 |
-
|
| 157 |
# Parse structured response
|
| 158 |
content = response.content
|
| 159 |
explanation = self._parse_explanation(content)
|
| 160 |
-
|
| 161 |
except Exception as e:
|
| 162 |
print(f"Warning: LLM explanation generation failed: {e}")
|
| 163 |
explanation = {
|
|
@@ -166,9 +168,9 @@ class DiseaseExplainerAgent:
|
|
| 166 |
"clinical_presentation": "Clinical presentation varies by individual.",
|
| 167 |
"summary": f"{disease} detected with {confidence:.1%} confidence. Consult healthcare provider."
|
| 168 |
}
|
| 169 |
-
|
| 170 |
return explanation
|
| 171 |
-
|
| 172 |
def _parse_explanation(self, content: str) -> dict:
|
| 173 |
"""Parse LLM response into structured sections"""
|
| 174 |
sections = {
|
|
@@ -177,14 +179,14 @@ class DiseaseExplainerAgent:
|
|
| 177 |
"clinical_presentation": "",
|
| 178 |
"summary": ""
|
| 179 |
}
|
| 180 |
-
|
| 181 |
# Simple parsing logic
|
| 182 |
current_section = None
|
| 183 |
lines = content.split('\n')
|
| 184 |
-
|
| 185 |
for line in lines:
|
| 186 |
line_upper = line.upper().strip()
|
| 187 |
-
|
| 188 |
if 'PATHOPHYSIOLOGY' in line_upper:
|
| 189 |
current_section = 'pathophysiology'
|
| 190 |
elif 'DIAGNOSTIC' in line_upper:
|
|
@@ -195,31 +197,31 @@ class DiseaseExplainerAgent:
|
|
| 195 |
current_section = 'summary'
|
| 196 |
elif current_section and line.strip():
|
| 197 |
sections[current_section] += line + "\n"
|
| 198 |
-
|
| 199 |
# If parsing failed, use full content as summary
|
| 200 |
if not any(sections.values()):
|
| 201 |
sections['summary'] = content[:500]
|
| 202 |
-
|
| 203 |
return sections
|
| 204 |
-
|
| 205 |
def _extract_citations(self, docs: list) -> list:
|
| 206 |
"""Extract citations from retrieved documents"""
|
| 207 |
citations = []
|
| 208 |
-
|
| 209 |
for doc in docs:
|
| 210 |
source = doc.metadata.get('source', 'Unknown')
|
| 211 |
page = doc.metadata.get('page', 'N/A')
|
| 212 |
-
|
| 213 |
# Clean up source path
|
| 214 |
if '\\' in source or '/' in source:
|
| 215 |
source = Path(source).name
|
| 216 |
-
|
| 217 |
citation = f"{source}"
|
| 218 |
if page != 'N/A':
|
| 219 |
citation += f" (Page {page})"
|
| 220 |
-
|
| 221 |
citations.append(citation)
|
| 222 |
-
|
| 223 |
return citations
|
| 224 |
|
| 225 |
|
|
|
|
| 4 |
"""
|
| 5 |
|
| 6 |
from pathlib import Path
|
| 7 |
+
|
|
|
|
| 8 |
from langchain_core.prompts import ChatPromptTemplate
|
| 9 |
|
| 10 |
+
from src.llm_config import llm_config
|
| 11 |
+
from src.state import AgentOutput, GuildState
|
| 12 |
+
|
| 13 |
|
| 14 |
class DiseaseExplainerAgent:
|
| 15 |
"""Agent that retrieves and explains disease mechanisms using RAG"""
|
| 16 |
+
|
| 17 |
def __init__(self, retriever):
|
| 18 |
"""
|
| 19 |
Initialize with a retriever for medical PDFs.
|
|
|
|
| 23 |
"""
|
| 24 |
self.retriever = retriever
|
| 25 |
self.llm = llm_config.explainer
|
| 26 |
+
|
| 27 |
def explain(self, state: GuildState) -> GuildState:
|
| 28 |
"""
|
| 29 |
Retrieve and explain disease pathophysiology.
|
|
|
|
| 37 |
print("\n" + "="*70)
|
| 38 |
print("EXECUTING: Disease Explainer Agent (RAG)")
|
| 39 |
print("="*70)
|
| 40 |
+
|
| 41 |
model_prediction = state['model_prediction']
|
| 42 |
disease = model_prediction['disease']
|
| 43 |
confidence = model_prediction['confidence']
|
| 44 |
+
|
| 45 |
# Configure retrieval based on SOP — create a copy to avoid mutating shared retriever
|
| 46 |
retrieval_k = state['sop'].disease_explainer_k
|
| 47 |
original_search_kwargs = dict(self.retriever.search_kwargs)
|
| 48 |
self.retriever.search_kwargs = {**original_search_kwargs, 'k': retrieval_k}
|
| 49 |
+
|
| 50 |
# Retrieve relevant documents
|
| 51 |
print(f"\nRetrieving information about: {disease}")
|
| 52 |
print(f"Retrieval k={state['sop'].disease_explainer_k}")
|
| 53 |
+
|
| 54 |
query = f"""What is {disease}? Explain the pathophysiology, diagnostic criteria,
|
| 55 |
and clinical presentation. Focus on mechanisms relevant to blood biomarkers."""
|
| 56 |
+
|
| 57 |
try:
|
| 58 |
docs = self.retriever.invoke(query)
|
| 59 |
finally:
|
|
|
|
| 89 |
print(" - Pathophysiology: insufficient evidence")
|
| 90 |
print(" - Citations: 0 sources")
|
| 91 |
return {'agent_outputs': [output]}
|
| 92 |
+
|
| 93 |
# Generate explanation
|
| 94 |
explanation = self._generate_explanation(disease, docs, confidence)
|
| 95 |
+
|
| 96 |
# Extract citations
|
| 97 |
citations = self._extract_citations(docs)
|
| 98 |
+
|
| 99 |
# Create agent output
|
| 100 |
output = AgentOutput(
|
| 101 |
agent_name="Disease Explainer",
|
|
|
|
| 111 |
"citations_missing": False
|
| 112 |
}
|
| 113 |
)
|
| 114 |
+
|
| 115 |
# Update state
|
| 116 |
print("\nDisease explanation generated")
|
| 117 |
print(f" - Pathophysiology: {len(explanation['pathophysiology'])} chars")
|
| 118 |
print(f" - Citations: {len(citations)} sources")
|
| 119 |
+
|
| 120 |
return {'agent_outputs': [output]}
|
| 121 |
+
|
| 122 |
def _generate_explanation(self, disease: str, docs: list, confidence: float) -> dict:
|
| 123 |
"""Generate structured disease explanation using LLM and retrieved docs"""
|
| 124 |
+
|
| 125 |
# Format retrieved context
|
| 126 |
context = "\n\n---\n\n".join([
|
| 127 |
f"Source: {doc.metadata.get('source', 'Unknown')}\n\n{doc.page_content}"
|
| 128 |
for doc in docs
|
| 129 |
])
|
| 130 |
+
|
| 131 |
prompt = ChatPromptTemplate.from_messages([
|
| 132 |
("system", """You are a medical expert explaining diseases for patient self-assessment.
|
| 133 |
Based on the provided medical literature, explain the disease in clear, accessible language.
|
|
|
|
| 146 |
|
| 147 |
Please provide a structured explanation.""")
|
| 148 |
])
|
| 149 |
+
|
| 150 |
chain = prompt | self.llm
|
| 151 |
+
|
| 152 |
try:
|
| 153 |
response = chain.invoke({
|
| 154 |
"disease": disease,
|
| 155 |
"confidence": confidence,
|
| 156 |
"context": context
|
| 157 |
})
|
| 158 |
+
|
| 159 |
# Parse structured response
|
| 160 |
content = response.content
|
| 161 |
explanation = self._parse_explanation(content)
|
| 162 |
+
|
| 163 |
except Exception as e:
|
| 164 |
print(f"Warning: LLM explanation generation failed: {e}")
|
| 165 |
explanation = {
|
|
|
|
| 168 |
"clinical_presentation": "Clinical presentation varies by individual.",
|
| 169 |
"summary": f"{disease} detected with {confidence:.1%} confidence. Consult healthcare provider."
|
| 170 |
}
|
| 171 |
+
|
| 172 |
return explanation
|
| 173 |
+
|
| 174 |
def _parse_explanation(self, content: str) -> dict:
|
| 175 |
"""Parse LLM response into structured sections"""
|
| 176 |
sections = {
|
|
|
|
| 179 |
"clinical_presentation": "",
|
| 180 |
"summary": ""
|
| 181 |
}
|
| 182 |
+
|
| 183 |
# Simple parsing logic
|
| 184 |
current_section = None
|
| 185 |
lines = content.split('\n')
|
| 186 |
+
|
| 187 |
for line in lines:
|
| 188 |
line_upper = line.upper().strip()
|
| 189 |
+
|
| 190 |
if 'PATHOPHYSIOLOGY' in line_upper:
|
| 191 |
current_section = 'pathophysiology'
|
| 192 |
elif 'DIAGNOSTIC' in line_upper:
|
|
|
|
| 197 |
current_section = 'summary'
|
| 198 |
elif current_section and line.strip():
|
| 199 |
sections[current_section] += line + "\n"
|
| 200 |
+
|
| 201 |
# If parsing failed, use full content as summary
|
| 202 |
if not any(sections.values()):
|
| 203 |
sections['summary'] = content[:500]
|
| 204 |
+
|
| 205 |
return sections
|
| 206 |
+
|
| 207 |
def _extract_citations(self, docs: list) -> list:
|
| 208 |
"""Extract citations from retrieved documents"""
|
| 209 |
citations = []
|
| 210 |
+
|
| 211 |
for doc in docs:
|
| 212 |
source = doc.metadata.get('source', 'Unknown')
|
| 213 |
page = doc.metadata.get('page', 'N/A')
|
| 214 |
+
|
| 215 |
# Clean up source path
|
| 216 |
if '\\' in source or '/' in source:
|
| 217 |
source = Path(source).name
|
| 218 |
+
|
| 219 |
citation = f"{source}"
|
| 220 |
if page != 'N/A':
|
| 221 |
citation += f" (Page {page})"
|
| 222 |
+
|
| 223 |
citations.append(citation)
|
| 224 |
+
|
| 225 |
return citations
|
| 226 |
|
| 227 |
|
src/agents/response_synthesizer.py
CHANGED
|
@@ -3,19 +3,20 @@ MediGuard AI RAG-Helper
|
|
| 3 |
Response Synthesizer Agent - Compiles all findings into final structured JSON
|
| 4 |
"""
|
| 5 |
|
| 6 |
-
import
|
| 7 |
-
|
| 8 |
-
from src.state import GuildState
|
| 9 |
-
from src.llm_config import llm_config
|
| 10 |
from langchain_core.prompts import ChatPromptTemplate
|
| 11 |
|
|
|
|
|
|
|
|
|
|
| 12 |
|
| 13 |
class ResponseSynthesizerAgent:
|
| 14 |
"""Agent that synthesizes all specialist findings into the final response"""
|
| 15 |
-
|
| 16 |
def __init__(self):
|
| 17 |
self.llm = llm_config.get_synthesizer()
|
| 18 |
-
|
| 19 |
def synthesize(self, state: GuildState) -> GuildState:
|
| 20 |
"""
|
| 21 |
Synthesize all agent outputs into final response.
|
|
@@ -29,17 +30,17 @@ class ResponseSynthesizerAgent:
|
|
| 29 |
print("\n" + "="*70)
|
| 30 |
print("EXECUTING: Response Synthesizer Agent")
|
| 31 |
print("="*70)
|
| 32 |
-
|
| 33 |
model_prediction = state['model_prediction']
|
| 34 |
patient_biomarkers = state['patient_biomarkers']
|
| 35 |
patient_context = state.get('patient_context', {})
|
| 36 |
agent_outputs = state.get('agent_outputs', [])
|
| 37 |
-
|
| 38 |
# Collect findings from all agents
|
| 39 |
findings = self._collect_findings(agent_outputs)
|
| 40 |
-
|
| 41 |
print(f"\nSynthesizing findings from {len(agent_outputs)} specialist agents...")
|
| 42 |
-
|
| 43 |
# Build structured response
|
| 44 |
recs = self._build_recommendations(findings)
|
| 45 |
response = {
|
|
@@ -64,38 +65,38 @@ class ResponseSynthesizerAgent:
|
|
| 64 |
"alternative_diagnoses": self._build_alternative_diagnoses(findings)
|
| 65 |
}
|
| 66 |
}
|
| 67 |
-
|
| 68 |
# Generate patient-friendly summary
|
| 69 |
response["patient_summary"]["narrative"] = self._generate_narrative_summary(
|
| 70 |
model_prediction,
|
| 71 |
findings,
|
| 72 |
response
|
| 73 |
)
|
| 74 |
-
|
| 75 |
print("\nResponse synthesis complete")
|
| 76 |
-
print(
|
| 77 |
print(f" - Prediction explanation: {len(response['prediction_explanation']['key_drivers'])} key drivers")
|
| 78 |
print(f" - Recommendations: {len(response['clinical_recommendations']['immediate_actions'])} immediate actions")
|
| 79 |
print(f" - Safety alerts: {len(response['safety_alerts'])} alerts")
|
| 80 |
-
|
| 81 |
return {'final_response': response}
|
| 82 |
-
|
| 83 |
-
def _collect_findings(self, agent_outputs:
|
| 84 |
"""Organize all agent findings by agent name"""
|
| 85 |
findings = {}
|
| 86 |
for output in agent_outputs:
|
| 87 |
findings[output.agent_name] = output.findings
|
| 88 |
return findings
|
| 89 |
-
|
| 90 |
-
def _build_patient_summary(self, biomarkers:
|
| 91 |
"""Build patient summary section"""
|
| 92 |
biomarker_analysis = findings.get("Biomarker Analyzer", {})
|
| 93 |
flags = biomarker_analysis.get('biomarker_flags', [])
|
| 94 |
-
|
| 95 |
# Count biomarker statuses
|
| 96 |
critical = len([f for f in flags if 'CRITICAL' in f.get('status', '')])
|
| 97 |
abnormal = len([f for f in flags if f.get('status') != 'NORMAL'])
|
| 98 |
-
|
| 99 |
return {
|
| 100 |
"total_biomarkers_tested": len(biomarkers),
|
| 101 |
"biomarkers_in_normal_range": len(flags) - abnormal,
|
|
@@ -104,15 +105,15 @@ class ResponseSynthesizerAgent:
|
|
| 104 |
"overall_risk_profile": biomarker_analysis.get('summary', 'Assessment complete'),
|
| 105 |
"narrative": "" # Will be filled later
|
| 106 |
}
|
| 107 |
-
|
| 108 |
-
def _build_prediction_explanation(self, model_prediction:
|
| 109 |
"""Build prediction explanation section"""
|
| 110 |
disease_explanation = findings.get("Disease Explainer", {})
|
| 111 |
linker_findings = findings.get("Biomarker-Disease Linker", {})
|
| 112 |
-
|
| 113 |
disease = model_prediction['disease']
|
| 114 |
confidence = model_prediction['confidence']
|
| 115 |
-
|
| 116 |
# Get key drivers
|
| 117 |
key_drivers_raw = linker_findings.get('key_drivers', [])
|
| 118 |
key_drivers = [
|
|
@@ -125,7 +126,7 @@ class ResponseSynthesizerAgent:
|
|
| 125 |
}
|
| 126 |
for kd in key_drivers_raw
|
| 127 |
]
|
| 128 |
-
|
| 129 |
return {
|
| 130 |
"primary_disease": disease,
|
| 131 |
"confidence": confidence,
|
|
@@ -135,37 +136,37 @@ class ResponseSynthesizerAgent:
|
|
| 135 |
"pdf_references": disease_explanation.get('citations', [])
|
| 136 |
}
|
| 137 |
|
| 138 |
-
def _build_biomarker_flags(self, findings:
|
| 139 |
biomarker_analysis = findings.get("Biomarker Analyzer", {})
|
| 140 |
return biomarker_analysis.get('biomarker_flags', [])
|
| 141 |
|
| 142 |
-
def _build_key_drivers(self, findings:
|
| 143 |
linker_findings = findings.get("Biomarker-Disease Linker", {})
|
| 144 |
return linker_findings.get('key_drivers', [])
|
| 145 |
|
| 146 |
-
def _build_disease_explanation(self, findings:
|
| 147 |
disease_explanation = findings.get("Disease Explainer", {})
|
| 148 |
return {
|
| 149 |
"pathophysiology": disease_explanation.get('pathophysiology', ''),
|
| 150 |
"citations": disease_explanation.get('citations', []),
|
| 151 |
"retrieved_chunks": disease_explanation.get('retrieved_chunks')
|
| 152 |
}
|
| 153 |
-
|
| 154 |
-
def _build_recommendations(self, findings:
|
| 155 |
"""Build clinical recommendations section"""
|
| 156 |
guidelines = findings.get("Clinical Guidelines", {})
|
| 157 |
-
|
| 158 |
return {
|
| 159 |
"immediate_actions": guidelines.get('immediate_actions', []),
|
| 160 |
"lifestyle_changes": guidelines.get('lifestyle_changes', []),
|
| 161 |
"monitoring": guidelines.get('monitoring', []),
|
| 162 |
"guideline_citations": guidelines.get('guideline_citations', [])
|
| 163 |
}
|
| 164 |
-
|
| 165 |
-
def _build_confidence_assessment(self, findings:
|
| 166 |
"""Build confidence assessment section"""
|
| 167 |
assessment = findings.get("Confidence Assessor", {})
|
| 168 |
-
|
| 169 |
return {
|
| 170 |
"prediction_reliability": assessment.get('prediction_reliability', 'UNKNOWN'),
|
| 171 |
"evidence_strength": assessment.get('evidence_strength', 'UNKNOWN'),
|
|
@@ -175,19 +176,19 @@ class ResponseSynthesizerAgent:
|
|
| 175 |
"alternative_diagnoses": assessment.get('alternative_diagnoses', [])
|
| 176 |
}
|
| 177 |
|
| 178 |
-
def _build_alternative_diagnoses(self, findings:
|
| 179 |
assessment = findings.get("Confidence Assessor", {})
|
| 180 |
return assessment.get('alternative_diagnoses', [])
|
| 181 |
-
|
| 182 |
-
def _build_safety_alerts(self, findings:
|
| 183 |
"""Build safety alerts section"""
|
| 184 |
biomarker_analysis = findings.get("Biomarker Analyzer", {})
|
| 185 |
return biomarker_analysis.get('safety_alerts', [])
|
| 186 |
-
|
| 187 |
-
def _build_metadata(self, state: GuildState) ->
|
| 188 |
"""Build metadata section"""
|
| 189 |
from datetime import datetime
|
| 190 |
-
|
| 191 |
return {
|
| 192 |
"timestamp": datetime.now().isoformat(),
|
| 193 |
"system_version": "MediGuard AI RAG-Helper v1.0",
|
|
@@ -195,24 +196,24 @@ class ResponseSynthesizerAgent:
|
|
| 195 |
"agents_executed": [output.agent_name for output in state.get('agent_outputs', [])],
|
| 196 |
"disclaimer": "This is an AI-assisted analysis tool for patient self-assessment. It is NOT a substitute for professional medical advice, diagnosis, or treatment. Always consult qualified healthcare providers for medical decisions."
|
| 197 |
}
|
| 198 |
-
|
| 199 |
def _generate_narrative_summary(
|
| 200 |
self,
|
| 201 |
model_prediction,
|
| 202 |
-
findings:
|
| 203 |
-
response:
|
| 204 |
) -> str:
|
| 205 |
"""Generate a patient-friendly narrative summary using LLM"""
|
| 206 |
-
|
| 207 |
disease = model_prediction['disease']
|
| 208 |
confidence = model_prediction['confidence']
|
| 209 |
reliability = response['confidence_assessment']['prediction_reliability']
|
| 210 |
-
|
| 211 |
# Get key points
|
| 212 |
critical_count = response['patient_summary']['critical_values']
|
| 213 |
abnormal_count = response['patient_summary']['biomarkers_out_of_range']
|
| 214 |
key_drivers = response['prediction_explanation']['key_drivers']
|
| 215 |
-
|
| 216 |
prompt = ChatPromptTemplate.from_messages([
|
| 217 |
("system", """You are a medical AI assistant explaining test results to a patient.
|
| 218 |
Write a clear, compassionate 3-4 sentence summary that:
|
|
@@ -231,12 +232,12 @@ class ResponseSynthesizerAgent:
|
|
| 231 |
|
| 232 |
Write a compassionate patient summary.""")
|
| 233 |
])
|
| 234 |
-
|
| 235 |
chain = prompt | self.llm
|
| 236 |
-
|
| 237 |
try:
|
| 238 |
driver_names = [kd['biomarker'] for kd in key_drivers[:3]]
|
| 239 |
-
|
| 240 |
response_obj = chain.invoke({
|
| 241 |
"disease": disease,
|
| 242 |
"confidence": confidence,
|
|
@@ -245,9 +246,9 @@ class ResponseSynthesizerAgent:
|
|
| 245 |
"abnormal": abnormal_count,
|
| 246 |
"drivers": ", ".join(driver_names) if driver_names else "Multiple biomarkers"
|
| 247 |
})
|
| 248 |
-
|
| 249 |
return response_obj.content.strip()
|
| 250 |
-
|
| 251 |
except Exception as e:
|
| 252 |
print(f"Warning: Narrative generation failed: {e}")
|
| 253 |
return f"Your test results suggest {disease} with {confidence:.1%} confidence. {abnormal_count} biomarker(s) are out of normal range. Please consult with a healthcare provider for professional evaluation and guidance."
|
|
|
|
| 3 |
Response Synthesizer Agent - Compiles all findings into final structured JSON
|
| 4 |
"""
|
| 5 |
|
| 6 |
+
from typing import Any
|
| 7 |
+
|
|
|
|
|
|
|
| 8 |
from langchain_core.prompts import ChatPromptTemplate
|
| 9 |
|
| 10 |
+
from src.llm_config import llm_config
|
| 11 |
+
from src.state import GuildState
|
| 12 |
+
|
| 13 |
|
| 14 |
class ResponseSynthesizerAgent:
|
| 15 |
"""Agent that synthesizes all specialist findings into the final response"""
|
| 16 |
+
|
| 17 |
def __init__(self):
|
| 18 |
self.llm = llm_config.get_synthesizer()
|
| 19 |
+
|
| 20 |
def synthesize(self, state: GuildState) -> GuildState:
|
| 21 |
"""
|
| 22 |
Synthesize all agent outputs into final response.
|
|
|
|
| 30 |
print("\n" + "="*70)
|
| 31 |
print("EXECUTING: Response Synthesizer Agent")
|
| 32 |
print("="*70)
|
| 33 |
+
|
| 34 |
model_prediction = state['model_prediction']
|
| 35 |
patient_biomarkers = state['patient_biomarkers']
|
| 36 |
patient_context = state.get('patient_context', {})
|
| 37 |
agent_outputs = state.get('agent_outputs', [])
|
| 38 |
+
|
| 39 |
# Collect findings from all agents
|
| 40 |
findings = self._collect_findings(agent_outputs)
|
| 41 |
+
|
| 42 |
print(f"\nSynthesizing findings from {len(agent_outputs)} specialist agents...")
|
| 43 |
+
|
| 44 |
# Build structured response
|
| 45 |
recs = self._build_recommendations(findings)
|
| 46 |
response = {
|
|
|
|
| 65 |
"alternative_diagnoses": self._build_alternative_diagnoses(findings)
|
| 66 |
}
|
| 67 |
}
|
| 68 |
+
|
| 69 |
# Generate patient-friendly summary
|
| 70 |
response["patient_summary"]["narrative"] = self._generate_narrative_summary(
|
| 71 |
model_prediction,
|
| 72 |
findings,
|
| 73 |
response
|
| 74 |
)
|
| 75 |
+
|
| 76 |
print("\nResponse synthesis complete")
|
| 77 |
+
print(" - Patient summary: Generated")
|
| 78 |
print(f" - Prediction explanation: {len(response['prediction_explanation']['key_drivers'])} key drivers")
|
| 79 |
print(f" - Recommendations: {len(response['clinical_recommendations']['immediate_actions'])} immediate actions")
|
| 80 |
print(f" - Safety alerts: {len(response['safety_alerts'])} alerts")
|
| 81 |
+
|
| 82 |
return {'final_response': response}
|
| 83 |
+
|
| 84 |
+
def _collect_findings(self, agent_outputs: list) -> dict[str, Any]:
|
| 85 |
"""Organize all agent findings by agent name"""
|
| 86 |
findings = {}
|
| 87 |
for output in agent_outputs:
|
| 88 |
findings[output.agent_name] = output.findings
|
| 89 |
return findings
|
| 90 |
+
|
| 91 |
+
def _build_patient_summary(self, biomarkers: dict, findings: dict) -> dict:
|
| 92 |
"""Build patient summary section"""
|
| 93 |
biomarker_analysis = findings.get("Biomarker Analyzer", {})
|
| 94 |
flags = biomarker_analysis.get('biomarker_flags', [])
|
| 95 |
+
|
| 96 |
# Count biomarker statuses
|
| 97 |
critical = len([f for f in flags if 'CRITICAL' in f.get('status', '')])
|
| 98 |
abnormal = len([f for f in flags if f.get('status') != 'NORMAL'])
|
| 99 |
+
|
| 100 |
return {
|
| 101 |
"total_biomarkers_tested": len(biomarkers),
|
| 102 |
"biomarkers_in_normal_range": len(flags) - abnormal,
|
|
|
|
| 105 |
"overall_risk_profile": biomarker_analysis.get('summary', 'Assessment complete'),
|
| 106 |
"narrative": "" # Will be filled later
|
| 107 |
}
|
| 108 |
+
|
| 109 |
+
def _build_prediction_explanation(self, model_prediction: dict, findings: dict) -> dict:
|
| 110 |
"""Build prediction explanation section"""
|
| 111 |
disease_explanation = findings.get("Disease Explainer", {})
|
| 112 |
linker_findings = findings.get("Biomarker-Disease Linker", {})
|
| 113 |
+
|
| 114 |
disease = model_prediction['disease']
|
| 115 |
confidence = model_prediction['confidence']
|
| 116 |
+
|
| 117 |
# Get key drivers
|
| 118 |
key_drivers_raw = linker_findings.get('key_drivers', [])
|
| 119 |
key_drivers = [
|
|
|
|
| 126 |
}
|
| 127 |
for kd in key_drivers_raw
|
| 128 |
]
|
| 129 |
+
|
| 130 |
return {
|
| 131 |
"primary_disease": disease,
|
| 132 |
"confidence": confidence,
|
|
|
|
| 136 |
"pdf_references": disease_explanation.get('citations', [])
|
| 137 |
}
|
| 138 |
|
| 139 |
+
def _build_biomarker_flags(self, findings: dict) -> list[dict]:
|
| 140 |
biomarker_analysis = findings.get("Biomarker Analyzer", {})
|
| 141 |
return biomarker_analysis.get('biomarker_flags', [])
|
| 142 |
|
| 143 |
+
def _build_key_drivers(self, findings: dict) -> list[dict]:
|
| 144 |
linker_findings = findings.get("Biomarker-Disease Linker", {})
|
| 145 |
return linker_findings.get('key_drivers', [])
|
| 146 |
|
| 147 |
+
def _build_disease_explanation(self, findings: dict) -> dict:
|
| 148 |
disease_explanation = findings.get("Disease Explainer", {})
|
| 149 |
return {
|
| 150 |
"pathophysiology": disease_explanation.get('pathophysiology', ''),
|
| 151 |
"citations": disease_explanation.get('citations', []),
|
| 152 |
"retrieved_chunks": disease_explanation.get('retrieved_chunks')
|
| 153 |
}
|
| 154 |
+
|
| 155 |
+
def _build_recommendations(self, findings: dict) -> dict:
|
| 156 |
"""Build clinical recommendations section"""
|
| 157 |
guidelines = findings.get("Clinical Guidelines", {})
|
| 158 |
+
|
| 159 |
return {
|
| 160 |
"immediate_actions": guidelines.get('immediate_actions', []),
|
| 161 |
"lifestyle_changes": guidelines.get('lifestyle_changes', []),
|
| 162 |
"monitoring": guidelines.get('monitoring', []),
|
| 163 |
"guideline_citations": guidelines.get('guideline_citations', [])
|
| 164 |
}
|
| 165 |
+
|
| 166 |
+
def _build_confidence_assessment(self, findings: dict) -> dict:
|
| 167 |
"""Build confidence assessment section"""
|
| 168 |
assessment = findings.get("Confidence Assessor", {})
|
| 169 |
+
|
| 170 |
return {
|
| 171 |
"prediction_reliability": assessment.get('prediction_reliability', 'UNKNOWN'),
|
| 172 |
"evidence_strength": assessment.get('evidence_strength', 'UNKNOWN'),
|
|
|
|
| 176 |
"alternative_diagnoses": assessment.get('alternative_diagnoses', [])
|
| 177 |
}
|
| 178 |
|
| 179 |
+
def _build_alternative_diagnoses(self, findings: dict) -> list[dict]:
|
| 180 |
assessment = findings.get("Confidence Assessor", {})
|
| 181 |
return assessment.get('alternative_diagnoses', [])
|
| 182 |
+
|
| 183 |
+
def _build_safety_alerts(self, findings: dict) -> list[dict]:
|
| 184 |
"""Build safety alerts section"""
|
| 185 |
biomarker_analysis = findings.get("Biomarker Analyzer", {})
|
| 186 |
return biomarker_analysis.get('safety_alerts', [])
|
| 187 |
+
|
| 188 |
+
def _build_metadata(self, state: GuildState) -> dict:
|
| 189 |
"""Build metadata section"""
|
| 190 |
from datetime import datetime
|
| 191 |
+
|
| 192 |
return {
|
| 193 |
"timestamp": datetime.now().isoformat(),
|
| 194 |
"system_version": "MediGuard AI RAG-Helper v1.0",
|
|
|
|
| 196 |
"agents_executed": [output.agent_name for output in state.get('agent_outputs', [])],
|
| 197 |
"disclaimer": "This is an AI-assisted analysis tool for patient self-assessment. It is NOT a substitute for professional medical advice, diagnosis, or treatment. Always consult qualified healthcare providers for medical decisions."
|
| 198 |
}
|
| 199 |
+
|
| 200 |
def _generate_narrative_summary(
|
| 201 |
self,
|
| 202 |
model_prediction,
|
| 203 |
+
findings: dict,
|
| 204 |
+
response: dict
|
| 205 |
) -> str:
|
| 206 |
"""Generate a patient-friendly narrative summary using LLM"""
|
| 207 |
+
|
| 208 |
disease = model_prediction['disease']
|
| 209 |
confidence = model_prediction['confidence']
|
| 210 |
reliability = response['confidence_assessment']['prediction_reliability']
|
| 211 |
+
|
| 212 |
# Get key points
|
| 213 |
critical_count = response['patient_summary']['critical_values']
|
| 214 |
abnormal_count = response['patient_summary']['biomarkers_out_of_range']
|
| 215 |
key_drivers = response['prediction_explanation']['key_drivers']
|
| 216 |
+
|
| 217 |
prompt = ChatPromptTemplate.from_messages([
|
| 218 |
("system", """You are a medical AI assistant explaining test results to a patient.
|
| 219 |
Write a clear, compassionate 3-4 sentence summary that:
|
|
|
|
| 232 |
|
| 233 |
Write a compassionate patient summary.""")
|
| 234 |
])
|
| 235 |
+
|
| 236 |
chain = prompt | self.llm
|
| 237 |
+
|
| 238 |
try:
|
| 239 |
driver_names = [kd['biomarker'] for kd in key_drivers[:3]]
|
| 240 |
+
|
| 241 |
response_obj = chain.invoke({
|
| 242 |
"disease": disease,
|
| 243 |
"confidence": confidence,
|
|
|
|
| 246 |
"abnormal": abnormal_count,
|
| 247 |
"drivers": ", ".join(driver_names) if driver_names else "Multiple biomarkers"
|
| 248 |
})
|
| 249 |
+
|
| 250 |
return response_obj.content.strip()
|
| 251 |
+
|
| 252 |
except Exception as e:
|
| 253 |
print(f"Warning: Narrative generation failed: {e}")
|
| 254 |
return f"Your test results suggest {disease} with {confidence:.1%} confidence. {abnormal_count} biomarker(s) are out of normal range. Please consult with a healthcare provider for professional evaluation and guidance."
|
src/biomarker_normalization.py
CHANGED
|
@@ -3,10 +3,9 @@ MediGuard AI RAG-Helper
|
|
| 3 |
Shared biomarker normalization utilities
|
| 4 |
"""
|
| 5 |
|
| 6 |
-
from typing import Dict
|
| 7 |
|
| 8 |
# Normalization map for biomarker aliases to canonical names.
|
| 9 |
-
NORMALIZATION_MAP:
|
| 10 |
# Glucose variations
|
| 11 |
"glucose": "Glucose",
|
| 12 |
"bloodsugar": "Glucose",
|
|
|
|
| 3 |
Shared biomarker normalization utilities
|
| 4 |
"""
|
| 5 |
|
|
|
|
| 6 |
|
| 7 |
# Normalization map for biomarker aliases to canonical names.
|
| 8 |
+
NORMALIZATION_MAP: dict[str, str] = {
|
| 9 |
# Glucose variations
|
| 10 |
"glucose": "Glucose",
|
| 11 |
"bloodsugar": "Glucose",
|
src/biomarker_validator.py
CHANGED
|
@@ -5,24 +5,24 @@ Biomarker analysis and validation utilities
|
|
| 5 |
|
| 6 |
import json
|
| 7 |
from pathlib import Path
|
| 8 |
-
|
| 9 |
from src.state import BiomarkerFlag, SafetyAlert
|
| 10 |
|
| 11 |
|
| 12 |
class BiomarkerValidator:
|
| 13 |
"""Validates biomarker values against reference ranges"""
|
| 14 |
-
|
| 15 |
def __init__(self, reference_file: str = "config/biomarker_references.json"):
|
| 16 |
"""Load biomarker reference ranges from JSON file"""
|
| 17 |
ref_path = Path(__file__).parent.parent / reference_file
|
| 18 |
-
with open(ref_path
|
| 19 |
self.references = json.load(f)['biomarkers']
|
| 20 |
-
|
| 21 |
def validate_biomarker(
|
| 22 |
-
self,
|
| 23 |
-
name: str,
|
| 24 |
-
value: float,
|
| 25 |
-
gender:
|
| 26 |
threshold_pct: float = 0.0
|
| 27 |
) -> BiomarkerFlag:
|
| 28 |
"""
|
|
@@ -46,10 +46,10 @@ class BiomarkerValidator:
|
|
| 46 |
reference_range="No reference data available",
|
| 47 |
warning=f"No reference range found for {name}"
|
| 48 |
)
|
| 49 |
-
|
| 50 |
ref = self.references[name]
|
| 51 |
unit = ref['unit']
|
| 52 |
-
|
| 53 |
# Handle gender-specific ranges
|
| 54 |
if ref.get('gender_specific', False) and gender:
|
| 55 |
if gender.lower() in ['male', 'm']:
|
|
@@ -60,16 +60,16 @@ class BiomarkerValidator:
|
|
| 60 |
normal = ref['normal_range']
|
| 61 |
else:
|
| 62 |
normal = ref['normal_range']
|
| 63 |
-
|
| 64 |
min_val = normal.get('min', 0)
|
| 65 |
max_val = normal.get('max', float('inf'))
|
| 66 |
critical_low = ref.get('critical_low')
|
| 67 |
critical_high = ref.get('critical_high')
|
| 68 |
-
|
| 69 |
# Determine status
|
| 70 |
status = "NORMAL"
|
| 71 |
warning = None
|
| 72 |
-
|
| 73 |
# Check critical values first (threshold_pct does not suppress critical alerts)
|
| 74 |
if critical_low and value < critical_low:
|
| 75 |
status = "CRITICAL_LOW"
|
|
@@ -88,9 +88,9 @@ class BiomarkerValidator:
|
|
| 88 |
if deviation > threshold_pct:
|
| 89 |
status = "HIGH"
|
| 90 |
warning = f"{name} is {value} {unit}, above normal range ({min_val}-{max_val} {unit}). {ref['clinical_significance'].get('high', '')}"
|
| 91 |
-
|
| 92 |
reference_range = f"{min_val}-{max_val} {unit}"
|
| 93 |
-
|
| 94 |
return BiomarkerFlag(
|
| 95 |
name=name,
|
| 96 |
value=value,
|
|
@@ -99,13 +99,13 @@ class BiomarkerValidator:
|
|
| 99 |
reference_range=reference_range,
|
| 100 |
warning=warning
|
| 101 |
)
|
| 102 |
-
|
| 103 |
def validate_all(
|
| 104 |
self,
|
| 105 |
-
biomarkers:
|
| 106 |
-
gender:
|
| 107 |
threshold_pct: float = 0.0
|
| 108 |
-
) ->
|
| 109 |
"""
|
| 110 |
Validate all biomarker values.
|
| 111 |
|
|
@@ -119,11 +119,11 @@ class BiomarkerValidator:
|
|
| 119 |
"""
|
| 120 |
flags = []
|
| 121 |
alerts = []
|
| 122 |
-
|
| 123 |
for name, value in biomarkers.items():
|
| 124 |
flag = self.validate_biomarker(name, value, gender, threshold_pct)
|
| 125 |
flags.append(flag)
|
| 126 |
-
|
| 127 |
# Generate safety alerts for critical values
|
| 128 |
if flag.status in ["CRITICAL_LOW", "CRITICAL_HIGH"]:
|
| 129 |
alerts.append(SafetyAlert(
|
|
@@ -140,18 +140,18 @@ class BiomarkerValidator:
|
|
| 140 |
message=flag.warning or f"{name} out of normal range",
|
| 141 |
action="Consult with healthcare provider"
|
| 142 |
))
|
| 143 |
-
|
| 144 |
return flags, alerts
|
| 145 |
-
|
| 146 |
-
def get_biomarker_info(self, name: str) ->
|
| 147 |
"""Get reference information for a biomarker"""
|
| 148 |
return self.references.get(name)
|
| 149 |
|
| 150 |
def expected_biomarker_count(self) -> int:
|
| 151 |
"""Return expected number of biomarkers from reference ranges."""
|
| 152 |
return len(self.references)
|
| 153 |
-
|
| 154 |
-
def get_disease_relevant_biomarkers(self, disease: str) ->
|
| 155 |
"""
|
| 156 |
Get list of biomarkers most relevant to a specific disease.
|
| 157 |
|
|
@@ -159,19 +159,19 @@ class BiomarkerValidator:
|
|
| 159 |
"""
|
| 160 |
disease_map = {
|
| 161 |
"Diabetes": [
|
| 162 |
-
"Glucose", "HbA1c", "Insulin", "BMI",
|
| 163 |
"Triglycerides", "HDL Cholesterol", "LDL Cholesterol"
|
| 164 |
],
|
| 165 |
"Type 2 Diabetes": [
|
| 166 |
-
"Glucose", "HbA1c", "Insulin", "BMI",
|
| 167 |
"Triglycerides", "HDL Cholesterol", "LDL Cholesterol"
|
| 168 |
],
|
| 169 |
"Type 1 Diabetes": [
|
| 170 |
-
"Glucose", "HbA1c", "Insulin", "BMI",
|
| 171 |
"Triglycerides", "HDL Cholesterol", "LDL Cholesterol"
|
| 172 |
],
|
| 173 |
"Anemia": [
|
| 174 |
-
"Hemoglobin", "Red Blood Cells", "Hematocrit",
|
| 175 |
"Mean Corpuscular Volume", "Mean Corpuscular Hemoglobin",
|
| 176 |
"Mean Corpuscular Hemoglobin Concentration"
|
| 177 |
],
|
|
@@ -189,5 +189,5 @@ class BiomarkerValidator:
|
|
| 189 |
"Heart Rate", "BMI"
|
| 190 |
]
|
| 191 |
}
|
| 192 |
-
|
| 193 |
return disease_map.get(disease, [])
|
|
|
|
| 5 |
|
| 6 |
import json
|
| 7 |
from pathlib import Path
|
| 8 |
+
|
| 9 |
from src.state import BiomarkerFlag, SafetyAlert
|
| 10 |
|
| 11 |
|
| 12 |
class BiomarkerValidator:
|
| 13 |
"""Validates biomarker values against reference ranges"""
|
| 14 |
+
|
| 15 |
def __init__(self, reference_file: str = "config/biomarker_references.json"):
|
| 16 |
"""Load biomarker reference ranges from JSON file"""
|
| 17 |
ref_path = Path(__file__).parent.parent / reference_file
|
| 18 |
+
with open(ref_path) as f:
|
| 19 |
self.references = json.load(f)['biomarkers']
|
| 20 |
+
|
| 21 |
def validate_biomarker(
|
| 22 |
+
self,
|
| 23 |
+
name: str,
|
| 24 |
+
value: float,
|
| 25 |
+
gender: str | None = None,
|
| 26 |
threshold_pct: float = 0.0
|
| 27 |
) -> BiomarkerFlag:
|
| 28 |
"""
|
|
|
|
| 46 |
reference_range="No reference data available",
|
| 47 |
warning=f"No reference range found for {name}"
|
| 48 |
)
|
| 49 |
+
|
| 50 |
ref = self.references[name]
|
| 51 |
unit = ref['unit']
|
| 52 |
+
|
| 53 |
# Handle gender-specific ranges
|
| 54 |
if ref.get('gender_specific', False) and gender:
|
| 55 |
if gender.lower() in ['male', 'm']:
|
|
|
|
| 60 |
normal = ref['normal_range']
|
| 61 |
else:
|
| 62 |
normal = ref['normal_range']
|
| 63 |
+
|
| 64 |
min_val = normal.get('min', 0)
|
| 65 |
max_val = normal.get('max', float('inf'))
|
| 66 |
critical_low = ref.get('critical_low')
|
| 67 |
critical_high = ref.get('critical_high')
|
| 68 |
+
|
| 69 |
# Determine status
|
| 70 |
status = "NORMAL"
|
| 71 |
warning = None
|
| 72 |
+
|
| 73 |
# Check critical values first (threshold_pct does not suppress critical alerts)
|
| 74 |
if critical_low and value < critical_low:
|
| 75 |
status = "CRITICAL_LOW"
|
|
|
|
| 88 |
if deviation > threshold_pct:
|
| 89 |
status = "HIGH"
|
| 90 |
warning = f"{name} is {value} {unit}, above normal range ({min_val}-{max_val} {unit}). {ref['clinical_significance'].get('high', '')}"
|
| 91 |
+
|
| 92 |
reference_range = f"{min_val}-{max_val} {unit}"
|
| 93 |
+
|
| 94 |
return BiomarkerFlag(
|
| 95 |
name=name,
|
| 96 |
value=value,
|
|
|
|
| 99 |
reference_range=reference_range,
|
| 100 |
warning=warning
|
| 101 |
)
|
| 102 |
+
|
| 103 |
def validate_all(
|
| 104 |
self,
|
| 105 |
+
biomarkers: dict[str, float],
|
| 106 |
+
gender: str | None = None,
|
| 107 |
threshold_pct: float = 0.0
|
| 108 |
+
) -> tuple[list[BiomarkerFlag], list[SafetyAlert]]:
|
| 109 |
"""
|
| 110 |
Validate all biomarker values.
|
| 111 |
|
|
|
|
| 119 |
"""
|
| 120 |
flags = []
|
| 121 |
alerts = []
|
| 122 |
+
|
| 123 |
for name, value in biomarkers.items():
|
| 124 |
flag = self.validate_biomarker(name, value, gender, threshold_pct)
|
| 125 |
flags.append(flag)
|
| 126 |
+
|
| 127 |
# Generate safety alerts for critical values
|
| 128 |
if flag.status in ["CRITICAL_LOW", "CRITICAL_HIGH"]:
|
| 129 |
alerts.append(SafetyAlert(
|
|
|
|
| 140 |
message=flag.warning or f"{name} out of normal range",
|
| 141 |
action="Consult with healthcare provider"
|
| 142 |
))
|
| 143 |
+
|
| 144 |
return flags, alerts
|
| 145 |
+
|
| 146 |
+
def get_biomarker_info(self, name: str) -> dict | None:
|
| 147 |
"""Get reference information for a biomarker"""
|
| 148 |
return self.references.get(name)
|
| 149 |
|
| 150 |
def expected_biomarker_count(self) -> int:
|
| 151 |
"""Return expected number of biomarkers from reference ranges."""
|
| 152 |
return len(self.references)
|
| 153 |
+
|
| 154 |
+
def get_disease_relevant_biomarkers(self, disease: str) -> list[str]:
|
| 155 |
"""
|
| 156 |
Get list of biomarkers most relevant to a specific disease.
|
| 157 |
|
|
|
|
| 159 |
"""
|
| 160 |
disease_map = {
|
| 161 |
"Diabetes": [
|
| 162 |
+
"Glucose", "HbA1c", "Insulin", "BMI",
|
| 163 |
"Triglycerides", "HDL Cholesterol", "LDL Cholesterol"
|
| 164 |
],
|
| 165 |
"Type 2 Diabetes": [
|
| 166 |
+
"Glucose", "HbA1c", "Insulin", "BMI",
|
| 167 |
"Triglycerides", "HDL Cholesterol", "LDL Cholesterol"
|
| 168 |
],
|
| 169 |
"Type 1 Diabetes": [
|
| 170 |
+
"Glucose", "HbA1c", "Insulin", "BMI",
|
| 171 |
"Triglycerides", "HDL Cholesterol", "LDL Cholesterol"
|
| 172 |
],
|
| 173 |
"Anemia": [
|
| 174 |
+
"Hemoglobin", "Red Blood Cells", "Hematocrit",
|
| 175 |
"Mean Corpuscular Volume", "Mean Corpuscular Hemoglobin",
|
| 176 |
"Mean Corpuscular Hemoglobin Concentration"
|
| 177 |
],
|
|
|
|
| 189 |
"Heart Rate", "BMI"
|
| 190 |
]
|
| 191 |
}
|
| 192 |
+
|
| 193 |
return disease_map.get(disease, [])
|
src/config.py
CHANGED
|
@@ -3,8 +3,9 @@ MediGuard AI RAG-Helper
|
|
| 3 |
Core configuration and SOP (Standard Operating Procedures) definitions
|
| 4 |
"""
|
| 5 |
|
|
|
|
|
|
|
| 6 |
from pydantic import BaseModel, Field
|
| 7 |
-
from typing import Literal, Dict, Any, List, Optional
|
| 8 |
|
| 9 |
|
| 10 |
class ExplanationSOP(BaseModel):
|
|
@@ -13,28 +14,28 @@ class ExplanationSOP(BaseModel):
|
|
| 13 |
This is the 'genome' that controls the entire RAG pipeline behavior.
|
| 14 |
The Outer Loop (Director) will evolve these parameters to improve performance.
|
| 15 |
"""
|
| 16 |
-
|
| 17 |
# === Agent Behavior Parameters ===
|
| 18 |
biomarker_analyzer_threshold: float = Field(
|
| 19 |
default=0.15,
|
| 20 |
description="Percentage deviation from normal range to trigger a warning flag (0.15 = 15%)"
|
| 21 |
)
|
| 22 |
-
|
| 23 |
disease_explainer_k: int = Field(
|
| 24 |
default=5,
|
| 25 |
description="Number of top PDF chunks to retrieve for disease explanation"
|
| 26 |
)
|
| 27 |
-
|
| 28 |
linker_retrieval_k: int = Field(
|
| 29 |
default=3,
|
| 30 |
description="Number of chunks for biomarker-disease linking"
|
| 31 |
)
|
| 32 |
-
|
| 33 |
guideline_retrieval_k: int = Field(
|
| 34 |
default=3,
|
| 35 |
description="Number of chunks for clinical guidelines"
|
| 36 |
)
|
| 37 |
-
|
| 38 |
# === Prompts (Evolvable) ===
|
| 39 |
planner_prompt: str = Field(
|
| 40 |
default="""You are a medical AI coordinator. Create a structured execution plan for analyzing patient biomarkers and explaining a disease prediction.
|
|
@@ -49,7 +50,7 @@ Available specialist agents:
|
|
| 49 |
Output a JSON with key 'plan' containing a list of tasks. Each task must have 'agent', 'task_description', and 'dependencies' keys.""",
|
| 50 |
description="System prompt for the Planner Agent"
|
| 51 |
)
|
| 52 |
-
|
| 53 |
synthesizer_prompt: str = Field(
|
| 54 |
default="""You are a medical communication specialist. Your task is to synthesize findings from specialist agents into a clear, patient-friendly clinical explanation.
|
| 55 |
|
|
@@ -64,39 +65,39 @@ Output a JSON with key 'plan' containing a list of tasks. Each task must have 'a
|
|
| 64 |
Structure your output as specified in the output schema.""",
|
| 65 |
description="System prompt for the Response Synthesizer"
|
| 66 |
)
|
| 67 |
-
|
| 68 |
explainer_detail_level: Literal["concise", "detailed", "comprehensive"] = Field(
|
| 69 |
default="detailed",
|
| 70 |
description="Level of detail in disease mechanism explanations"
|
| 71 |
)
|
| 72 |
-
|
| 73 |
# === Feature Flags ===
|
| 74 |
use_guideline_agent: bool = Field(
|
| 75 |
default=True,
|
| 76 |
description="Whether to retrieve clinical guidelines and recommendations"
|
| 77 |
)
|
| 78 |
-
|
| 79 |
include_alternative_diagnoses: bool = Field(
|
| 80 |
default=True,
|
| 81 |
description="Whether to discuss alternative diagnoses from prediction probabilities"
|
| 82 |
)
|
| 83 |
-
|
| 84 |
require_pdf_citations: bool = Field(
|
| 85 |
default=True,
|
| 86 |
description="Whether to require PDF citations for all claims"
|
| 87 |
)
|
| 88 |
-
|
| 89 |
use_confidence_assessor: bool = Field(
|
| 90 |
default=True,
|
| 91 |
description="Whether to evaluate and report prediction confidence"
|
| 92 |
)
|
| 93 |
-
|
| 94 |
# === Safety Settings ===
|
| 95 |
critical_value_alert_mode: Literal["strict", "moderate", "permissive"] = Field(
|
| 96 |
default="strict",
|
| 97 |
description="Threshold for critical value alerts"
|
| 98 |
)
|
| 99 |
-
|
| 100 |
# === Model Selection ===
|
| 101 |
synthesizer_model: str = Field(
|
| 102 |
default="default",
|
|
|
|
| 3 |
Core configuration and SOP (Standard Operating Procedures) definitions
|
| 4 |
"""
|
| 5 |
|
| 6 |
+
from typing import Literal
|
| 7 |
+
|
| 8 |
from pydantic import BaseModel, Field
|
|
|
|
| 9 |
|
| 10 |
|
| 11 |
class ExplanationSOP(BaseModel):
|
|
|
|
| 14 |
This is the 'genome' that controls the entire RAG pipeline behavior.
|
| 15 |
The Outer Loop (Director) will evolve these parameters to improve performance.
|
| 16 |
"""
|
| 17 |
+
|
| 18 |
# === Agent Behavior Parameters ===
|
| 19 |
biomarker_analyzer_threshold: float = Field(
|
| 20 |
default=0.15,
|
| 21 |
description="Percentage deviation from normal range to trigger a warning flag (0.15 = 15%)"
|
| 22 |
)
|
| 23 |
+
|
| 24 |
disease_explainer_k: int = Field(
|
| 25 |
default=5,
|
| 26 |
description="Number of top PDF chunks to retrieve for disease explanation"
|
| 27 |
)
|
| 28 |
+
|
| 29 |
linker_retrieval_k: int = Field(
|
| 30 |
default=3,
|
| 31 |
description="Number of chunks for biomarker-disease linking"
|
| 32 |
)
|
| 33 |
+
|
| 34 |
guideline_retrieval_k: int = Field(
|
| 35 |
default=3,
|
| 36 |
description="Number of chunks for clinical guidelines"
|
| 37 |
)
|
| 38 |
+
|
| 39 |
# === Prompts (Evolvable) ===
|
| 40 |
planner_prompt: str = Field(
|
| 41 |
default="""You are a medical AI coordinator. Create a structured execution plan for analyzing patient biomarkers and explaining a disease prediction.
|
|
|
|
| 50 |
Output a JSON with key 'plan' containing a list of tasks. Each task must have 'agent', 'task_description', and 'dependencies' keys.""",
|
| 51 |
description="System prompt for the Planner Agent"
|
| 52 |
)
|
| 53 |
+
|
| 54 |
synthesizer_prompt: str = Field(
|
| 55 |
default="""You are a medical communication specialist. Your task is to synthesize findings from specialist agents into a clear, patient-friendly clinical explanation.
|
| 56 |
|
|
|
|
| 65 |
Structure your output as specified in the output schema.""",
|
| 66 |
description="System prompt for the Response Synthesizer"
|
| 67 |
)
|
| 68 |
+
|
| 69 |
explainer_detail_level: Literal["concise", "detailed", "comprehensive"] = Field(
|
| 70 |
default="detailed",
|
| 71 |
description="Level of detail in disease mechanism explanations"
|
| 72 |
)
|
| 73 |
+
|
| 74 |
# === Feature Flags ===
|
| 75 |
use_guideline_agent: bool = Field(
|
| 76 |
default=True,
|
| 77 |
description="Whether to retrieve clinical guidelines and recommendations"
|
| 78 |
)
|
| 79 |
+
|
| 80 |
include_alternative_diagnoses: bool = Field(
|
| 81 |
default=True,
|
| 82 |
description="Whether to discuss alternative diagnoses from prediction probabilities"
|
| 83 |
)
|
| 84 |
+
|
| 85 |
require_pdf_citations: bool = Field(
|
| 86 |
default=True,
|
| 87 |
description="Whether to require PDF citations for all claims"
|
| 88 |
)
|
| 89 |
+
|
| 90 |
use_confidence_assessor: bool = Field(
|
| 91 |
default=True,
|
| 92 |
description="Whether to evaluate and report prediction confidence"
|
| 93 |
)
|
| 94 |
+
|
| 95 |
# === Safety Settings ===
|
| 96 |
critical_value_alert_mode: Literal["strict", "moderate", "permissive"] = Field(
|
| 97 |
default="strict",
|
| 98 |
description="Threshold for critical value alerts"
|
| 99 |
)
|
| 100 |
+
|
| 101 |
# === Model Selection ===
|
| 102 |
synthesizer_model: str = Field(
|
| 103 |
default="default",
|
src/database.py
CHANGED
|
@@ -6,11 +6,11 @@ Provides SQLAlchemy engine/session factories and the declarative Base.
|
|
| 6 |
|
| 7 |
from __future__ import annotations
|
| 8 |
|
|
|
|
| 9 |
from functools import lru_cache
|
| 10 |
-
from typing import Generator
|
| 11 |
|
| 12 |
from sqlalchemy import create_engine
|
| 13 |
-
from sqlalchemy.orm import
|
| 14 |
|
| 15 |
from src.settings import get_settings
|
| 16 |
|
|
|
|
| 6 |
|
| 7 |
from __future__ import annotations
|
| 8 |
|
| 9 |
+
from collections.abc import Generator
|
| 10 |
from functools import lru_cache
|
|
|
|
| 11 |
|
| 12 |
from sqlalchemy import create_engine
|
| 13 |
+
from sqlalchemy.orm import DeclarativeBase, Session, sessionmaker
|
| 14 |
|
| 15 |
from src.settings import get_settings
|
| 16 |
|
src/dependencies.py
CHANGED
|
@@ -6,9 +6,6 @@ Provides factory functions and ``Depends()`` for services used across routers.
|
|
| 6 |
|
| 7 |
from __future__ import annotations
|
| 8 |
|
| 9 |
-
from functools import lru_cache
|
| 10 |
-
|
| 11 |
-
from src.settings import Settings, get_settings
|
| 12 |
from src.services.cache.redis_cache import RedisCache, make_redis_cache
|
| 13 |
from src.services.embeddings.service import EmbeddingService, make_embedding_service
|
| 14 |
from src.services.langfuse.tracer import LangfuseTracer, make_langfuse_tracer
|
|
|
|
| 6 |
|
| 7 |
from __future__ import annotations
|
| 8 |
|
|
|
|
|
|
|
|
|
|
| 9 |
from src.services.cache.redis_cache import RedisCache, make_redis_cache
|
| 10 |
from src.services.embeddings.service import EmbeddingService, make_embedding_service
|
| 11 |
from src.services.langfuse.tracer import LangfuseTracer, make_langfuse_tracer
|
src/evaluation/__init__.py
CHANGED
|
@@ -4,23 +4,23 @@ Exports 5D quality assessment framework components
|
|
| 4 |
"""
|
| 5 |
|
| 6 |
from .evaluators import (
|
| 7 |
-
GradedScore,
|
| 8 |
EvaluationResult,
|
| 9 |
-
|
| 10 |
-
evaluate_evidence_grounding,
|
| 11 |
evaluate_actionability,
|
| 12 |
evaluate_clarity,
|
|
|
|
|
|
|
| 13 |
evaluate_safety_completeness,
|
| 14 |
-
run_full_evaluation
|
| 15 |
)
|
| 16 |
|
| 17 |
__all__ = [
|
| 18 |
-
'GradedScore',
|
| 19 |
'EvaluationResult',
|
| 20 |
-
'
|
| 21 |
-
'evaluate_evidence_grounding',
|
| 22 |
'evaluate_actionability',
|
| 23 |
'evaluate_clarity',
|
|
|
|
|
|
|
| 24 |
'evaluate_safety_completeness',
|
| 25 |
'run_full_evaluation'
|
| 26 |
]
|
|
|
|
| 4 |
"""
|
| 5 |
|
| 6 |
from .evaluators import (
|
|
|
|
| 7 |
EvaluationResult,
|
| 8 |
+
GradedScore,
|
|
|
|
| 9 |
evaluate_actionability,
|
| 10 |
evaluate_clarity,
|
| 11 |
+
evaluate_clinical_accuracy,
|
| 12 |
+
evaluate_evidence_grounding,
|
| 13 |
evaluate_safety_completeness,
|
| 14 |
+
run_full_evaluation,
|
| 15 |
)
|
| 16 |
|
| 17 |
__all__ = [
|
|
|
|
| 18 |
'EvaluationResult',
|
| 19 |
+
'GradedScore',
|
|
|
|
| 20 |
'evaluate_actionability',
|
| 21 |
'evaluate_clarity',
|
| 22 |
+
'evaluate_clinical_accuracy',
|
| 23 |
+
'evaluate_evidence_grounding',
|
| 24 |
'evaluate_safety_completeness',
|
| 25 |
'run_full_evaluation'
|
| 26 |
]
|
src/evaluation/evaluators.py
CHANGED
|
@@ -22,11 +22,13 @@ Usage:
|
|
| 22 |
print(f"Average score: {result.average_score():.2f}")
|
| 23 |
"""
|
| 24 |
|
| 25 |
-
import os
|
| 26 |
-
from pydantic import BaseModel, Field
|
| 27 |
-
from typing import Dict, Any, List
|
| 28 |
import json
|
|
|
|
|
|
|
|
|
|
| 29 |
from langchain_core.prompts import ChatPromptTemplate
|
|
|
|
|
|
|
| 30 |
from src.llm_config import get_chat_model
|
| 31 |
|
| 32 |
# Set to True for deterministic evaluation (testing)
|
|
@@ -46,8 +48,8 @@ class EvaluationResult(BaseModel):
|
|
| 46 |
actionability: GradedScore
|
| 47 |
clarity: GradedScore
|
| 48 |
safety_completeness: GradedScore
|
| 49 |
-
|
| 50 |
-
def to_vector(self) ->
|
| 51 |
"""Extract scores as a vector for Pareto analysis"""
|
| 52 |
return [
|
| 53 |
self.clinical_accuracy.score,
|
|
@@ -56,7 +58,7 @@ class EvaluationResult(BaseModel):
|
|
| 56 |
self.clarity.score,
|
| 57 |
self.safety_completeness.score
|
| 58 |
]
|
| 59 |
-
|
| 60 |
def average_score(self) -> float:
|
| 61 |
"""Calculate average of all 5 dimensions"""
|
| 62 |
scores = self.to_vector()
|
|
@@ -65,7 +67,7 @@ class EvaluationResult(BaseModel):
|
|
| 65 |
|
| 66 |
# Evaluator 1: Clinical Accuracy (LLM-as-Judge)
|
| 67 |
def evaluate_clinical_accuracy(
|
| 68 |
-
final_response:
|
| 69 |
pubmed_context: str
|
| 70 |
) -> GradedScore:
|
| 71 |
"""
|
|
@@ -77,13 +79,13 @@ def evaluate_clinical_accuracy(
|
|
| 77 |
# Deterministic mode for testing
|
| 78 |
if DETERMINISTIC_MODE:
|
| 79 |
return _deterministic_clinical_accuracy(final_response, pubmed_context)
|
| 80 |
-
|
| 81 |
# Use cloud LLM for evaluation (FREE via Groq/Gemini)
|
| 82 |
evaluator_llm = get_chat_model(
|
| 83 |
temperature=0.0,
|
| 84 |
json_mode=True
|
| 85 |
)
|
| 86 |
-
|
| 87 |
prompt = ChatPromptTemplate.from_messages([
|
| 88 |
("system", """You are a medical expert evaluating clinical accuracy.
|
| 89 |
|
|
@@ -113,7 +115,7 @@ Respond ONLY with valid JSON in this format:
|
|
| 113 |
{context}
|
| 114 |
""")
|
| 115 |
])
|
| 116 |
-
|
| 117 |
chain = prompt | evaluator_llm
|
| 118 |
result = chain.invoke({
|
| 119 |
"patient_summary": final_response['patient_summary'],
|
|
@@ -121,7 +123,7 @@ Respond ONLY with valid JSON in this format:
|
|
| 121 |
"recommendations": final_response['clinical_recommendations'],
|
| 122 |
"context": pubmed_context
|
| 123 |
})
|
| 124 |
-
|
| 125 |
# Parse JSON response
|
| 126 |
try:
|
| 127 |
content = result.content if isinstance(result.content, str) else str(result.content)
|
|
@@ -134,7 +136,7 @@ Respond ONLY with valid JSON in this format:
|
|
| 134 |
|
| 135 |
# Evaluator 2: Evidence Grounding (Programmatic + LLM)
|
| 136 |
def evaluate_evidence_grounding(
|
| 137 |
-
final_response:
|
| 138 |
) -> GradedScore:
|
| 139 |
"""
|
| 140 |
Checks if all claims are backed by citations.
|
|
@@ -143,32 +145,32 @@ def evaluate_evidence_grounding(
|
|
| 143 |
# Count citations
|
| 144 |
pdf_refs = final_response['prediction_explanation'].get('pdf_references', [])
|
| 145 |
citation_count = len(pdf_refs)
|
| 146 |
-
|
| 147 |
# Check key drivers have evidence
|
| 148 |
key_drivers = final_response['prediction_explanation'].get('key_drivers', [])
|
| 149 |
drivers_with_evidence = sum(1 for d in key_drivers if d.get('evidence'))
|
| 150 |
-
|
| 151 |
# Citation coverage score
|
| 152 |
if len(key_drivers) > 0:
|
| 153 |
coverage = drivers_with_evidence / len(key_drivers)
|
| 154 |
else:
|
| 155 |
coverage = 0.0
|
| 156 |
-
|
| 157 |
# Base score from programmatic checks
|
| 158 |
base_score = min(1.0, citation_count / 5.0) * 0.5 + coverage * 0.5
|
| 159 |
-
|
| 160 |
reasoning = f"""
|
| 161 |
Citations found: {citation_count}
|
| 162 |
Key drivers with evidence: {drivers_with_evidence}/{len(key_drivers)}
|
| 163 |
Citation coverage: {coverage:.1%}
|
| 164 |
"""
|
| 165 |
-
|
| 166 |
return GradedScore(score=base_score, reasoning=reasoning.strip())
|
| 167 |
|
| 168 |
|
| 169 |
# Evaluator 3: Clinical Actionability (LLM-as-Judge)
|
| 170 |
def evaluate_actionability(
|
| 171 |
-
final_response:
|
| 172 |
) -> GradedScore:
|
| 173 |
"""
|
| 174 |
Evaluates if recommendations are actionable and safe.
|
|
@@ -179,13 +181,13 @@ def evaluate_actionability(
|
|
| 179 |
# Deterministic mode for testing
|
| 180 |
if DETERMINISTIC_MODE:
|
| 181 |
return _deterministic_actionability(final_response)
|
| 182 |
-
|
| 183 |
# Use cloud LLM for evaluation (FREE via Groq/Gemini)
|
| 184 |
evaluator_llm = get_chat_model(
|
| 185 |
temperature=0.0,
|
| 186 |
json_mode=True
|
| 187 |
)
|
| 188 |
-
|
| 189 |
prompt = ChatPromptTemplate.from_messages([
|
| 190 |
("system", """You are a clinical care coordinator evaluating actionability.
|
| 191 |
|
|
@@ -216,7 +218,7 @@ Respond ONLY with valid JSON in this format:
|
|
| 216 |
{confidence}
|
| 217 |
""")
|
| 218 |
])
|
| 219 |
-
|
| 220 |
chain = prompt | evaluator_llm
|
| 221 |
recs = final_response['clinical_recommendations']
|
| 222 |
result = chain.invoke({
|
|
@@ -225,7 +227,7 @@ Respond ONLY with valid JSON in this format:
|
|
| 225 |
"monitoring": recs.get('monitoring', []),
|
| 226 |
"confidence": final_response['confidence_assessment']
|
| 227 |
})
|
| 228 |
-
|
| 229 |
# Parse JSON response
|
| 230 |
try:
|
| 231 |
parsed = json.loads(result.content if isinstance(result.content, str) else str(result.content))
|
|
@@ -237,7 +239,7 @@ Respond ONLY with valid JSON in this format:
|
|
| 237 |
|
| 238 |
# Evaluator 4: Explainability Clarity (Programmatic)
|
| 239 |
def evaluate_clarity(
|
| 240 |
-
final_response:
|
| 241 |
) -> GradedScore:
|
| 242 |
"""
|
| 243 |
Measures readability and patient-friendliness.
|
|
@@ -248,16 +250,16 @@ def evaluate_clarity(
|
|
| 248 |
# Deterministic mode for testing
|
| 249 |
if DETERMINISTIC_MODE:
|
| 250 |
return _deterministic_clarity(final_response)
|
| 251 |
-
|
| 252 |
try:
|
| 253 |
import textstat
|
| 254 |
has_textstat = True
|
| 255 |
except ImportError:
|
| 256 |
has_textstat = False
|
| 257 |
-
|
| 258 |
# Get patient narrative
|
| 259 |
narrative = final_response['patient_summary'].get('narrative', '')
|
| 260 |
-
|
| 261 |
if has_textstat:
|
| 262 |
# Calculate readability (Flesch Reading Ease)
|
| 263 |
# Score 60-70 = Standard (8th-9th grade)
|
|
@@ -275,24 +277,24 @@ def evaluate_clarity(
|
|
| 275 |
readability_score = 0.9
|
| 276 |
else:
|
| 277 |
readability_score = max(0.5, 1.0 - (avg_words - 20) * 0.02)
|
| 278 |
-
|
| 279 |
# Medical jargon detection (simple heuristic)
|
| 280 |
medical_terms = [
|
| 281 |
'pathophysiology', 'etiology', 'hemostasis', 'coagulation',
|
| 282 |
'thrombocytopenia', 'erythropoiesis', 'gluconeogenesis'
|
| 283 |
]
|
| 284 |
jargon_count = sum(1 for term in medical_terms if term.lower() in narrative.lower())
|
| 285 |
-
|
| 286 |
# Length check (too short = vague, too long = overwhelming)
|
| 287 |
word_count = len(narrative.split())
|
| 288 |
optimal_length = 50 <= word_count <= 150
|
| 289 |
-
|
| 290 |
# Scoring
|
| 291 |
jargon_penalty = max(0.0, 1.0 - (jargon_count * 0.2))
|
| 292 |
length_score = 1.0 if optimal_length else 0.7
|
| 293 |
-
|
| 294 |
final_score = (readability_score * 0.5 + jargon_penalty * 0.3 + length_score * 0.2)
|
| 295 |
-
|
| 296 |
if has_textstat:
|
| 297 |
reasoning = f"""
|
| 298 |
Flesch Reading Ease: {flesch_score:.1f} (Target: 60-70)
|
|
@@ -307,63 +309,63 @@ def evaluate_clarity(
|
|
| 307 |
Word count: {word_count} (Optimal: 50-150)
|
| 308 |
Note: textstat not available, using fallback metrics
|
| 309 |
"""
|
| 310 |
-
|
| 311 |
return GradedScore(score=final_score, reasoning=reasoning.strip())
|
| 312 |
|
| 313 |
|
| 314 |
# Evaluator 5: Safety & Completeness (Programmatic)
|
| 315 |
def evaluate_safety_completeness(
|
| 316 |
-
final_response:
|
| 317 |
-
biomarkers:
|
| 318 |
) -> GradedScore:
|
| 319 |
"""
|
| 320 |
Checks if all safety concerns are flagged.
|
| 321 |
Programmatic validation.
|
| 322 |
"""
|
| 323 |
from src.biomarker_validator import BiomarkerValidator
|
| 324 |
-
|
| 325 |
# Initialize validator
|
| 326 |
validator = BiomarkerValidator()
|
| 327 |
-
|
| 328 |
# Count out-of-range biomarkers
|
| 329 |
out_of_range_count = 0
|
| 330 |
critical_count = 0
|
| 331 |
-
|
| 332 |
for name, value in biomarkers.items():
|
| 333 |
result = validator.validate_biomarker(name, value) # Fixed: use validate_biomarker instead of validate_single
|
| 334 |
if result.status in ['HIGH', 'LOW', 'CRITICAL_HIGH', 'CRITICAL_LOW']:
|
| 335 |
out_of_range_count += 1
|
| 336 |
if result.status in ['CRITICAL_HIGH', 'CRITICAL_LOW']:
|
| 337 |
critical_count += 1
|
| 338 |
-
|
| 339 |
# Count safety alerts in output
|
| 340 |
safety_alerts = final_response.get('safety_alerts', [])
|
| 341 |
alert_count = len(safety_alerts)
|
| 342 |
critical_alerts = sum(1 for a in safety_alerts if a.get('severity') == 'CRITICAL')
|
| 343 |
-
|
| 344 |
# Check if all critical values have alerts
|
| 345 |
critical_coverage = critical_alerts / critical_count if critical_count > 0 else 1.0
|
| 346 |
-
|
| 347 |
# Check for disclaimer
|
| 348 |
has_disclaimer = 'disclaimer' in final_response.get('metadata', {})
|
| 349 |
-
|
| 350 |
# Check for uncertainty acknowledgment
|
| 351 |
limitations = final_response['confidence_assessment'].get('limitations', [])
|
| 352 |
acknowledges_uncertainty = len(limitations) > 0
|
| 353 |
-
|
| 354 |
# Scoring
|
| 355 |
alert_score = min(1.0, alert_count / max(1, out_of_range_count))
|
| 356 |
critical_score = min(1.0, critical_coverage)
|
| 357 |
disclaimer_score = 1.0 if has_disclaimer else 0.0
|
| 358 |
uncertainty_score = 1.0 if acknowledges_uncertainty else 0.5
|
| 359 |
-
|
| 360 |
final_score = min(1.0, (
|
| 361 |
alert_score * 0.4 +
|
| 362 |
critical_score * 0.3 +
|
| 363 |
disclaimer_score * 0.2 +
|
| 364 |
uncertainty_score * 0.1
|
| 365 |
))
|
| 366 |
-
|
| 367 |
reasoning = f"""
|
| 368 |
Out-of-range biomarkers: {out_of_range_count}
|
| 369 |
Critical values: {critical_count}
|
|
@@ -373,15 +375,15 @@ def evaluate_safety_completeness(
|
|
| 373 |
Has disclaimer: {has_disclaimer}
|
| 374 |
Acknowledges uncertainty: {acknowledges_uncertainty}
|
| 375 |
"""
|
| 376 |
-
|
| 377 |
return GradedScore(score=final_score, reasoning=reasoning.strip())
|
| 378 |
|
| 379 |
|
| 380 |
# Master Evaluation Function
|
| 381 |
def run_full_evaluation(
|
| 382 |
-
final_response:
|
| 383 |
-
agent_outputs:
|
| 384 |
-
biomarkers:
|
| 385 |
) -> EvaluationResult:
|
| 386 |
"""
|
| 387 |
Orchestrates all 5 evaluators and returns complete assessment.
|
|
@@ -389,7 +391,7 @@ def run_full_evaluation(
|
|
| 389 |
print("=" * 70)
|
| 390 |
print("RUNNING 5D EVALUATION GAUNTLET")
|
| 391 |
print("=" * 70)
|
| 392 |
-
|
| 393 |
# Extract context from agent outputs
|
| 394 |
pubmed_context = ""
|
| 395 |
for output in agent_outputs:
|
|
@@ -402,27 +404,27 @@ def run_full_evaluation(
|
|
| 402 |
else:
|
| 403 |
pubmed_context = str(findings)
|
| 404 |
break
|
| 405 |
-
|
| 406 |
# Run all evaluators
|
| 407 |
print("\n1. Evaluating Clinical Accuracy...")
|
| 408 |
clinical_accuracy = evaluate_clinical_accuracy(final_response, pubmed_context)
|
| 409 |
-
|
| 410 |
print("2. Evaluating Evidence Grounding...")
|
| 411 |
evidence_grounding = evaluate_evidence_grounding(final_response)
|
| 412 |
-
|
| 413 |
print("3. Evaluating Clinical Actionability...")
|
| 414 |
actionability = evaluate_actionability(final_response)
|
| 415 |
-
|
| 416 |
print("4. Evaluating Explainability Clarity...")
|
| 417 |
clarity = evaluate_clarity(final_response)
|
| 418 |
-
|
| 419 |
print("5. Evaluating Safety & Completeness...")
|
| 420 |
safety_completeness = evaluate_safety_completeness(final_response, biomarkers)
|
| 421 |
-
|
| 422 |
print("\n" + "=" * 70)
|
| 423 |
print("EVALUATION COMPLETE")
|
| 424 |
print("=" * 70)
|
| 425 |
-
|
| 426 |
return EvaluationResult(
|
| 427 |
clinical_accuracy=clinical_accuracy,
|
| 428 |
evidence_grounding=evidence_grounding,
|
|
@@ -437,26 +439,26 @@ def run_full_evaluation(
|
|
| 437 |
# ---------------------------------------------------------------------------
|
| 438 |
|
| 439 |
def _deterministic_clinical_accuracy(
|
| 440 |
-
final_response:
|
| 441 |
pubmed_context: str
|
| 442 |
) -> GradedScore:
|
| 443 |
"""Heuristic-based clinical accuracy (deterministic)."""
|
| 444 |
score = 0.5
|
| 445 |
reasons = []
|
| 446 |
-
|
| 447 |
# Check if response has expected structure
|
| 448 |
if final_response.get('patient_summary'):
|
| 449 |
score += 0.1
|
| 450 |
reasons.append("Has patient summary")
|
| 451 |
-
|
| 452 |
if final_response.get('prediction_explanation'):
|
| 453 |
score += 0.1
|
| 454 |
reasons.append("Has prediction explanation")
|
| 455 |
-
|
| 456 |
if final_response.get('clinical_recommendations'):
|
| 457 |
score += 0.1
|
| 458 |
reasons.append("Has clinical recommendations")
|
| 459 |
-
|
| 460 |
# Check for citations
|
| 461 |
pred = final_response.get('prediction_explanation', {})
|
| 462 |
if isinstance(pred, dict):
|
|
@@ -464,7 +466,7 @@ def _deterministic_clinical_accuracy(
|
|
| 464 |
if refs:
|
| 465 |
score += min(0.2, len(refs) * 0.05)
|
| 466 |
reasons.append(f"Has {len(refs)} citations")
|
| 467 |
-
|
| 468 |
return GradedScore(
|
| 469 |
score=min(1.0, score),
|
| 470 |
reasoning="[DETERMINISTIC] " + "; ".join(reasons)
|
|
@@ -472,12 +474,12 @@ def _deterministic_clinical_accuracy(
|
|
| 472 |
|
| 473 |
|
| 474 |
def _deterministic_actionability(
|
| 475 |
-
final_response:
|
| 476 |
) -> GradedScore:
|
| 477 |
"""Heuristic-based actionability (deterministic)."""
|
| 478 |
score = 0.5
|
| 479 |
reasons = []
|
| 480 |
-
|
| 481 |
recs = final_response.get('clinical_recommendations', {})
|
| 482 |
if isinstance(recs, dict):
|
| 483 |
if recs.get('immediate_actions'):
|
|
@@ -489,7 +491,7 @@ def _deterministic_actionability(
|
|
| 489 |
if recs.get('monitoring'):
|
| 490 |
score += 0.1
|
| 491 |
reasons.append("Has monitoring recommendations")
|
| 492 |
-
|
| 493 |
return GradedScore(
|
| 494 |
score=min(1.0, score),
|
| 495 |
reasoning="[DETERMINISTIC] " + "; ".join(reasons) if reasons else "[DETERMINISTIC] Missing recommendations"
|
|
@@ -497,12 +499,12 @@ def _deterministic_actionability(
|
|
| 497 |
|
| 498 |
|
| 499 |
def _deterministic_clarity(
|
| 500 |
-
final_response:
|
| 501 |
) -> GradedScore:
|
| 502 |
"""Heuristic-based clarity (deterministic)."""
|
| 503 |
score = 0.5
|
| 504 |
reasons = []
|
| 505 |
-
|
| 506 |
summary = final_response.get('patient_summary', '')
|
| 507 |
if isinstance(summary, str):
|
| 508 |
word_count = len(summary.split())
|
|
@@ -512,16 +514,16 @@ def _deterministic_clarity(
|
|
| 512 |
elif word_count > 0:
|
| 513 |
score += 0.1
|
| 514 |
reasons.append("Has summary")
|
| 515 |
-
|
| 516 |
# Check for structured output
|
| 517 |
if final_response.get('biomarker_flags'):
|
| 518 |
score += 0.15
|
| 519 |
reasons.append("Has biomarker flags")
|
| 520 |
-
|
| 521 |
if final_response.get('key_findings'):
|
| 522 |
score += 0.15
|
| 523 |
reasons.append("Has key findings")
|
| 524 |
-
|
| 525 |
return GradedScore(
|
| 526 |
score=min(1.0, score),
|
| 527 |
reasoning="[DETERMINISTIC] " + "; ".join(reasons) if reasons else "[DETERMINISTIC] Limited structure"
|
|
|
|
| 22 |
print(f"Average score: {result.average_score():.2f}")
|
| 23 |
"""
|
| 24 |
|
|
|
|
|
|
|
|
|
|
| 25 |
import json
|
| 26 |
+
import os
|
| 27 |
+
from typing import Any
|
| 28 |
+
|
| 29 |
from langchain_core.prompts import ChatPromptTemplate
|
| 30 |
+
from pydantic import BaseModel, Field
|
| 31 |
+
|
| 32 |
from src.llm_config import get_chat_model
|
| 33 |
|
| 34 |
# Set to True for deterministic evaluation (testing)
|
|
|
|
| 48 |
actionability: GradedScore
|
| 49 |
clarity: GradedScore
|
| 50 |
safety_completeness: GradedScore
|
| 51 |
+
|
| 52 |
+
def to_vector(self) -> list[float]:
|
| 53 |
"""Extract scores as a vector for Pareto analysis"""
|
| 54 |
return [
|
| 55 |
self.clinical_accuracy.score,
|
|
|
|
| 58 |
self.clarity.score,
|
| 59 |
self.safety_completeness.score
|
| 60 |
]
|
| 61 |
+
|
| 62 |
def average_score(self) -> float:
|
| 63 |
"""Calculate average of all 5 dimensions"""
|
| 64 |
scores = self.to_vector()
|
|
|
|
| 67 |
|
| 68 |
# Evaluator 1: Clinical Accuracy (LLM-as-Judge)
|
| 69 |
def evaluate_clinical_accuracy(
|
| 70 |
+
final_response: dict[str, Any],
|
| 71 |
pubmed_context: str
|
| 72 |
) -> GradedScore:
|
| 73 |
"""
|
|
|
|
| 79 |
# Deterministic mode for testing
|
| 80 |
if DETERMINISTIC_MODE:
|
| 81 |
return _deterministic_clinical_accuracy(final_response, pubmed_context)
|
| 82 |
+
|
| 83 |
# Use cloud LLM for evaluation (FREE via Groq/Gemini)
|
| 84 |
evaluator_llm = get_chat_model(
|
| 85 |
temperature=0.0,
|
| 86 |
json_mode=True
|
| 87 |
)
|
| 88 |
+
|
| 89 |
prompt = ChatPromptTemplate.from_messages([
|
| 90 |
("system", """You are a medical expert evaluating clinical accuracy.
|
| 91 |
|
|
|
|
| 115 |
{context}
|
| 116 |
""")
|
| 117 |
])
|
| 118 |
+
|
| 119 |
chain = prompt | evaluator_llm
|
| 120 |
result = chain.invoke({
|
| 121 |
"patient_summary": final_response['patient_summary'],
|
|
|
|
| 123 |
"recommendations": final_response['clinical_recommendations'],
|
| 124 |
"context": pubmed_context
|
| 125 |
})
|
| 126 |
+
|
| 127 |
# Parse JSON response
|
| 128 |
try:
|
| 129 |
content = result.content if isinstance(result.content, str) else str(result.content)
|
|
|
|
| 136 |
|
| 137 |
# Evaluator 2: Evidence Grounding (Programmatic + LLM)
|
| 138 |
def evaluate_evidence_grounding(
|
| 139 |
+
final_response: dict[str, Any]
|
| 140 |
) -> GradedScore:
|
| 141 |
"""
|
| 142 |
Checks if all claims are backed by citations.
|
|
|
|
| 145 |
# Count citations
|
| 146 |
pdf_refs = final_response['prediction_explanation'].get('pdf_references', [])
|
| 147 |
citation_count = len(pdf_refs)
|
| 148 |
+
|
| 149 |
# Check key drivers have evidence
|
| 150 |
key_drivers = final_response['prediction_explanation'].get('key_drivers', [])
|
| 151 |
drivers_with_evidence = sum(1 for d in key_drivers if d.get('evidence'))
|
| 152 |
+
|
| 153 |
# Citation coverage score
|
| 154 |
if len(key_drivers) > 0:
|
| 155 |
coverage = drivers_with_evidence / len(key_drivers)
|
| 156 |
else:
|
| 157 |
coverage = 0.0
|
| 158 |
+
|
| 159 |
# Base score from programmatic checks
|
| 160 |
base_score = min(1.0, citation_count / 5.0) * 0.5 + coverage * 0.5
|
| 161 |
+
|
| 162 |
reasoning = f"""
|
| 163 |
Citations found: {citation_count}
|
| 164 |
Key drivers with evidence: {drivers_with_evidence}/{len(key_drivers)}
|
| 165 |
Citation coverage: {coverage:.1%}
|
| 166 |
"""
|
| 167 |
+
|
| 168 |
return GradedScore(score=base_score, reasoning=reasoning.strip())
|
| 169 |
|
| 170 |
|
| 171 |
# Evaluator 3: Clinical Actionability (LLM-as-Judge)
|
| 172 |
def evaluate_actionability(
|
| 173 |
+
final_response: dict[str, Any]
|
| 174 |
) -> GradedScore:
|
| 175 |
"""
|
| 176 |
Evaluates if recommendations are actionable and safe.
|
|
|
|
| 181 |
# Deterministic mode for testing
|
| 182 |
if DETERMINISTIC_MODE:
|
| 183 |
return _deterministic_actionability(final_response)
|
| 184 |
+
|
| 185 |
# Use cloud LLM for evaluation (FREE via Groq/Gemini)
|
| 186 |
evaluator_llm = get_chat_model(
|
| 187 |
temperature=0.0,
|
| 188 |
json_mode=True
|
| 189 |
)
|
| 190 |
+
|
| 191 |
prompt = ChatPromptTemplate.from_messages([
|
| 192 |
("system", """You are a clinical care coordinator evaluating actionability.
|
| 193 |
|
|
|
|
| 218 |
{confidence}
|
| 219 |
""")
|
| 220 |
])
|
| 221 |
+
|
| 222 |
chain = prompt | evaluator_llm
|
| 223 |
recs = final_response['clinical_recommendations']
|
| 224 |
result = chain.invoke({
|
|
|
|
| 227 |
"monitoring": recs.get('monitoring', []),
|
| 228 |
"confidence": final_response['confidence_assessment']
|
| 229 |
})
|
| 230 |
+
|
| 231 |
# Parse JSON response
|
| 232 |
try:
|
| 233 |
parsed = json.loads(result.content if isinstance(result.content, str) else str(result.content))
|
|
|
|
| 239 |
|
| 240 |
# Evaluator 4: Explainability Clarity (Programmatic)
|
| 241 |
def evaluate_clarity(
|
| 242 |
+
final_response: dict[str, Any]
|
| 243 |
) -> GradedScore:
|
| 244 |
"""
|
| 245 |
Measures readability and patient-friendliness.
|
|
|
|
| 250 |
# Deterministic mode for testing
|
| 251 |
if DETERMINISTIC_MODE:
|
| 252 |
return _deterministic_clarity(final_response)
|
| 253 |
+
|
| 254 |
try:
|
| 255 |
import textstat
|
| 256 |
has_textstat = True
|
| 257 |
except ImportError:
|
| 258 |
has_textstat = False
|
| 259 |
+
|
| 260 |
# Get patient narrative
|
| 261 |
narrative = final_response['patient_summary'].get('narrative', '')
|
| 262 |
+
|
| 263 |
if has_textstat:
|
| 264 |
# Calculate readability (Flesch Reading Ease)
|
| 265 |
# Score 60-70 = Standard (8th-9th grade)
|
|
|
|
| 277 |
readability_score = 0.9
|
| 278 |
else:
|
| 279 |
readability_score = max(0.5, 1.0 - (avg_words - 20) * 0.02)
|
| 280 |
+
|
| 281 |
# Medical jargon detection (simple heuristic)
|
| 282 |
medical_terms = [
|
| 283 |
'pathophysiology', 'etiology', 'hemostasis', 'coagulation',
|
| 284 |
'thrombocytopenia', 'erythropoiesis', 'gluconeogenesis'
|
| 285 |
]
|
| 286 |
jargon_count = sum(1 for term in medical_terms if term.lower() in narrative.lower())
|
| 287 |
+
|
| 288 |
# Length check (too short = vague, too long = overwhelming)
|
| 289 |
word_count = len(narrative.split())
|
| 290 |
optimal_length = 50 <= word_count <= 150
|
| 291 |
+
|
| 292 |
# Scoring
|
| 293 |
jargon_penalty = max(0.0, 1.0 - (jargon_count * 0.2))
|
| 294 |
length_score = 1.0 if optimal_length else 0.7
|
| 295 |
+
|
| 296 |
final_score = (readability_score * 0.5 + jargon_penalty * 0.3 + length_score * 0.2)
|
| 297 |
+
|
| 298 |
if has_textstat:
|
| 299 |
reasoning = f"""
|
| 300 |
Flesch Reading Ease: {flesch_score:.1f} (Target: 60-70)
|
|
|
|
| 309 |
Word count: {word_count} (Optimal: 50-150)
|
| 310 |
Note: textstat not available, using fallback metrics
|
| 311 |
"""
|
| 312 |
+
|
| 313 |
return GradedScore(score=final_score, reasoning=reasoning.strip())
|
| 314 |
|
| 315 |
|
| 316 |
# Evaluator 5: Safety & Completeness (Programmatic)
|
| 317 |
def evaluate_safety_completeness(
|
| 318 |
+
final_response: dict[str, Any],
|
| 319 |
+
biomarkers: dict[str, float]
|
| 320 |
) -> GradedScore:
|
| 321 |
"""
|
| 322 |
Checks if all safety concerns are flagged.
|
| 323 |
Programmatic validation.
|
| 324 |
"""
|
| 325 |
from src.biomarker_validator import BiomarkerValidator
|
| 326 |
+
|
| 327 |
# Initialize validator
|
| 328 |
validator = BiomarkerValidator()
|
| 329 |
+
|
| 330 |
# Count out-of-range biomarkers
|
| 331 |
out_of_range_count = 0
|
| 332 |
critical_count = 0
|
| 333 |
+
|
| 334 |
for name, value in biomarkers.items():
|
| 335 |
result = validator.validate_biomarker(name, value) # Fixed: use validate_biomarker instead of validate_single
|
| 336 |
if result.status in ['HIGH', 'LOW', 'CRITICAL_HIGH', 'CRITICAL_LOW']:
|
| 337 |
out_of_range_count += 1
|
| 338 |
if result.status in ['CRITICAL_HIGH', 'CRITICAL_LOW']:
|
| 339 |
critical_count += 1
|
| 340 |
+
|
| 341 |
# Count safety alerts in output
|
| 342 |
safety_alerts = final_response.get('safety_alerts', [])
|
| 343 |
alert_count = len(safety_alerts)
|
| 344 |
critical_alerts = sum(1 for a in safety_alerts if a.get('severity') == 'CRITICAL')
|
| 345 |
+
|
| 346 |
# Check if all critical values have alerts
|
| 347 |
critical_coverage = critical_alerts / critical_count if critical_count > 0 else 1.0
|
| 348 |
+
|
| 349 |
# Check for disclaimer
|
| 350 |
has_disclaimer = 'disclaimer' in final_response.get('metadata', {})
|
| 351 |
+
|
| 352 |
# Check for uncertainty acknowledgment
|
| 353 |
limitations = final_response['confidence_assessment'].get('limitations', [])
|
| 354 |
acknowledges_uncertainty = len(limitations) > 0
|
| 355 |
+
|
| 356 |
# Scoring
|
| 357 |
alert_score = min(1.0, alert_count / max(1, out_of_range_count))
|
| 358 |
critical_score = min(1.0, critical_coverage)
|
| 359 |
disclaimer_score = 1.0 if has_disclaimer else 0.0
|
| 360 |
uncertainty_score = 1.0 if acknowledges_uncertainty else 0.5
|
| 361 |
+
|
| 362 |
final_score = min(1.0, (
|
| 363 |
alert_score * 0.4 +
|
| 364 |
critical_score * 0.3 +
|
| 365 |
disclaimer_score * 0.2 +
|
| 366 |
uncertainty_score * 0.1
|
| 367 |
))
|
| 368 |
+
|
| 369 |
reasoning = f"""
|
| 370 |
Out-of-range biomarkers: {out_of_range_count}
|
| 371 |
Critical values: {critical_count}
|
|
|
|
| 375 |
Has disclaimer: {has_disclaimer}
|
| 376 |
Acknowledges uncertainty: {acknowledges_uncertainty}
|
| 377 |
"""
|
| 378 |
+
|
| 379 |
return GradedScore(score=final_score, reasoning=reasoning.strip())
|
| 380 |
|
| 381 |
|
| 382 |
# Master Evaluation Function
|
| 383 |
def run_full_evaluation(
|
| 384 |
+
final_response: dict[str, Any],
|
| 385 |
+
agent_outputs: list[Any],
|
| 386 |
+
biomarkers: dict[str, float]
|
| 387 |
) -> EvaluationResult:
|
| 388 |
"""
|
| 389 |
Orchestrates all 5 evaluators and returns complete assessment.
|
|
|
|
| 391 |
print("=" * 70)
|
| 392 |
print("RUNNING 5D EVALUATION GAUNTLET")
|
| 393 |
print("=" * 70)
|
| 394 |
+
|
| 395 |
# Extract context from agent outputs
|
| 396 |
pubmed_context = ""
|
| 397 |
for output in agent_outputs:
|
|
|
|
| 404 |
else:
|
| 405 |
pubmed_context = str(findings)
|
| 406 |
break
|
| 407 |
+
|
| 408 |
# Run all evaluators
|
| 409 |
print("\n1. Evaluating Clinical Accuracy...")
|
| 410 |
clinical_accuracy = evaluate_clinical_accuracy(final_response, pubmed_context)
|
| 411 |
+
|
| 412 |
print("2. Evaluating Evidence Grounding...")
|
| 413 |
evidence_grounding = evaluate_evidence_grounding(final_response)
|
| 414 |
+
|
| 415 |
print("3. Evaluating Clinical Actionability...")
|
| 416 |
actionability = evaluate_actionability(final_response)
|
| 417 |
+
|
| 418 |
print("4. Evaluating Explainability Clarity...")
|
| 419 |
clarity = evaluate_clarity(final_response)
|
| 420 |
+
|
| 421 |
print("5. Evaluating Safety & Completeness...")
|
| 422 |
safety_completeness = evaluate_safety_completeness(final_response, biomarkers)
|
| 423 |
+
|
| 424 |
print("\n" + "=" * 70)
|
| 425 |
print("EVALUATION COMPLETE")
|
| 426 |
print("=" * 70)
|
| 427 |
+
|
| 428 |
return EvaluationResult(
|
| 429 |
clinical_accuracy=clinical_accuracy,
|
| 430 |
evidence_grounding=evidence_grounding,
|
|
|
|
| 439 |
# ---------------------------------------------------------------------------
|
| 440 |
|
| 441 |
def _deterministic_clinical_accuracy(
|
| 442 |
+
final_response: dict[str, Any],
|
| 443 |
pubmed_context: str
|
| 444 |
) -> GradedScore:
|
| 445 |
"""Heuristic-based clinical accuracy (deterministic)."""
|
| 446 |
score = 0.5
|
| 447 |
reasons = []
|
| 448 |
+
|
| 449 |
# Check if response has expected structure
|
| 450 |
if final_response.get('patient_summary'):
|
| 451 |
score += 0.1
|
| 452 |
reasons.append("Has patient summary")
|
| 453 |
+
|
| 454 |
if final_response.get('prediction_explanation'):
|
| 455 |
score += 0.1
|
| 456 |
reasons.append("Has prediction explanation")
|
| 457 |
+
|
| 458 |
if final_response.get('clinical_recommendations'):
|
| 459 |
score += 0.1
|
| 460 |
reasons.append("Has clinical recommendations")
|
| 461 |
+
|
| 462 |
# Check for citations
|
| 463 |
pred = final_response.get('prediction_explanation', {})
|
| 464 |
if isinstance(pred, dict):
|
|
|
|
| 466 |
if refs:
|
| 467 |
score += min(0.2, len(refs) * 0.05)
|
| 468 |
reasons.append(f"Has {len(refs)} citations")
|
| 469 |
+
|
| 470 |
return GradedScore(
|
| 471 |
score=min(1.0, score),
|
| 472 |
reasoning="[DETERMINISTIC] " + "; ".join(reasons)
|
|
|
|
| 474 |
|
| 475 |
|
| 476 |
def _deterministic_actionability(
|
| 477 |
+
final_response: dict[str, Any]
|
| 478 |
) -> GradedScore:
|
| 479 |
"""Heuristic-based actionability (deterministic)."""
|
| 480 |
score = 0.5
|
| 481 |
reasons = []
|
| 482 |
+
|
| 483 |
recs = final_response.get('clinical_recommendations', {})
|
| 484 |
if isinstance(recs, dict):
|
| 485 |
if recs.get('immediate_actions'):
|
|
|
|
| 491 |
if recs.get('monitoring'):
|
| 492 |
score += 0.1
|
| 493 |
reasons.append("Has monitoring recommendations")
|
| 494 |
+
|
| 495 |
return GradedScore(
|
| 496 |
score=min(1.0, score),
|
| 497 |
reasoning="[DETERMINISTIC] " + "; ".join(reasons) if reasons else "[DETERMINISTIC] Missing recommendations"
|
|
|
|
| 499 |
|
| 500 |
|
| 501 |
def _deterministic_clarity(
|
| 502 |
+
final_response: dict[str, Any]
|
| 503 |
) -> GradedScore:
|
| 504 |
"""Heuristic-based clarity (deterministic)."""
|
| 505 |
score = 0.5
|
| 506 |
reasons = []
|
| 507 |
+
|
| 508 |
summary = final_response.get('patient_summary', '')
|
| 509 |
if isinstance(summary, str):
|
| 510 |
word_count = len(summary.split())
|
|
|
|
| 514 |
elif word_count > 0:
|
| 515 |
score += 0.1
|
| 516 |
reasons.append("Has summary")
|
| 517 |
+
|
| 518 |
# Check for structured output
|
| 519 |
if final_response.get('biomarker_flags'):
|
| 520 |
score += 0.15
|
| 521 |
reasons.append("Has biomarker flags")
|
| 522 |
+
|
| 523 |
if final_response.get('key_findings'):
|
| 524 |
score += 0.15
|
| 525 |
reasons.append("Has key findings")
|
| 526 |
+
|
| 527 |
return GradedScore(
|
| 528 |
score=min(1.0, score),
|
| 529 |
reasoning="[DETERMINISTIC] " + "; ".join(reasons) if reasons else "[DETERMINISTIC] Limited structure"
|
src/exceptions.py
CHANGED
|
@@ -6,15 +6,14 @@ Each service layer raises its own exception type so callers can handle
|
|
| 6 |
failures precisely without leaking implementation details.
|
| 7 |
"""
|
| 8 |
|
| 9 |
-
from typing import Any
|
| 10 |
-
|
| 11 |
|
| 12 |
# ── Base ──────────────────────────────────────────────────────────────────────
|
| 13 |
|
| 14 |
class MediGuardError(Exception):
|
| 15 |
"""Root exception for the entire MediGuard AI application."""
|
| 16 |
|
| 17 |
-
def __init__(self, message: str = "", *, details:
|
| 18 |
self.details = details or {}
|
| 19 |
super().__init__(message)
|
| 20 |
|
|
|
|
| 6 |
failures precisely without leaking implementation details.
|
| 7 |
"""
|
| 8 |
|
| 9 |
+
from typing import Any
|
|
|
|
| 10 |
|
| 11 |
# ── Base ──────────────────────────────────────────────────────────────────────
|
| 12 |
|
| 13 |
class MediGuardError(Exception):
|
| 14 |
"""Root exception for the entire MediGuard AI application."""
|
| 15 |
|
| 16 |
+
def __init__(self, message: str = "", *, details: dict[str, Any] | None = None):
|
| 17 |
self.details = details or {}
|
| 18 |
super().__init__(message)
|
| 19 |
|
src/gradio_app.py
CHANGED
|
@@ -17,15 +17,33 @@ logger = logging.getLogger(__name__)
|
|
| 17 |
API_BASE = os.getenv("MEDIGUARD_API_URL", "http://localhost:8000")
|
| 18 |
|
| 19 |
|
| 20 |
-
def
|
| 21 |
-
"""Call the /ask endpoint."""
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 22 |
try:
|
| 23 |
-
with httpx.
|
| 24 |
-
resp = client.post(f"{API_BASE}/ask", json={"question": question})
|
| 25 |
resp.raise_for_status()
|
| 26 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 27 |
except Exception as exc:
|
| 28 |
-
|
|
|
|
| 29 |
|
| 30 |
|
| 31 |
def _call_analyze(biomarkers_json: str) -> str:
|
|
@@ -47,7 +65,7 @@ def _call_analyze(biomarkers_json: str) -> str:
|
|
| 47 |
return f"Error: {exc}"
|
| 48 |
|
| 49 |
|
| 50 |
-
def launch_gradio(share: bool = False) -> None:
|
| 51 |
"""Launch the Gradio interface."""
|
| 52 |
try:
|
| 53 |
import gradio as gr
|
|
@@ -62,14 +80,27 @@ def launch_gradio(share: bool = False) -> None:
|
|
| 62 |
)
|
| 63 |
|
| 64 |
with gr.Tab("Ask a Question"):
|
| 65 |
-
|
| 66 |
-
|
| 67 |
-
|
| 68 |
-
|
| 69 |
-
|
| 70 |
-
|
| 71 |
-
|
| 72 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 73 |
|
| 74 |
with gr.Tab("Analyze Biomarkers"):
|
| 75 |
bio_input = gr.Textbox(
|
|
@@ -82,20 +113,28 @@ def launch_gradio(share: bool = False) -> None:
|
|
| 82 |
analyze_btn.click(fn=_call_analyze, inputs=bio_input, outputs=analysis_output)
|
| 83 |
|
| 84 |
with gr.Tab("Search Knowledge Base"):
|
| 85 |
-
|
| 86 |
-
|
| 87 |
-
|
| 88 |
-
|
| 89 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 90 |
search_btn = gr.Button("Search", variant="primary")
|
| 91 |
search_output = gr.Textbox(label="Results", lines=15, interactive=False)
|
| 92 |
|
| 93 |
-
def _call_search(query: str) -> str:
|
| 94 |
try:
|
| 95 |
with httpx.Client(timeout=30.0) as client:
|
| 96 |
resp = client.post(
|
| 97 |
f"{API_BASE}/search",
|
| 98 |
-
json={"query": query, "top_k": 5, "mode":
|
| 99 |
)
|
| 100 |
resp.raise_for_status()
|
| 101 |
data = resp.json()
|
|
@@ -112,10 +151,11 @@ def launch_gradio(share: bool = False) -> None:
|
|
| 112 |
except Exception as exc:
|
| 113 |
return f"Error: {exc}"
|
| 114 |
|
| 115 |
-
search_btn.click(fn=_call_search, inputs=search_input, outputs=search_output)
|
| 116 |
|
| 117 |
-
demo.launch(server_name="0.0.0.0", server_port=
|
| 118 |
|
| 119 |
|
| 120 |
if __name__ == "__main__":
|
| 121 |
-
|
|
|
|
|
|
| 17 |
API_BASE = os.getenv("MEDIGUARD_API_URL", "http://localhost:8000")
|
| 18 |
|
| 19 |
|
| 20 |
+
def ask_stream(question: str, history: list, model: str):
|
| 21 |
+
"""Call the /ask/stream endpoint."""
|
| 22 |
+
history = history or []
|
| 23 |
+
if not question.strip():
|
| 24 |
+
yield "", history
|
| 25 |
+
return
|
| 26 |
+
|
| 27 |
+
history.append((question, ""))
|
| 28 |
+
|
| 29 |
try:
|
| 30 |
+
with httpx.stream("POST", f"{API_BASE}/ask/stream", json={"question": question}, timeout=60.0) as resp:
|
|
|
|
| 31 |
resp.raise_for_status()
|
| 32 |
+
for line in resp.iter_lines():
|
| 33 |
+
if line.startswith("data: "):
|
| 34 |
+
content = line[6:]
|
| 35 |
+
if content == "[DONE]":
|
| 36 |
+
break
|
| 37 |
+
try:
|
| 38 |
+
data = json.loads(content)
|
| 39 |
+
current_bot_msg = history[-1][1] + data.get("text", "")
|
| 40 |
+
history[-1] = (question, current_bot_msg)
|
| 41 |
+
yield "", history
|
| 42 |
+
except Exception as trace_exc:
|
| 43 |
+
logger.debug("Failed to parse streaming chunk: %s", trace_exc)
|
| 44 |
except Exception as exc:
|
| 45 |
+
history[-1] = (question, f"Error: {exc}")
|
| 46 |
+
yield "", history
|
| 47 |
|
| 48 |
|
| 49 |
def _call_analyze(biomarkers_json: str) -> str:
|
|
|
|
| 65 |
return f"Error: {exc}"
|
| 66 |
|
| 67 |
|
| 68 |
+
def launch_gradio(share: bool = False, server_port: int = 7860) -> None:
|
| 69 |
"""Launch the Gradio interface."""
|
| 70 |
try:
|
| 71 |
import gradio as gr
|
|
|
|
| 80 |
)
|
| 81 |
|
| 82 |
with gr.Tab("Ask a Question"):
|
| 83 |
+
with gr.Row():
|
| 84 |
+
with gr.Column(scale=3):
|
| 85 |
+
chatbot = gr.Chatbot(label="Medical Q&A History", height=400)
|
| 86 |
+
question_input = gr.Textbox(
|
| 87 |
+
label="Medical Question",
|
| 88 |
+
placeholder="e.g., What does a high HbA1c level indicate?",
|
| 89 |
+
lines=2,
|
| 90 |
+
)
|
| 91 |
+
with gr.Row():
|
| 92 |
+
ask_btn = gr.Button("Ask (Streaming)", variant="primary")
|
| 93 |
+
clear_btn = gr.Button("Clear History")
|
| 94 |
+
|
| 95 |
+
with gr.Column(scale=1):
|
| 96 |
+
model_selector = gr.Dropdown(
|
| 97 |
+
choices=["llama-3.3-70b-versatile", "gemini-2.0-flash", "llama3.1:8b"],
|
| 98 |
+
value="llama-3.3-70b-versatile",
|
| 99 |
+
label="LLM Provider/Model"
|
| 100 |
+
)
|
| 101 |
+
|
| 102 |
+
ask_btn.click(fn=ask_stream, inputs=[question_input, chatbot, model_selector], outputs=[question_input, chatbot])
|
| 103 |
+
clear_btn.click(fn=lambda: ([], ""), outputs=[chatbot, question_input])
|
| 104 |
|
| 105 |
with gr.Tab("Analyze Biomarkers"):
|
| 106 |
bio_input = gr.Textbox(
|
|
|
|
| 113 |
analyze_btn.click(fn=_call_analyze, inputs=bio_input, outputs=analysis_output)
|
| 114 |
|
| 115 |
with gr.Tab("Search Knowledge Base"):
|
| 116 |
+
with gr.Row():
|
| 117 |
+
search_input = gr.Textbox(
|
| 118 |
+
label="Search Query",
|
| 119 |
+
placeholder="e.g., diabetes management guidelines",
|
| 120 |
+
lines=2,
|
| 121 |
+
scale=3
|
| 122 |
+
)
|
| 123 |
+
search_mode = gr.Radio(
|
| 124 |
+
choices=["hybrid", "bm25", "vector"],
|
| 125 |
+
value="hybrid",
|
| 126 |
+
label="Search Strategy",
|
| 127 |
+
scale=1
|
| 128 |
+
)
|
| 129 |
search_btn = gr.Button("Search", variant="primary")
|
| 130 |
search_output = gr.Textbox(label="Results", lines=15, interactive=False)
|
| 131 |
|
| 132 |
+
def _call_search(query: str, mode: str) -> str:
|
| 133 |
try:
|
| 134 |
with httpx.Client(timeout=30.0) as client:
|
| 135 |
resp = client.post(
|
| 136 |
f"{API_BASE}/search",
|
| 137 |
+
json={"query": query, "top_k": 5, "mode": mode},
|
| 138 |
)
|
| 139 |
resp.raise_for_status()
|
| 140 |
data = resp.json()
|
|
|
|
| 151 |
except Exception as exc:
|
| 152 |
return f"Error: {exc}"
|
| 153 |
|
| 154 |
+
search_btn.click(fn=_call_search, inputs=[search_input, search_mode], outputs=search_output)
|
| 155 |
|
| 156 |
+
demo.launch(server_name="0.0.0.0", server_port=server_port, share=share)
|
| 157 |
|
| 158 |
|
| 159 |
if __name__ == "__main__":
|
| 160 |
+
port = int(os.environ.get("GRADIO_PORT", 7860))
|
| 161 |
+
launch_gradio(server_port=port)
|
src/llm_config.py
CHANGED
|
@@ -14,7 +14,8 @@ Environment Variables (supports both naming conventions):
|
|
| 14 |
|
| 15 |
import os
|
| 16 |
import threading
|
| 17 |
-
from typing import Literal
|
|
|
|
| 18 |
from dotenv import load_dotenv
|
| 19 |
|
| 20 |
# Load environment variables
|
|
@@ -64,8 +65,8 @@ DEFAULT_LLM_PROVIDER = get_default_llm_provider()
|
|
| 64 |
|
| 65 |
|
| 66 |
def get_chat_model(
|
| 67 |
-
provider:
|
| 68 |
-
model:
|
| 69 |
temperature: float = 0.0,
|
| 70 |
json_mode: bool = False
|
| 71 |
):
|
|
@@ -83,61 +84,61 @@ def get_chat_model(
|
|
| 83 |
"""
|
| 84 |
# Use dynamic lookup to get current provider from environment
|
| 85 |
provider = provider or get_default_llm_provider()
|
| 86 |
-
|
| 87 |
if provider == "groq":
|
| 88 |
from langchain_groq import ChatGroq
|
| 89 |
-
|
| 90 |
api_key = get_groq_api_key()
|
| 91 |
if not api_key:
|
| 92 |
raise ValueError(
|
| 93 |
"GROQ_API_KEY not found in environment.\n"
|
| 94 |
"Get your FREE API key at: https://console.groq.com/keys"
|
| 95 |
)
|
| 96 |
-
|
| 97 |
# Use model from environment or default
|
| 98 |
model = model or get_groq_model()
|
| 99 |
-
|
| 100 |
return ChatGroq(
|
| 101 |
model=model,
|
| 102 |
temperature=temperature,
|
| 103 |
api_key=api_key,
|
| 104 |
model_kwargs={"response_format": {"type": "json_object"}} if json_mode else {}
|
| 105 |
)
|
| 106 |
-
|
| 107 |
elif provider == "gemini":
|
| 108 |
from langchain_google_genai import ChatGoogleGenerativeAI
|
| 109 |
-
|
| 110 |
api_key = get_google_api_key()
|
| 111 |
if not api_key:
|
| 112 |
raise ValueError(
|
| 113 |
"GOOGLE_API_KEY not found in environment.\n"
|
| 114 |
"Get your FREE API key at: https://aistudio.google.com/app/apikey"
|
| 115 |
)
|
| 116 |
-
|
| 117 |
# Use model from environment or default
|
| 118 |
model = model or get_gemini_model()
|
| 119 |
-
|
| 120 |
return ChatGoogleGenerativeAI(
|
| 121 |
model=model,
|
| 122 |
temperature=temperature,
|
| 123 |
google_api_key=api_key,
|
| 124 |
convert_system_message_to_human=True
|
| 125 |
)
|
| 126 |
-
|
| 127 |
elif provider == "ollama":
|
| 128 |
try:
|
| 129 |
from langchain_ollama import ChatOllama
|
| 130 |
except ImportError:
|
| 131 |
from langchain_community.chat_models import ChatOllama
|
| 132 |
-
|
| 133 |
model = model or "llama3.1:8b"
|
| 134 |
-
|
| 135 |
return ChatOllama(
|
| 136 |
model=model,
|
| 137 |
temperature=temperature,
|
| 138 |
format='json' if json_mode else None
|
| 139 |
)
|
| 140 |
-
|
| 141 |
else:
|
| 142 |
raise ValueError(f"Unknown provider: {provider}. Use 'groq', 'gemini', or 'ollama'")
|
| 143 |
|
|
@@ -147,7 +148,7 @@ def get_embedding_provider() -> str:
|
|
| 147 |
return _get_env_with_fallback("EMBEDDING_PROVIDER", "EMBEDDING__PROVIDER", "huggingface")
|
| 148 |
|
| 149 |
|
| 150 |
-
def get_embedding_model(provider:
|
| 151 |
"""
|
| 152 |
Get embedding model for vector search.
|
| 153 |
|
|
@@ -162,7 +163,7 @@ def get_embedding_model(provider: Optional[Literal["jina", "google", "huggingfac
|
|
| 162 |
which has automatic fallback chain: Jina → Google → HuggingFace.
|
| 163 |
"""
|
| 164 |
provider = provider or get_embedding_provider()
|
| 165 |
-
|
| 166 |
if provider == "jina":
|
| 167 |
# Try Jina AI embeddings first (high quality, 1024d)
|
| 168 |
jina_key = _get_env_with_fallback("JINA_API_KEY", "EMBEDDING__JINA_API_KEY", "")
|
|
@@ -178,15 +179,15 @@ def get_embedding_model(provider: Optional[Literal["jina", "google", "huggingfac
|
|
| 178 |
else:
|
| 179 |
print("WARN: JINA_API_KEY not found. Falling back to Google embeddings.")
|
| 180 |
return get_embedding_model("google")
|
| 181 |
-
|
| 182 |
elif provider == "google":
|
| 183 |
from langchain_google_genai import GoogleGenerativeAIEmbeddings
|
| 184 |
-
|
| 185 |
api_key = get_google_api_key()
|
| 186 |
if not api_key:
|
| 187 |
print("WARN: GOOGLE_API_KEY not found. Falling back to HuggingFace embeddings.")
|
| 188 |
return get_embedding_model("huggingface")
|
| 189 |
-
|
| 190 |
try:
|
| 191 |
return GoogleGenerativeAIEmbeddings(
|
| 192 |
model="models/text-embedding-004",
|
|
@@ -196,33 +197,33 @@ def get_embedding_model(provider: Optional[Literal["jina", "google", "huggingfac
|
|
| 196 |
print(f"WARN: Google embeddings failed: {e}")
|
| 197 |
print("INFO: Falling back to HuggingFace embeddings...")
|
| 198 |
return get_embedding_model("huggingface")
|
| 199 |
-
|
| 200 |
elif provider == "huggingface":
|
| 201 |
try:
|
| 202 |
from langchain_huggingface import HuggingFaceEmbeddings
|
| 203 |
except ImportError:
|
| 204 |
from langchain_community.embeddings import HuggingFaceEmbeddings
|
| 205 |
-
|
| 206 |
return HuggingFaceEmbeddings(
|
| 207 |
model_name="sentence-transformers/all-MiniLM-L6-v2"
|
| 208 |
)
|
| 209 |
-
|
| 210 |
elif provider == "ollama":
|
| 211 |
try:
|
| 212 |
from langchain_ollama import OllamaEmbeddings
|
| 213 |
except ImportError:
|
| 214 |
from langchain_community.embeddings import OllamaEmbeddings
|
| 215 |
-
|
| 216 |
return OllamaEmbeddings(model="nomic-embed-text")
|
| 217 |
-
|
| 218 |
else:
|
| 219 |
raise ValueError(f"Unknown embedding provider: {provider}")
|
| 220 |
|
| 221 |
|
| 222 |
class LLMConfig:
|
| 223 |
"""Central configuration for all LLM models"""
|
| 224 |
-
|
| 225 |
-
def __init__(self, provider:
|
| 226 |
"""
|
| 227 |
Initialize all model clients.
|
| 228 |
|
|
@@ -236,7 +237,7 @@ class LLMConfig:
|
|
| 236 |
self._initialized = False
|
| 237 |
self._initialized_provider = None # Track which provider was initialized
|
| 238 |
self._lock = threading.Lock()
|
| 239 |
-
|
| 240 |
# Lazy-initialized model instances
|
| 241 |
self._planner = None
|
| 242 |
self._analyzer = None
|
|
@@ -245,15 +246,15 @@ class LLMConfig:
|
|
| 245 |
self._synthesizer_8b = None
|
| 246 |
self._director = None
|
| 247 |
self._embedding_model = None
|
| 248 |
-
|
| 249 |
if not lazy:
|
| 250 |
self._initialize_models()
|
| 251 |
-
|
| 252 |
@property
|
| 253 |
def provider(self) -> str:
|
| 254 |
"""Get current provider (dynamic lookup if not explicitly set)."""
|
| 255 |
return self._explicit_provider or get_default_llm_provider()
|
| 256 |
-
|
| 257 |
def _check_provider_change(self):
|
| 258 |
"""Check if provider changed and reinitialize if needed."""
|
| 259 |
current = self.provider
|
|
@@ -266,120 +267,120 @@ class LLMConfig:
|
|
| 266 |
self._synthesizer_7b = None
|
| 267 |
self._synthesizer_8b = None
|
| 268 |
self._director = None
|
| 269 |
-
|
| 270 |
def _initialize_models(self):
|
| 271 |
"""Initialize all model clients (called on first use if lazy)"""
|
| 272 |
self._check_provider_change()
|
| 273 |
-
|
| 274 |
if self._initialized:
|
| 275 |
return
|
| 276 |
-
|
| 277 |
with self._lock:
|
| 278 |
# Double-checked locking
|
| 279 |
if self._initialized:
|
| 280 |
return
|
| 281 |
-
|
| 282 |
print(f"Initializing LLM models with provider: {self.provider.upper()}")
|
| 283 |
-
|
| 284 |
# Fast model for structured tasks (planning, analysis)
|
| 285 |
self._planner = get_chat_model(
|
| 286 |
provider=self.provider,
|
| 287 |
temperature=0.0,
|
| 288 |
json_mode=True
|
| 289 |
)
|
| 290 |
-
|
| 291 |
# Fast model for biomarker analysis and quick tasks
|
| 292 |
self._analyzer = get_chat_model(
|
| 293 |
provider=self.provider,
|
| 294 |
temperature=0.0
|
| 295 |
)
|
| 296 |
-
|
| 297 |
# Medium model for RAG retrieval and explanation
|
| 298 |
self._explainer = get_chat_model(
|
| 299 |
provider=self.provider,
|
| 300 |
temperature=0.2
|
| 301 |
)
|
| 302 |
-
|
| 303 |
# Configurable synthesizers
|
| 304 |
self._synthesizer_7b = get_chat_model(
|
| 305 |
provider=self.provider,
|
| 306 |
temperature=0.2
|
| 307 |
)
|
| 308 |
-
|
| 309 |
self._synthesizer_8b = get_chat_model(
|
| 310 |
provider=self.provider,
|
| 311 |
temperature=0.2
|
| 312 |
)
|
| 313 |
-
|
| 314 |
# Director for Outer Loop
|
| 315 |
self._director = get_chat_model(
|
| 316 |
provider=self.provider,
|
| 317 |
temperature=0.0,
|
| 318 |
json_mode=True
|
| 319 |
)
|
| 320 |
-
|
| 321 |
-
# Embedding model for RAG
|
| 322 |
self._embedding_model = get_embedding_model()
|
| 323 |
-
|
| 324 |
self._initialized = True
|
| 325 |
self._initialized_provider = self.provider
|
| 326 |
-
|
| 327 |
@property
|
| 328 |
def planner(self):
|
| 329 |
self._initialize_models()
|
| 330 |
return self._planner
|
| 331 |
-
|
| 332 |
@property
|
| 333 |
def analyzer(self):
|
| 334 |
self._initialize_models()
|
| 335 |
return self._analyzer
|
| 336 |
-
|
| 337 |
@property
|
| 338 |
def explainer(self):
|
| 339 |
self._initialize_models()
|
| 340 |
return self._explainer
|
| 341 |
-
|
| 342 |
@property
|
| 343 |
def synthesizer_7b(self):
|
| 344 |
self._initialize_models()
|
| 345 |
return self._synthesizer_7b
|
| 346 |
-
|
| 347 |
@property
|
| 348 |
def synthesizer_8b(self):
|
| 349 |
self._initialize_models()
|
| 350 |
return self._synthesizer_8b
|
| 351 |
-
|
| 352 |
@property
|
| 353 |
def director(self):
|
| 354 |
self._initialize_models()
|
| 355 |
return self._director
|
| 356 |
-
|
| 357 |
@property
|
| 358 |
def embedding_model(self):
|
| 359 |
self._initialize_models()
|
| 360 |
return self._embedding_model
|
| 361 |
-
|
| 362 |
-
def get_synthesizer(self, model_name:
|
| 363 |
"""Get synthesizer model (for backward compatibility)"""
|
| 364 |
if model_name:
|
| 365 |
return get_chat_model(provider=self.provider, model=model_name, temperature=0.2)
|
| 366 |
return self.synthesizer_8b
|
| 367 |
-
|
| 368 |
def print_config(self):
|
| 369 |
"""Print current LLM configuration"""
|
| 370 |
print("=" * 60)
|
| 371 |
print("MediGuard AI RAG-Helper - LLM Configuration")
|
| 372 |
print("=" * 60)
|
| 373 |
print(f"Provider: {self.provider.upper()}")
|
| 374 |
-
|
| 375 |
if self.provider == "groq":
|
| 376 |
-
print(
|
| 377 |
elif self.provider == "gemini":
|
| 378 |
-
print(
|
| 379 |
else:
|
| 380 |
-
print(
|
| 381 |
-
|
| 382 |
-
print(
|
| 383 |
print("=" * 60)
|
| 384 |
|
| 385 |
|
|
@@ -387,7 +388,7 @@ class LLMConfig:
|
|
| 387 |
llm_config = LLMConfig()
|
| 388 |
|
| 389 |
|
| 390 |
-
def get_synthesizer(model_name:
|
| 391 |
"""Module-level convenience: get a synthesizer LLM instance."""
|
| 392 |
return llm_config.get_synthesizer(model_name)
|
| 393 |
|
|
@@ -395,7 +396,7 @@ def get_synthesizer(model_name: Optional[str] = None):
|
|
| 395 |
def check_api_connection():
|
| 396 |
"""Verify API connection and keys are configured"""
|
| 397 |
provider = DEFAULT_LLM_PROVIDER
|
| 398 |
-
|
| 399 |
try:
|
| 400 |
if provider == "groq":
|
| 401 |
api_key = os.getenv("GROQ_API_KEY")
|
|
@@ -404,13 +405,13 @@ def check_api_connection():
|
|
| 404 |
print("\n Get your FREE API key at:")
|
| 405 |
print(" https://console.groq.com/keys")
|
| 406 |
return False
|
| 407 |
-
|
| 408 |
# Test connection
|
| 409 |
test_model = get_chat_model("groq")
|
| 410 |
response = test_model.invoke("Say 'OK' in one word")
|
| 411 |
print("OK: Groq API connection successful")
|
| 412 |
return True
|
| 413 |
-
|
| 414 |
elif provider == "gemini":
|
| 415 |
api_key = os.getenv("GOOGLE_API_KEY")
|
| 416 |
if not api_key:
|
|
@@ -418,12 +419,12 @@ def check_api_connection():
|
|
| 418 |
print("\n Get your FREE API key at:")
|
| 419 |
print(" https://aistudio.google.com/app/apikey")
|
| 420 |
return False
|
| 421 |
-
|
| 422 |
test_model = get_chat_model("gemini")
|
| 423 |
response = test_model.invoke("Say 'OK' in one word")
|
| 424 |
print("OK: Google Gemini API connection successful")
|
| 425 |
return True
|
| 426 |
-
|
| 427 |
else:
|
| 428 |
try:
|
| 429 |
from langchain_ollama import ChatOllama
|
|
@@ -433,7 +434,7 @@ def check_api_connection():
|
|
| 433 |
response = test_model.invoke("Hello")
|
| 434 |
print("OK: Ollama connection successful")
|
| 435 |
return True
|
| 436 |
-
|
| 437 |
except Exception as e:
|
| 438 |
print(f"ERROR: Connection failed: {e}")
|
| 439 |
return False
|
|
|
|
| 14 |
|
| 15 |
import os
|
| 16 |
import threading
|
| 17 |
+
from typing import Literal
|
| 18 |
+
|
| 19 |
from dotenv import load_dotenv
|
| 20 |
|
| 21 |
# Load environment variables
|
|
|
|
| 65 |
|
| 66 |
|
| 67 |
def get_chat_model(
|
| 68 |
+
provider: Literal["groq", "gemini", "ollama"] | None = None,
|
| 69 |
+
model: str | None = None,
|
| 70 |
temperature: float = 0.0,
|
| 71 |
json_mode: bool = False
|
| 72 |
):
|
|
|
|
| 84 |
"""
|
| 85 |
# Use dynamic lookup to get current provider from environment
|
| 86 |
provider = provider or get_default_llm_provider()
|
| 87 |
+
|
| 88 |
if provider == "groq":
|
| 89 |
from langchain_groq import ChatGroq
|
| 90 |
+
|
| 91 |
api_key = get_groq_api_key()
|
| 92 |
if not api_key:
|
| 93 |
raise ValueError(
|
| 94 |
"GROQ_API_KEY not found in environment.\n"
|
| 95 |
"Get your FREE API key at: https://console.groq.com/keys"
|
| 96 |
)
|
| 97 |
+
|
| 98 |
# Use model from environment or default
|
| 99 |
model = model or get_groq_model()
|
| 100 |
+
|
| 101 |
return ChatGroq(
|
| 102 |
model=model,
|
| 103 |
temperature=temperature,
|
| 104 |
api_key=api_key,
|
| 105 |
model_kwargs={"response_format": {"type": "json_object"}} if json_mode else {}
|
| 106 |
)
|
| 107 |
+
|
| 108 |
elif provider == "gemini":
|
| 109 |
from langchain_google_genai import ChatGoogleGenerativeAI
|
| 110 |
+
|
| 111 |
api_key = get_google_api_key()
|
| 112 |
if not api_key:
|
| 113 |
raise ValueError(
|
| 114 |
"GOOGLE_API_KEY not found in environment.\n"
|
| 115 |
"Get your FREE API key at: https://aistudio.google.com/app/apikey"
|
| 116 |
)
|
| 117 |
+
|
| 118 |
# Use model from environment or default
|
| 119 |
model = model or get_gemini_model()
|
| 120 |
+
|
| 121 |
return ChatGoogleGenerativeAI(
|
| 122 |
model=model,
|
| 123 |
temperature=temperature,
|
| 124 |
google_api_key=api_key,
|
| 125 |
convert_system_message_to_human=True
|
| 126 |
)
|
| 127 |
+
|
| 128 |
elif provider == "ollama":
|
| 129 |
try:
|
| 130 |
from langchain_ollama import ChatOllama
|
| 131 |
except ImportError:
|
| 132 |
from langchain_community.chat_models import ChatOllama
|
| 133 |
+
|
| 134 |
model = model or "llama3.1:8b"
|
| 135 |
+
|
| 136 |
return ChatOllama(
|
| 137 |
model=model,
|
| 138 |
temperature=temperature,
|
| 139 |
format='json' if json_mode else None
|
| 140 |
)
|
| 141 |
+
|
| 142 |
else:
|
| 143 |
raise ValueError(f"Unknown provider: {provider}. Use 'groq', 'gemini', or 'ollama'")
|
| 144 |
|
|
|
|
| 148 |
return _get_env_with_fallback("EMBEDDING_PROVIDER", "EMBEDDING__PROVIDER", "huggingface")
|
| 149 |
|
| 150 |
|
| 151 |
+
def get_embedding_model(provider: Literal["jina", "google", "huggingface", "ollama"] | None = None):
|
| 152 |
"""
|
| 153 |
Get embedding model for vector search.
|
| 154 |
|
|
|
|
| 163 |
which has automatic fallback chain: Jina → Google → HuggingFace.
|
| 164 |
"""
|
| 165 |
provider = provider or get_embedding_provider()
|
| 166 |
+
|
| 167 |
if provider == "jina":
|
| 168 |
# Try Jina AI embeddings first (high quality, 1024d)
|
| 169 |
jina_key = _get_env_with_fallback("JINA_API_KEY", "EMBEDDING__JINA_API_KEY", "")
|
|
|
|
| 179 |
else:
|
| 180 |
print("WARN: JINA_API_KEY not found. Falling back to Google embeddings.")
|
| 181 |
return get_embedding_model("google")
|
| 182 |
+
|
| 183 |
elif provider == "google":
|
| 184 |
from langchain_google_genai import GoogleGenerativeAIEmbeddings
|
| 185 |
+
|
| 186 |
api_key = get_google_api_key()
|
| 187 |
if not api_key:
|
| 188 |
print("WARN: GOOGLE_API_KEY not found. Falling back to HuggingFace embeddings.")
|
| 189 |
return get_embedding_model("huggingface")
|
| 190 |
+
|
| 191 |
try:
|
| 192 |
return GoogleGenerativeAIEmbeddings(
|
| 193 |
model="models/text-embedding-004",
|
|
|
|
| 197 |
print(f"WARN: Google embeddings failed: {e}")
|
| 198 |
print("INFO: Falling back to HuggingFace embeddings...")
|
| 199 |
return get_embedding_model("huggingface")
|
| 200 |
+
|
| 201 |
elif provider == "huggingface":
|
| 202 |
try:
|
| 203 |
from langchain_huggingface import HuggingFaceEmbeddings
|
| 204 |
except ImportError:
|
| 205 |
from langchain_community.embeddings import HuggingFaceEmbeddings
|
| 206 |
+
|
| 207 |
return HuggingFaceEmbeddings(
|
| 208 |
model_name="sentence-transformers/all-MiniLM-L6-v2"
|
| 209 |
)
|
| 210 |
+
|
| 211 |
elif provider == "ollama":
|
| 212 |
try:
|
| 213 |
from langchain_ollama import OllamaEmbeddings
|
| 214 |
except ImportError:
|
| 215 |
from langchain_community.embeddings import OllamaEmbeddings
|
| 216 |
+
|
| 217 |
return OllamaEmbeddings(model="nomic-embed-text")
|
| 218 |
+
|
| 219 |
else:
|
| 220 |
raise ValueError(f"Unknown embedding provider: {provider}")
|
| 221 |
|
| 222 |
|
| 223 |
class LLMConfig:
|
| 224 |
"""Central configuration for all LLM models"""
|
| 225 |
+
|
| 226 |
+
def __init__(self, provider: str | None = None, lazy: bool = True):
|
| 227 |
"""
|
| 228 |
Initialize all model clients.
|
| 229 |
|
|
|
|
| 237 |
self._initialized = False
|
| 238 |
self._initialized_provider = None # Track which provider was initialized
|
| 239 |
self._lock = threading.Lock()
|
| 240 |
+
|
| 241 |
# Lazy-initialized model instances
|
| 242 |
self._planner = None
|
| 243 |
self._analyzer = None
|
|
|
|
| 246 |
self._synthesizer_8b = None
|
| 247 |
self._director = None
|
| 248 |
self._embedding_model = None
|
| 249 |
+
|
| 250 |
if not lazy:
|
| 251 |
self._initialize_models()
|
| 252 |
+
|
| 253 |
@property
def provider(self) -> str:
    """Resolve the active LLM provider.

    An explicitly supplied provider (constructor argument) always wins;
    otherwise the value is looked up dynamically from the environment so
    runtime changes to the env var are picked up.
    """
    explicit = self._explicit_provider
    if explicit:
        return explicit
    return get_default_llm_provider()
|
| 257 |
+
|
| 258 |
def _check_provider_change(self):
|
| 259 |
"""Check if provider changed and reinitialize if needed."""
|
| 260 |
current = self.provider
|
|
|
|
| 267 |
self._synthesizer_7b = None
|
| 268 |
self._synthesizer_8b = None
|
| 269 |
self._director = None
|
| 270 |
+
|
| 271 |
def _initialize_models(self):
    """Initialize all model clients (called on first use if lazy).

    Thread-safe via double-checked locking: the cheap ``_initialized``
    flag is tested before and after acquiring ``self._lock`` so that
    concurrent first accesses only build the models once.  If the
    configured provider changed since the last init,
    ``_check_provider_change`` resets the cached instances first.
    """
    self._check_provider_change()

    # Fast path: already initialized, no lock needed.
    if self._initialized:
        return

    with self._lock:
        # Double-checked locking
        if self._initialized:
            return

        print(f"Initializing LLM models with provider: {self.provider.upper()}")

        # Fast model for structured tasks (planning, analysis)
        # json_mode=True: planner output must be machine-parseable.
        self._planner = get_chat_model(
            provider=self.provider,
            temperature=0.0,
            json_mode=True
        )

        # Fast model for biomarker analysis and quick tasks
        # temperature 0.0 keeps analysis deterministic.
        self._analyzer = get_chat_model(
            provider=self.provider,
            temperature=0.0
        )

        # Medium model for RAG retrieval and explanation
        # slight temperature (0.2) allows more natural prose.
        self._explainer = get_chat_model(
            provider=self.provider,
            temperature=0.2
        )

        # Configurable synthesizers
        # NOTE(review): both synthesizers are built with identical settings
        # here — presumably the 7b/8b split is a historical distinction.
        self._synthesizer_7b = get_chat_model(
            provider=self.provider,
            temperature=0.2
        )

        self._synthesizer_8b = get_chat_model(
            provider=self.provider,
            temperature=0.2
        )

        # Director for Outer Loop
        # json_mode=True: director decisions are consumed programmatically.
        self._director = get_chat_model(
            provider=self.provider,
            temperature=0.0,
            json_mode=True
        )

        # Embedding model for RAG
        self._embedding_model = get_embedding_model()

        # Record success and which provider the instances belong to, so a
        # later provider switch can be detected and trigger re-init.
        self._initialized = True
        self._initialized_provider = self.provider
|
| 327 |
+
|
| 328 |
@property
def planner(self):
    """Structured-output planning model, built lazily on first access."""
    self._initialize_models()
    model = self._planner
    return model
|
| 332 |
+
|
| 333 |
@property
def analyzer(self):
    """Deterministic analysis model, built lazily on first access."""
    self._initialize_models()
    model = self._analyzer
    return model
|
| 337 |
+
|
| 338 |
@property
def explainer(self):
    """RAG explanation model, built lazily on first access."""
    self._initialize_models()
    model = self._explainer
    return model
|
| 342 |
+
|
| 343 |
@property
def synthesizer_7b(self):
    """Synthesizer model (7b slot), built lazily on first access."""
    self._initialize_models()
    model = self._synthesizer_7b
    return model
|
| 347 |
+
|
| 348 |
@property
def synthesizer_8b(self):
    """Synthesizer model (8b slot, the default), built lazily on first access."""
    self._initialize_models()
    model = self._synthesizer_8b
    return model
|
| 352 |
+
|
| 353 |
@property
def director(self):
    """Outer-loop director model (JSON output), built lazily on first access."""
    self._initialize_models()
    model = self._director
    return model
|
| 357 |
+
|
| 358 |
@property
def embedding_model(self):
    """Embedding model for RAG vector search, built lazily on first access."""
    self._initialize_models()
    model = self._embedding_model
    return model
|
| 362 |
+
|
| 363 |
+
def get_synthesizer(self, model_name: str | None = None):
    """Return a synthesizer LLM (kept for backward compatibility).

    When *model_name* is provided, a fresh chat model is built for that
    name; otherwise the cached default synthesizer is reused.
    """
    if not model_name:
        return self.synthesizer_8b
    return get_chat_model(provider=self.provider, model=model_name, temperature=0.2)
|
| 368 |
+
|
| 369 |
def print_config(self):
    """Display the active LLM configuration on stdout."""
    separator = "=" * 60
    active = self.provider
    # Provider -> human-readable model label; fallback covers ollama/local.
    model_labels = {
        "groq": "Model: llama-3.3-70b-versatile (FREE)",
        "gemini": "Model: gemini-2.0-flash (FREE)",
    }
    print(separator)
    print("MediGuard AI RAG-Helper - LLM Configuration")
    print(separator)
    print(f"Provider: {active.upper()}")
    print(model_labels.get(active, "Model: llama3.1:8b (local)"))
    print("Embeddings: Google Gemini (FREE)")
    print(separator)
|
| 385 |
|
| 386 |
|
|
|
|
| 388 |
llm_config = LLMConfig()
|
| 389 |
|
| 390 |
|
| 391 |
+
def get_synthesizer(model_name: str | None = None):
    """Convenience shortcut that delegates to the shared ``llm_config`` singleton."""
    synthesizer = llm_config.get_synthesizer(model_name)
    return synthesizer
|
| 394 |
|
|
|
|
| 396 |
def check_api_connection():
|
| 397 |
"""Verify API connection and keys are configured"""
|
| 398 |
provider = DEFAULT_LLM_PROVIDER
|
| 399 |
+
|
| 400 |
try:
|
| 401 |
if provider == "groq":
|
| 402 |
api_key = os.getenv("GROQ_API_KEY")
|
|
|
|
| 405 |
print("\n Get your FREE API key at:")
|
| 406 |
print(" https://console.groq.com/keys")
|
| 407 |
return False
|
| 408 |
+
|
| 409 |
# Test connection
|
| 410 |
test_model = get_chat_model("groq")
|
| 411 |
response = test_model.invoke("Say 'OK' in one word")
|
| 412 |
print("OK: Groq API connection successful")
|
| 413 |
return True
|
| 414 |
+
|
| 415 |
elif provider == "gemini":
|
| 416 |
api_key = os.getenv("GOOGLE_API_KEY")
|
| 417 |
if not api_key:
|
|
|
|
| 419 |
print("\n Get your FREE API key at:")
|
| 420 |
print(" https://aistudio.google.com/app/apikey")
|
| 421 |
return False
|
| 422 |
+
|
| 423 |
test_model = get_chat_model("gemini")
|
| 424 |
response = test_model.invoke("Say 'OK' in one word")
|
| 425 |
print("OK: Google Gemini API connection successful")
|
| 426 |
return True
|
| 427 |
+
|
| 428 |
else:
|
| 429 |
try:
|
| 430 |
from langchain_ollama import ChatOllama
|
|
|
|
| 434 |
response = test_model.invoke("Hello")
|
| 435 |
print("OK: Ollama connection successful")
|
| 436 |
return True
|
| 437 |
+
|
| 438 |
except Exception as e:
|
| 439 |
print(f"ERROR: Connection failed: {e}")
|
| 440 |
return False
|
src/main.py
CHANGED
|
@@ -13,7 +13,7 @@ import logging
|
|
| 13 |
import os
|
| 14 |
import time
|
| 15 |
from contextlib import asynccontextmanager
|
| 16 |
-
from datetime import
|
| 17 |
|
| 18 |
from fastapi import FastAPI, Request, status
|
| 19 |
from fastapi.exceptions import RequestValidationError
|
|
@@ -49,7 +49,9 @@ async def lifespan(app: FastAPI):
|
|
| 49 |
# --- OpenSearch ---
|
| 50 |
try:
|
| 51 |
from src.services.opensearch.client import make_opensearch_client
|
|
|
|
| 52 |
app.state.opensearch_client = make_opensearch_client()
|
|
|
|
| 53 |
logger.info("OpenSearch client ready")
|
| 54 |
except Exception as exc:
|
| 55 |
logger.warning("OpenSearch unavailable: %s", exc)
|
|
@@ -59,7 +61,7 @@ async def lifespan(app: FastAPI):
|
|
| 59 |
try:
|
| 60 |
from src.services.embeddings.service import make_embedding_service
|
| 61 |
app.state.embedding_service = make_embedding_service()
|
| 62 |
-
logger.info("Embedding service ready (provider=%s)", app.state.embedding_service.
|
| 63 |
except Exception as exc:
|
| 64 |
logger.warning("Embedding service unavailable: %s", exc)
|
| 65 |
app.state.embedding_service = None
|
|
@@ -93,11 +95,11 @@ async def lifespan(app: FastAPI):
|
|
| 93 |
|
| 94 |
# --- Agentic RAG service ---
|
| 95 |
try:
|
|
|
|
| 96 |
from src.services.agents.agentic_rag import AgenticRAGService
|
| 97 |
from src.services.agents.context import AgenticContext
|
| 98 |
-
|
| 99 |
-
|
| 100 |
-
llm = app.state.ollama_client.get_langchain_model()
|
| 101 |
ctx = AgenticContext(
|
| 102 |
llm=llm,
|
| 103 |
embedding_service=app.state.embedding_service,
|
|
@@ -109,17 +111,16 @@ async def lifespan(app: FastAPI):
|
|
| 109 |
logger.info("Agentic RAG service ready")
|
| 110 |
else:
|
| 111 |
app.state.rag_service = None
|
| 112 |
-
logger.warning("Agentic RAG service skipped — missing backing services")
|
| 113 |
except Exception as exc:
|
| 114 |
logger.warning("Agentic RAG service failed: %s", exc)
|
| 115 |
app.state.rag_service = None
|
| 116 |
|
| 117 |
# --- Legacy RagBot service (backward-compatible /analyze) ---
|
| 118 |
try:
|
| 119 |
-
from
|
| 120 |
-
|
| 121 |
-
|
| 122 |
-
app.state.ragbot_service = ragbot
|
| 123 |
logger.info("RagBot service ready (ClinicalInsightGuild)")
|
| 124 |
except Exception as exc:
|
| 125 |
logger.warning("RagBot service unavailable: %s", exc)
|
|
@@ -127,17 +128,13 @@ async def lifespan(app: FastAPI):
|
|
| 127 |
|
| 128 |
# --- Extraction service (for natural language input) ---
|
| 129 |
try:
|
|
|
|
| 130 |
from src.services.extraction.service import make_extraction_service
|
| 131 |
-
|
| 132 |
-
|
| 133 |
-
|
| 134 |
-
|
| 135 |
-
|
| 136 |
-
llm = getattr(app.state.rag_service, '_context', {})
|
| 137 |
-
if hasattr(llm, 'llm'):
|
| 138 |
-
llm = llm.llm
|
| 139 |
-
else:
|
| 140 |
-
llm = None
|
| 141 |
# If no LLM available, extraction will use regex fallback
|
| 142 |
app.state.extraction_service = make_extraction_service(llm=llm)
|
| 143 |
logger.info("Extraction service ready")
|
|
@@ -196,7 +193,7 @@ def create_app() -> FastAPI:
|
|
| 196 |
"error_code": "VALIDATION_ERROR",
|
| 197 |
"message": "Request validation failed",
|
| 198 |
"details": exc.errors(),
|
| 199 |
-
"timestamp": datetime.now(
|
| 200 |
},
|
| 201 |
)
|
| 202 |
|
|
@@ -209,12 +206,12 @@ def create_app() -> FastAPI:
|
|
| 209 |
"status": "error",
|
| 210 |
"error_code": "INTERNAL_SERVER_ERROR",
|
| 211 |
"message": "An unexpected error occurred. Please try again later.",
|
| 212 |
-
"timestamp": datetime.now(
|
| 213 |
},
|
| 214 |
)
|
| 215 |
|
| 216 |
# --- Routers ---
|
| 217 |
-
from src.routers import
|
| 218 |
|
| 219 |
app.include_router(health.router)
|
| 220 |
app.include_router(analyze.router)
|
|
|
|
| 13 |
import os
|
| 14 |
import time
|
| 15 |
from contextlib import asynccontextmanager
|
| 16 |
+
from datetime import UTC, datetime
|
| 17 |
|
| 18 |
from fastapi import FastAPI, Request, status
|
| 19 |
from fastapi.exceptions import RequestValidationError
|
|
|
|
| 49 |
# --- OpenSearch ---
|
| 50 |
try:
|
| 51 |
from src.services.opensearch.client import make_opensearch_client
|
| 52 |
+
from src.services.opensearch.index_config import MEDICAL_CHUNKS_MAPPING
|
| 53 |
app.state.opensearch_client = make_opensearch_client()
|
| 54 |
+
app.state.opensearch_client.ensure_index(MEDICAL_CHUNKS_MAPPING)
|
| 55 |
logger.info("OpenSearch client ready")
|
| 56 |
except Exception as exc:
|
| 57 |
logger.warning("OpenSearch unavailable: %s", exc)
|
|
|
|
| 61 |
try:
|
| 62 |
from src.services.embeddings.service import make_embedding_service
|
| 63 |
app.state.embedding_service = make_embedding_service()
|
| 64 |
+
logger.info("Embedding service ready (provider=%s)", app.state.embedding_service.provider_name)
|
| 65 |
except Exception as exc:
|
| 66 |
logger.warning("Embedding service unavailable: %s", exc)
|
| 67 |
app.state.embedding_service = None
|
|
|
|
| 95 |
|
| 96 |
# --- Agentic RAG service ---
|
| 97 |
try:
|
| 98 |
+
from src.llm_config import get_llm
|
| 99 |
from src.services.agents.agentic_rag import AgenticRAGService
|
| 100 |
from src.services.agents.context import AgenticContext
|
| 101 |
+
if app.state.opensearch_client and app.state.embedding_service:
|
| 102 |
+
llm = get_llm()
|
|
|
|
| 103 |
ctx = AgenticContext(
|
| 104 |
llm=llm,
|
| 105 |
embedding_service=app.state.embedding_service,
|
|
|
|
| 111 |
logger.info("Agentic RAG service ready")
|
| 112 |
else:
|
| 113 |
app.state.rag_service = None
|
| 114 |
+
logger.warning("Agentic RAG service skipped — missing backing services (OpenSearch or Embedding)")
|
| 115 |
except Exception as exc:
|
| 116 |
logger.warning("Agentic RAG service failed: %s", exc)
|
| 117 |
app.state.rag_service = None
|
| 118 |
|
| 119 |
# --- Legacy RagBot service (backward-compatible /analyze) ---
|
| 120 |
try:
|
| 121 |
+
from src.workflow import create_guild
|
| 122 |
+
guild = create_guild()
|
| 123 |
+
app.state.ragbot_service = guild
|
|
|
|
| 124 |
logger.info("RagBot service ready (ClinicalInsightGuild)")
|
| 125 |
except Exception as exc:
|
| 126 |
logger.warning("RagBot service unavailable: %s", exc)
|
|
|
|
| 128 |
|
| 129 |
# --- Extraction service (for natural language input) ---
|
| 130 |
try:
|
| 131 |
+
from src.llm_config import get_llm
|
| 132 |
from src.services.extraction.service import make_extraction_service
|
| 133 |
+
try:
|
| 134 |
+
llm = get_llm()
|
| 135 |
+
except Exception as e:
|
| 136 |
+
logger.warning("Failed to get LLM for extraction, will use fallback: %s", e)
|
| 137 |
+
llm = None
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 138 |
# If no LLM available, extraction will use regex fallback
|
| 139 |
app.state.extraction_service = make_extraction_service(llm=llm)
|
| 140 |
logger.info("Extraction service ready")
|
|
|
|
| 193 |
"error_code": "VALIDATION_ERROR",
|
| 194 |
"message": "Request validation failed",
|
| 195 |
"details": exc.errors(),
|
| 196 |
+
"timestamp": datetime.now(UTC).isoformat(),
|
| 197 |
},
|
| 198 |
)
|
| 199 |
|
|
|
|
| 206 |
"status": "error",
|
| 207 |
"error_code": "INTERNAL_SERVER_ERROR",
|
| 208 |
"message": "An unexpected error occurred. Please try again later.",
|
| 209 |
+
"timestamp": datetime.now(UTC).isoformat(),
|
| 210 |
},
|
| 211 |
)
|
| 212 |
|
| 213 |
# --- Routers ---
|
| 214 |
+
from src.routers import analyze, ask, health, search
|
| 215 |
|
| 216 |
app.include_router(health.router)
|
| 217 |
app.include_router(analyze.router)
|
src/middlewares.py
CHANGED
|
@@ -12,8 +12,9 @@ import json
|
|
| 12 |
import logging
|
| 13 |
import time
|
| 14 |
import uuid
|
| 15 |
-
from
|
| 16 |
-
from
|
|
|
|
| 17 |
|
| 18 |
from fastapi import Request, Response
|
| 19 |
from starlette.middleware.base import BaseHTTPMiddleware
|
|
@@ -74,35 +75,35 @@ class HIPAAAuditMiddleware(BaseHTTPMiddleware):
|
|
| 74 |
|
| 75 |
Audit logs are structured JSON for easy SIEM integration.
|
| 76 |
"""
|
| 77 |
-
|
| 78 |
async def dispatch(self, request: Request, call_next: Callable) -> Response:
|
| 79 |
# Generate request ID
|
| 80 |
request_id = f"req_{uuid.uuid4().hex[:12]}"
|
| 81 |
request.state.request_id = request_id
|
| 82 |
-
|
| 83 |
# Start timing
|
| 84 |
start_time = time.time()
|
| 85 |
-
|
| 86 |
# Extract metadata safely
|
| 87 |
path = request.url.path
|
| 88 |
method = request.method
|
| 89 |
client_ip = request.client.host if request.client else "unknown"
|
| 90 |
user_agent = request.headers.get("user-agent", "unknown")[:100]
|
| 91 |
-
|
| 92 |
# Check if this endpoint needs audit logging
|
| 93 |
needs_audit = any(path.startswith(ep) for ep in AUDITABLE_ENDPOINTS)
|
| 94 |
-
|
| 95 |
# Pre-request audit entry
|
| 96 |
audit_entry: dict[str, Any] = {
|
| 97 |
"event": "request_start",
|
| 98 |
-
"timestamp": datetime.now(
|
| 99 |
"request_id": request_id,
|
| 100 |
"method": method,
|
| 101 |
"path": path,
|
| 102 |
"client_ip_hash": _hash_sensitive(client_ip),
|
| 103 |
"user_agent_hash": _hash_sensitive(user_agent),
|
| 104 |
}
|
| 105 |
-
|
| 106 |
# Try to read request body for POST requests (without logging PHI)
|
| 107 |
if needs_audit and method == "POST":
|
| 108 |
try:
|
|
@@ -116,35 +117,35 @@ class HIPAAAuditMiddleware(BaseHTTPMiddleware):
|
|
| 116 |
# Log presence of biomarkers without values
|
| 117 |
if "biomarkers" in body_dict:
|
| 118 |
audit_entry["biomarker_count"] = len(body_dict["biomarkers"]) if isinstance(body_dict["biomarkers"], dict) else 1
|
| 119 |
-
except Exception:
|
| 120 |
-
|
| 121 |
-
|
| 122 |
if needs_audit:
|
| 123 |
logger.info("AUDIT_REQUEST: %s", json.dumps(audit_entry))
|
| 124 |
-
|
| 125 |
# Process request
|
| 126 |
response: Response = await call_next(request)
|
| 127 |
-
|
| 128 |
# Post-request audit
|
| 129 |
elapsed_ms = (time.time() - start_time) * 1000
|
| 130 |
-
|
| 131 |
completion_entry = {
|
| 132 |
"event": "request_complete",
|
| 133 |
-
"timestamp": datetime.now(
|
| 134 |
"request_id": request_id,
|
| 135 |
"method": method,
|
| 136 |
"path": path,
|
| 137 |
"status_code": response.status_code,
|
| 138 |
"elapsed_ms": round(elapsed_ms, 2),
|
| 139 |
}
|
| 140 |
-
|
| 141 |
if needs_audit:
|
| 142 |
logger.info("AUDIT_COMPLETE: %s", json.dumps(completion_entry))
|
| 143 |
-
|
| 144 |
# Add request ID to response headers
|
| 145 |
response.headers["X-Request-ID"] = request_id
|
| 146 |
response.headers["X-Response-Time"] = f"{elapsed_ms:.2f}ms"
|
| 147 |
-
|
| 148 |
return response
|
| 149 |
|
| 150 |
|
|
@@ -152,10 +153,10 @@ class SecurityHeadersMiddleware(BaseHTTPMiddleware):
|
|
| 152 |
"""
|
| 153 |
Add security headers for HIPAA compliance.
|
| 154 |
"""
|
| 155 |
-
|
| 156 |
async def dispatch(self, request: Request, call_next: Callable) -> Response:
|
| 157 |
response: Response = await call_next(request)
|
| 158 |
-
|
| 159 |
# Security headers
|
| 160 |
response.headers["X-Content-Type-Options"] = "nosniff"
|
| 161 |
response.headers["X-Frame-Options"] = "DENY"
|
|
@@ -163,9 +164,9 @@ class SecurityHeadersMiddleware(BaseHTTPMiddleware):
|
|
| 163 |
response.headers["Strict-Transport-Security"] = "max-age=31536000; includeSubDomains"
|
| 164 |
response.headers["Cache-Control"] = "no-store, no-cache, must-revalidate"
|
| 165 |
response.headers["Pragma"] = "no-cache"
|
| 166 |
-
|
| 167 |
# Medical data should never be cached
|
| 168 |
if any(ep in request.url.path for ep in AUDITABLE_ENDPOINTS):
|
| 169 |
response.headers["Cache-Control"] = "no-store, private"
|
| 170 |
-
|
| 171 |
return response
|
|
|
|
| 12 |
import logging
|
| 13 |
import time
|
| 14 |
import uuid
|
| 15 |
+
from collections.abc import Callable
|
| 16 |
+
from datetime import UTC, datetime
|
| 17 |
+
from typing import Any
|
| 18 |
|
| 19 |
from fastapi import Request, Response
|
| 20 |
from starlette.middleware.base import BaseHTTPMiddleware
|
|
|
|
| 75 |
|
| 76 |
Audit logs are structured JSON for easy SIEM integration.
|
| 77 |
"""
|
| 78 |
+
|
| 79 |
async def dispatch(self, request: Request, call_next: Callable) -> Response:
|
| 80 |
# Generate request ID
|
| 81 |
request_id = f"req_{uuid.uuid4().hex[:12]}"
|
| 82 |
request.state.request_id = request_id
|
| 83 |
+
|
| 84 |
# Start timing
|
| 85 |
start_time = time.time()
|
| 86 |
+
|
| 87 |
# Extract metadata safely
|
| 88 |
path = request.url.path
|
| 89 |
method = request.method
|
| 90 |
client_ip = request.client.host if request.client else "unknown"
|
| 91 |
user_agent = request.headers.get("user-agent", "unknown")[:100]
|
| 92 |
+
|
| 93 |
# Check if this endpoint needs audit logging
|
| 94 |
needs_audit = any(path.startswith(ep) for ep in AUDITABLE_ENDPOINTS)
|
| 95 |
+
|
| 96 |
# Pre-request audit entry
|
| 97 |
audit_entry: dict[str, Any] = {
|
| 98 |
"event": "request_start",
|
| 99 |
+
"timestamp": datetime.now(UTC).isoformat(),
|
| 100 |
"request_id": request_id,
|
| 101 |
"method": method,
|
| 102 |
"path": path,
|
| 103 |
"client_ip_hash": _hash_sensitive(client_ip),
|
| 104 |
"user_agent_hash": _hash_sensitive(user_agent),
|
| 105 |
}
|
| 106 |
+
|
| 107 |
# Try to read request body for POST requests (without logging PHI)
|
| 108 |
if needs_audit and method == "POST":
|
| 109 |
try:
|
|
|
|
| 117 |
# Log presence of biomarkers without values
|
| 118 |
if "biomarkers" in body_dict:
|
| 119 |
audit_entry["biomarker_count"] = len(body_dict["biomarkers"]) if isinstance(body_dict["biomarkers"], dict) else 1
|
| 120 |
+
except Exception as exc:
|
| 121 |
+
logger.debug("Failed to audit POST body: %s", exc)
|
| 122 |
+
|
| 123 |
if needs_audit:
|
| 124 |
logger.info("AUDIT_REQUEST: %s", json.dumps(audit_entry))
|
| 125 |
+
|
| 126 |
# Process request
|
| 127 |
response: Response = await call_next(request)
|
| 128 |
+
|
| 129 |
# Post-request audit
|
| 130 |
elapsed_ms = (time.time() - start_time) * 1000
|
| 131 |
+
|
| 132 |
completion_entry = {
|
| 133 |
"event": "request_complete",
|
| 134 |
+
"timestamp": datetime.now(UTC).isoformat(),
|
| 135 |
"request_id": request_id,
|
| 136 |
"method": method,
|
| 137 |
"path": path,
|
| 138 |
"status_code": response.status_code,
|
| 139 |
"elapsed_ms": round(elapsed_ms, 2),
|
| 140 |
}
|
| 141 |
+
|
| 142 |
if needs_audit:
|
| 143 |
logger.info("AUDIT_COMPLETE: %s", json.dumps(completion_entry))
|
| 144 |
+
|
| 145 |
# Add request ID to response headers
|
| 146 |
response.headers["X-Request-ID"] = request_id
|
| 147 |
response.headers["X-Response-Time"] = f"{elapsed_ms:.2f}ms"
|
| 148 |
+
|
| 149 |
return response
|
| 150 |
|
| 151 |
|
|
|
|
| 153 |
"""
|
| 154 |
Add security headers for HIPAA compliance.
|
| 155 |
"""
|
| 156 |
+
|
| 157 |
async def dispatch(self, request: Request, call_next: Callable) -> Response:
|
| 158 |
response: Response = await call_next(request)
|
| 159 |
+
|
| 160 |
# Security headers
|
| 161 |
response.headers["X-Content-Type-Options"] = "nosniff"
|
| 162 |
response.headers["X-Frame-Options"] = "DENY"
|
|
|
|
| 164 |
response.headers["Strict-Transport-Security"] = "max-age=31536000; includeSubDomains"
|
| 165 |
response.headers["Cache-Control"] = "no-store, no-cache, must-revalidate"
|
| 166 |
response.headers["Pragma"] = "no-cache"
|
| 167 |
+
|
| 168 |
# Medical data should never be cached
|
| 169 |
if any(ep in request.url.path for ep in AUDITABLE_ENDPOINTS):
|
| 170 |
response.headers["Cache-Control"] = "no-store, private"
|
| 171 |
+
|
| 172 |
return response
|
src/pdf_processor.py
CHANGED
|
@@ -6,13 +6,12 @@ PDF document processing and vector store creation
|
|
| 6 |
import os
|
| 7 |
import warnings
|
| 8 |
from pathlib import Path
|
| 9 |
-
|
| 10 |
-
from
|
| 11 |
-
from
|
| 12 |
from langchain_community.vectorstores import FAISS
|
| 13 |
from langchain_core.documents import Document
|
| 14 |
-
from
|
| 15 |
-
import time
|
| 16 |
|
| 17 |
# Suppress noisy warnings
|
| 18 |
warnings.filterwarnings("ignore", message=".*class.*HuggingFaceEmbeddings.*was deprecated.*")
|
|
@@ -22,12 +21,12 @@ os.environ.setdefault("HF_HUB_DISABLE_IMPLICIT_TOKEN", "1")
|
|
| 22 |
load_dotenv()
|
| 23 |
|
| 24 |
# Re-export for backward compatibility
|
| 25 |
-
from src.llm_config import get_embedding_model
|
| 26 |
|
| 27 |
|
| 28 |
class PDFProcessor:
|
| 29 |
"""Handles medical PDF ingestion and vector store creation"""
|
| 30 |
-
|
| 31 |
def __init__(
|
| 32 |
self,
|
| 33 |
pdf_directory: str = "data/medical_pdfs",
|
|
@@ -48,11 +47,11 @@ class PDFProcessor:
|
|
| 48 |
self.vector_store_path = Path(vector_store_path)
|
| 49 |
self.chunk_size = chunk_size
|
| 50 |
self.chunk_overlap = chunk_overlap
|
| 51 |
-
|
| 52 |
# Create directories if they don't exist
|
| 53 |
self.pdf_directory.mkdir(parents=True, exist_ok=True)
|
| 54 |
self.vector_store_path.mkdir(parents=True, exist_ok=True)
|
| 55 |
-
|
| 56 |
# Text splitter with medical context awareness
|
| 57 |
self.text_splitter = RecursiveCharacterTextSplitter(
|
| 58 |
chunk_size=chunk_size,
|
|
@@ -60,8 +59,8 @@ class PDFProcessor:
|
|
| 60 |
separators=["\n\n", "\n", ". ", " ", ""],
|
| 61 |
length_function=len
|
| 62 |
)
|
| 63 |
-
|
| 64 |
-
def load_pdfs(self) ->
|
| 65 |
"""
|
| 66 |
Load all PDF documents from the configured directory.
|
| 67 |
|
|
@@ -69,40 +68,40 @@ class PDFProcessor:
|
|
| 69 |
List of Document objects with content and metadata
|
| 70 |
"""
|
| 71 |
print(f"Loading PDFs from: {self.pdf_directory}")
|
| 72 |
-
|
| 73 |
pdf_files = list(self.pdf_directory.glob("*.pdf"))
|
| 74 |
-
|
| 75 |
if not pdf_files:
|
| 76 |
print(f"WARN: No PDF files found in {self.pdf_directory}")
|
| 77 |
print("INFO: Please place medical PDFs in this directory")
|
| 78 |
return []
|
| 79 |
-
|
| 80 |
print(f"Found {len(pdf_files)} PDF file(s):")
|
| 81 |
for pdf in pdf_files:
|
| 82 |
print(f" - {pdf.name}")
|
| 83 |
-
|
| 84 |
documents = []
|
| 85 |
-
|
| 86 |
for pdf_path in pdf_files:
|
| 87 |
try:
|
| 88 |
loader = PyPDFLoader(str(pdf_path))
|
| 89 |
docs = loader.load()
|
| 90 |
-
|
| 91 |
# Add source filename to metadata
|
| 92 |
for doc in docs:
|
| 93 |
doc.metadata['source_file'] = pdf_path.name
|
| 94 |
doc.metadata['source_path'] = str(pdf_path)
|
| 95 |
-
|
| 96 |
documents.extend(docs)
|
| 97 |
print(f" OK: Loaded {len(docs)} pages from {pdf_path.name}")
|
| 98 |
-
|
| 99 |
except Exception as e:
|
| 100 |
print(f" ERROR: Error loading {pdf_path.name}: {e}")
|
| 101 |
-
|
| 102 |
print(f"\nTotal: {len(documents)} pages loaded from {len(pdf_files)} PDF(s)")
|
| 103 |
return documents
|
| 104 |
-
|
| 105 |
-
def chunk_documents(self, documents:
|
| 106 |
"""
|
| 107 |
Split documents into chunks for RAG retrieval.
|
| 108 |
|
|
@@ -113,25 +112,25 @@ class PDFProcessor:
|
|
| 113 |
List of chunked documents with preserved metadata
|
| 114 |
"""
|
| 115 |
print(f"\nChunking documents (size={self.chunk_size}, overlap={self.chunk_overlap})...")
|
| 116 |
-
|
| 117 |
chunks = self.text_splitter.split_documents(documents)
|
| 118 |
-
|
| 119 |
if not chunks:
|
| 120 |
print("WARN: No chunks generated from documents")
|
| 121 |
return chunks
|
| 122 |
-
|
| 123 |
# Add chunk index to metadata
|
| 124 |
for i, chunk in enumerate(chunks):
|
| 125 |
chunk.metadata['chunk_id'] = i
|
| 126 |
-
|
| 127 |
print(f"OK: Created {len(chunks)} chunks from {len(documents)} pages")
|
| 128 |
print(f" Average chunk size: {sum(len(c.page_content) for c in chunks) // len(chunks)} characters")
|
| 129 |
-
|
| 130 |
return chunks
|
| 131 |
-
|
| 132 |
def create_vector_store(
|
| 133 |
self,
|
| 134 |
-
chunks:
|
| 135 |
embedding_model,
|
| 136 |
store_name: str = "medical_knowledge"
|
| 137 |
) -> FAISS:
|
|
@@ -149,26 +148,26 @@ class PDFProcessor:
|
|
| 149 |
print(f"\nCreating vector store: {store_name}")
|
| 150 |
print(f"Generating embeddings for {len(chunks)} chunks...")
|
| 151 |
print("(This may take a few minutes...)")
|
| 152 |
-
|
| 153 |
# Create FAISS vector store
|
| 154 |
vector_store = FAISS.from_documents(
|
| 155 |
documents=chunks,
|
| 156 |
embedding=embedding_model
|
| 157 |
)
|
| 158 |
-
|
| 159 |
# Save to disk
|
| 160 |
save_path = self.vector_store_path / f"{store_name}.faiss"
|
| 161 |
vector_store.save_local(str(self.vector_store_path), index_name=store_name)
|
| 162 |
-
|
| 163 |
print(f"OK: Vector store created and saved to: {save_path}")
|
| 164 |
-
|
| 165 |
return vector_store
|
| 166 |
-
|
| 167 |
def load_vector_store(
|
| 168 |
self,
|
| 169 |
embedding_model,
|
| 170 |
store_name: str = "medical_knowledge"
|
| 171 |
-
) ->
|
| 172 |
"""
|
| 173 |
Load existing vector store from disk.
|
| 174 |
|
|
@@ -180,11 +179,11 @@ class PDFProcessor:
|
|
| 180 |
FAISS vector store or None if not found
|
| 181 |
"""
|
| 182 |
store_path = self.vector_store_path / f"{store_name}.faiss"
|
| 183 |
-
|
| 184 |
if not store_path.exists():
|
| 185 |
print(f"WARN: Vector store not found: {store_path}")
|
| 186 |
return None
|
| 187 |
-
|
| 188 |
try:
|
| 189 |
# SECURITY NOTE: allow_dangerous_deserialization=True uses pickle.
|
| 190 |
# Only load vector stores from trusted, locally-built sources.
|
|
@@ -197,11 +196,11 @@ class PDFProcessor:
|
|
| 197 |
)
|
| 198 |
print(f"OK: Loaded vector store from: {store_path}")
|
| 199 |
return vector_store
|
| 200 |
-
|
| 201 |
except Exception as e:
|
| 202 |
print(f"ERROR: Error loading vector store: {e}")
|
| 203 |
return None
|
| 204 |
-
|
| 205 |
def create_retrievers(
|
| 206 |
self,
|
| 207 |
embedding_model,
|
|
@@ -224,19 +223,19 @@ class PDFProcessor:
|
|
| 224 |
vector_store = self.load_vector_store(embedding_model, store_name)
|
| 225 |
else:
|
| 226 |
vector_store = None
|
| 227 |
-
|
| 228 |
# If not found, create new one
|
| 229 |
if vector_store is None:
|
| 230 |
print("\nBuilding new vector store from PDFs...")
|
| 231 |
documents = self.load_pdfs()
|
| 232 |
-
|
| 233 |
if not documents:
|
| 234 |
print("WARN: No documents to process. Please add PDF files.")
|
| 235 |
return {}
|
| 236 |
-
|
| 237 |
chunks = self.chunk_documents(documents)
|
| 238 |
vector_store = self.create_vector_store(chunks, embedding_model, store_name)
|
| 239 |
-
|
| 240 |
# Create specialized retrievers
|
| 241 |
retrievers = {
|
| 242 |
"disease_explainer": vector_store.as_retriever(
|
|
@@ -252,7 +251,7 @@ class PDFProcessor:
|
|
| 252 |
search_kwargs={"k": 5}
|
| 253 |
)
|
| 254 |
}
|
| 255 |
-
|
| 256 |
print(f"\nOK: Created {len(retrievers)} specialized retrievers")
|
| 257 |
return retrievers
|
| 258 |
|
|
@@ -272,28 +271,28 @@ def setup_knowledge_base(embedding_model=None, force_rebuild: bool = False, use_
|
|
| 272 |
print("=" * 60)
|
| 273 |
print("Setting up Medical Knowledge Base")
|
| 274 |
print("=" * 60)
|
| 275 |
-
|
| 276 |
# Use configured embedding provider from environment
|
| 277 |
if use_configured_embeddings and embedding_model is None:
|
| 278 |
embedding_model = get_embedding_model()
|
| 279 |
print(" > Embeddings model loaded")
|
| 280 |
elif embedding_model is None:
|
| 281 |
raise ValueError("Must provide embedding_model or set use_configured_embeddings=True")
|
| 282 |
-
|
| 283 |
processor = PDFProcessor()
|
| 284 |
retrievers = processor.create_retrievers(
|
| 285 |
embedding_model,
|
| 286 |
store_name="medical_knowledge",
|
| 287 |
force_rebuild=force_rebuild
|
| 288 |
)
|
| 289 |
-
|
| 290 |
if retrievers:
|
| 291 |
print("\nOK: Knowledge base setup complete!")
|
| 292 |
else:
|
| 293 |
print("\nWARN: Knowledge base setup incomplete. Add PDFs and try again.")
|
| 294 |
-
|
| 295 |
print("=" * 60)
|
| 296 |
-
|
| 297 |
return retrievers
|
| 298 |
|
| 299 |
|
|
@@ -320,22 +319,22 @@ if __name__ == "__main__":
|
|
| 320 |
# Test PDF processing
|
| 321 |
import sys
|
| 322 |
from pathlib import Path
|
| 323 |
-
|
| 324 |
# Add parent directory to path for imports
|
| 325 |
sys.path.insert(0, str(Path(__file__).parent.parent))
|
| 326 |
-
|
| 327 |
print("\n" + "="*70)
|
| 328 |
print("MediGuard AI - PDF Knowledge Base Builder")
|
| 329 |
print("="*70)
|
| 330 |
print("\nUsing configured embedding provider from .env")
|
| 331 |
print(" EMBEDDING_PROVIDER options: google (default), huggingface, ollama")
|
| 332 |
print("="*70)
|
| 333 |
-
|
| 334 |
retrievers = setup_knowledge_base(
|
| 335 |
use_configured_embeddings=True, # Use configured provider
|
| 336 |
force_rebuild=False
|
| 337 |
)
|
| 338 |
-
|
| 339 |
if retrievers:
|
| 340 |
print("\nOK: PDF processing test successful!")
|
| 341 |
print(f"Available retrievers: {list(retrievers.keys())}")
|
|
|
|
| 6 |
import os
|
| 7 |
import warnings
|
| 8 |
from pathlib import Path
|
| 9 |
+
|
| 10 |
+
from dotenv import load_dotenv
|
| 11 |
+
from langchain_community.document_loaders import PyPDFLoader
|
| 12 |
from langchain_community.vectorstores import FAISS
|
| 13 |
from langchain_core.documents import Document
|
| 14 |
+
from langchain_text_splitters import RecursiveCharacterTextSplitter
|
|
|
|
| 15 |
|
| 16 |
# Suppress noisy warnings
|
| 17 |
warnings.filterwarnings("ignore", message=".*class.*HuggingFaceEmbeddings.*was deprecated.*")
|
|
|
|
| 21 |
load_dotenv()
|
| 22 |
|
| 23 |
# Re-export for backward compatibility
|
| 24 |
+
from src.llm_config import get_embedding_model
|
| 25 |
|
| 26 |
|
| 27 |
class PDFProcessor:
|
| 28 |
"""Handles medical PDF ingestion and vector store creation"""
|
| 29 |
+
|
| 30 |
def __init__(
|
| 31 |
self,
|
| 32 |
pdf_directory: str = "data/medical_pdfs",
|
|
|
|
| 47 |
self.vector_store_path = Path(vector_store_path)
|
| 48 |
self.chunk_size = chunk_size
|
| 49 |
self.chunk_overlap = chunk_overlap
|
| 50 |
+
|
| 51 |
# Create directories if they don't exist
|
| 52 |
self.pdf_directory.mkdir(parents=True, exist_ok=True)
|
| 53 |
self.vector_store_path.mkdir(parents=True, exist_ok=True)
|
| 54 |
+
|
| 55 |
# Text splitter with medical context awareness
|
| 56 |
self.text_splitter = RecursiveCharacterTextSplitter(
|
| 57 |
chunk_size=chunk_size,
|
|
|
|
| 59 |
separators=["\n\n", "\n", ". ", " ", ""],
|
| 60 |
length_function=len
|
| 61 |
)
|
| 62 |
+
|
| 63 |
+
def load_pdfs(self) -> list[Document]:
|
| 64 |
"""
|
| 65 |
Load all PDF documents from the configured directory.
|
| 66 |
|
|
|
|
| 68 |
List of Document objects with content and metadata
|
| 69 |
"""
|
| 70 |
print(f"Loading PDFs from: {self.pdf_directory}")
|
| 71 |
+
|
| 72 |
pdf_files = list(self.pdf_directory.glob("*.pdf"))
|
| 73 |
+
|
| 74 |
if not pdf_files:
|
| 75 |
print(f"WARN: No PDF files found in {self.pdf_directory}")
|
| 76 |
print("INFO: Please place medical PDFs in this directory")
|
| 77 |
return []
|
| 78 |
+
|
| 79 |
print(f"Found {len(pdf_files)} PDF file(s):")
|
| 80 |
for pdf in pdf_files:
|
| 81 |
print(f" - {pdf.name}")
|
| 82 |
+
|
| 83 |
documents = []
|
| 84 |
+
|
| 85 |
for pdf_path in pdf_files:
|
| 86 |
try:
|
| 87 |
loader = PyPDFLoader(str(pdf_path))
|
| 88 |
docs = loader.load()
|
| 89 |
+
|
| 90 |
# Add source filename to metadata
|
| 91 |
for doc in docs:
|
| 92 |
doc.metadata['source_file'] = pdf_path.name
|
| 93 |
doc.metadata['source_path'] = str(pdf_path)
|
| 94 |
+
|
| 95 |
documents.extend(docs)
|
| 96 |
print(f" OK: Loaded {len(docs)} pages from {pdf_path.name}")
|
| 97 |
+
|
| 98 |
except Exception as e:
|
| 99 |
print(f" ERROR: Error loading {pdf_path.name}: {e}")
|
| 100 |
+
|
| 101 |
print(f"\nTotal: {len(documents)} pages loaded from {len(pdf_files)} PDF(s)")
|
| 102 |
return documents
|
| 103 |
+
|
| 104 |
+
def chunk_documents(self, documents: list[Document]) -> list[Document]:
|
| 105 |
"""
|
| 106 |
Split documents into chunks for RAG retrieval.
|
| 107 |
|
|
|
|
| 112 |
List of chunked documents with preserved metadata
|
| 113 |
"""
|
| 114 |
print(f"\nChunking documents (size={self.chunk_size}, overlap={self.chunk_overlap})...")
|
| 115 |
+
|
| 116 |
chunks = self.text_splitter.split_documents(documents)
|
| 117 |
+
|
| 118 |
if not chunks:
|
| 119 |
print("WARN: No chunks generated from documents")
|
| 120 |
return chunks
|
| 121 |
+
|
| 122 |
# Add chunk index to metadata
|
| 123 |
for i, chunk in enumerate(chunks):
|
| 124 |
chunk.metadata['chunk_id'] = i
|
| 125 |
+
|
| 126 |
print(f"OK: Created {len(chunks)} chunks from {len(documents)} pages")
|
| 127 |
print(f" Average chunk size: {sum(len(c.page_content) for c in chunks) // len(chunks)} characters")
|
| 128 |
+
|
| 129 |
return chunks
|
| 130 |
+
|
| 131 |
def create_vector_store(
|
| 132 |
self,
|
| 133 |
+
chunks: list[Document],
|
| 134 |
embedding_model,
|
| 135 |
store_name: str = "medical_knowledge"
|
| 136 |
) -> FAISS:
|
|
|
|
| 148 |
print(f"\nCreating vector store: {store_name}")
|
| 149 |
print(f"Generating embeddings for {len(chunks)} chunks...")
|
| 150 |
print("(This may take a few minutes...)")
|
| 151 |
+
|
| 152 |
# Create FAISS vector store
|
| 153 |
vector_store = FAISS.from_documents(
|
| 154 |
documents=chunks,
|
| 155 |
embedding=embedding_model
|
| 156 |
)
|
| 157 |
+
|
| 158 |
# Save to disk
|
| 159 |
save_path = self.vector_store_path / f"{store_name}.faiss"
|
| 160 |
vector_store.save_local(str(self.vector_store_path), index_name=store_name)
|
| 161 |
+
|
| 162 |
print(f"OK: Vector store created and saved to: {save_path}")
|
| 163 |
+
|
| 164 |
return vector_store
|
| 165 |
+
|
| 166 |
def load_vector_store(
|
| 167 |
self,
|
| 168 |
embedding_model,
|
| 169 |
store_name: str = "medical_knowledge"
|
| 170 |
+
) -> FAISS | None:
|
| 171 |
"""
|
| 172 |
Load existing vector store from disk.
|
| 173 |
|
|
|
|
| 179 |
FAISS vector store or None if not found
|
| 180 |
"""
|
| 181 |
store_path = self.vector_store_path / f"{store_name}.faiss"
|
| 182 |
+
|
| 183 |
if not store_path.exists():
|
| 184 |
print(f"WARN: Vector store not found: {store_path}")
|
| 185 |
return None
|
| 186 |
+
|
| 187 |
try:
|
| 188 |
# SECURITY NOTE: allow_dangerous_deserialization=True uses pickle.
|
| 189 |
# Only load vector stores from trusted, locally-built sources.
|
|
|
|
| 196 |
)
|
| 197 |
print(f"OK: Loaded vector store from: {store_path}")
|
| 198 |
return vector_store
|
| 199 |
+
|
| 200 |
except Exception as e:
|
| 201 |
print(f"ERROR: Error loading vector store: {e}")
|
| 202 |
return None
|
| 203 |
+
|
| 204 |
def create_retrievers(
|
| 205 |
self,
|
| 206 |
embedding_model,
|
|
|
|
| 223 |
vector_store = self.load_vector_store(embedding_model, store_name)
|
| 224 |
else:
|
| 225 |
vector_store = None
|
| 226 |
+
|
| 227 |
# If not found, create new one
|
| 228 |
if vector_store is None:
|
| 229 |
print("\nBuilding new vector store from PDFs...")
|
| 230 |
documents = self.load_pdfs()
|
| 231 |
+
|
| 232 |
if not documents:
|
| 233 |
print("WARN: No documents to process. Please add PDF files.")
|
| 234 |
return {}
|
| 235 |
+
|
| 236 |
chunks = self.chunk_documents(documents)
|
| 237 |
vector_store = self.create_vector_store(chunks, embedding_model, store_name)
|
| 238 |
+
|
| 239 |
# Create specialized retrievers
|
| 240 |
retrievers = {
|
| 241 |
"disease_explainer": vector_store.as_retriever(
|
|
|
|
| 251 |
search_kwargs={"k": 5}
|
| 252 |
)
|
| 253 |
}
|
| 254 |
+
|
| 255 |
print(f"\nOK: Created {len(retrievers)} specialized retrievers")
|
| 256 |
return retrievers
|
| 257 |
|
|
|
|
| 271 |
print("=" * 60)
|
| 272 |
print("Setting up Medical Knowledge Base")
|
| 273 |
print("=" * 60)
|
| 274 |
+
|
| 275 |
# Use configured embedding provider from environment
|
| 276 |
if use_configured_embeddings and embedding_model is None:
|
| 277 |
embedding_model = get_embedding_model()
|
| 278 |
print(" > Embeddings model loaded")
|
| 279 |
elif embedding_model is None:
|
| 280 |
raise ValueError("Must provide embedding_model or set use_configured_embeddings=True")
|
| 281 |
+
|
| 282 |
processor = PDFProcessor()
|
| 283 |
retrievers = processor.create_retrievers(
|
| 284 |
embedding_model,
|
| 285 |
store_name="medical_knowledge",
|
| 286 |
force_rebuild=force_rebuild
|
| 287 |
)
|
| 288 |
+
|
| 289 |
if retrievers:
|
| 290 |
print("\nOK: Knowledge base setup complete!")
|
| 291 |
else:
|
| 292 |
print("\nWARN: Knowledge base setup incomplete. Add PDFs and try again.")
|
| 293 |
+
|
| 294 |
print("=" * 60)
|
| 295 |
+
|
| 296 |
return retrievers
|
| 297 |
|
| 298 |
|
|
|
|
| 319 |
# Test PDF processing
|
| 320 |
import sys
|
| 321 |
from pathlib import Path
|
| 322 |
+
|
| 323 |
# Add parent directory to path for imports
|
| 324 |
sys.path.insert(0, str(Path(__file__).parent.parent))
|
| 325 |
+
|
| 326 |
print("\n" + "="*70)
|
| 327 |
print("MediGuard AI - PDF Knowledge Base Builder")
|
| 328 |
print("="*70)
|
| 329 |
print("\nUsing configured embedding provider from .env")
|
| 330 |
print(" EMBEDDING_PROVIDER options: google (default), huggingface, ollama")
|
| 331 |
print("="*70)
|
| 332 |
+
|
| 333 |
retrievers = setup_knowledge_base(
|
| 334 |
use_configured_embeddings=True, # Use configured provider
|
| 335 |
force_rebuild=False
|
| 336 |
)
|
| 337 |
+
|
| 338 |
if retrievers:
|
| 339 |
print("\nOK: PDF processing test successful!")
|
| 340 |
print(f"Available retrievers: {list(retrievers.keys())}")
|
src/repositories/analysis.py
CHANGED
|
@@ -4,8 +4,6 @@ MediGuard AI — Analysis repository (data-access layer).
|
|
| 4 |
|
| 5 |
from __future__ import annotations
|
| 6 |
|
| 7 |
-
from typing import List, Optional
|
| 8 |
-
|
| 9 |
from sqlalchemy.orm import Session
|
| 10 |
|
| 11 |
from src.models.analysis import PatientAnalysis
|
|
@@ -22,14 +20,14 @@ class AnalysisRepository:
|
|
| 22 |
self.db.flush()
|
| 23 |
return analysis
|
| 24 |
|
| 25 |
-
def get_by_request_id(self, request_id: str) ->
|
| 26 |
return (
|
| 27 |
self.db.query(PatientAnalysis)
|
| 28 |
.filter(PatientAnalysis.request_id == request_id)
|
| 29 |
.first()
|
| 30 |
)
|
| 31 |
|
| 32 |
-
def list_recent(self, limit: int = 20) ->
|
| 33 |
return (
|
| 34 |
self.db.query(PatientAnalysis)
|
| 35 |
.order_by(PatientAnalysis.created_at.desc())
|
|
|
|
| 4 |
|
| 5 |
from __future__ import annotations
|
| 6 |
|
|
|
|
|
|
|
| 7 |
from sqlalchemy.orm import Session
|
| 8 |
|
| 9 |
from src.models.analysis import PatientAnalysis
|
|
|
|
| 20 |
self.db.flush()
|
| 21 |
return analysis
|
| 22 |
|
| 23 |
+
def get_by_request_id(self, request_id: str) -> PatientAnalysis | None:
|
| 24 |
return (
|
| 25 |
self.db.query(PatientAnalysis)
|
| 26 |
.filter(PatientAnalysis.request_id == request_id)
|
| 27 |
.first()
|
| 28 |
)
|
| 29 |
|
| 30 |
+
def list_recent(self, limit: int = 20) -> list[PatientAnalysis]:
|
| 31 |
return (
|
| 32 |
self.db.query(PatientAnalysis)
|
| 33 |
.order_by(PatientAnalysis.created_at.desc())
|
src/repositories/document.py
CHANGED
|
@@ -4,8 +4,6 @@ MediGuard AI — Document repository.
|
|
| 4 |
|
| 5 |
from __future__ import annotations
|
| 6 |
|
| 7 |
-
from typing import List, Optional
|
| 8 |
-
|
| 9 |
from sqlalchemy.orm import Session
|
| 10 |
|
| 11 |
from src.models.analysis import MedicalDocument
|
|
@@ -33,10 +31,10 @@ class DocumentRepository:
|
|
| 33 |
self.db.flush()
|
| 34 |
return doc
|
| 35 |
|
| 36 |
-
def get_by_id(self, doc_id: str) ->
|
| 37 |
return self.db.query(MedicalDocument).filter(MedicalDocument.id == doc_id).first()
|
| 38 |
|
| 39 |
-
def list_all(self, limit: int = 100) ->
|
| 40 |
return (
|
| 41 |
self.db.query(MedicalDocument)
|
| 42 |
.order_by(MedicalDocument.created_at.desc())
|
|
|
|
| 4 |
|
| 5 |
from __future__ import annotations
|
| 6 |
|
|
|
|
|
|
|
| 7 |
from sqlalchemy.orm import Session
|
| 8 |
|
| 9 |
from src.models.analysis import MedicalDocument
|
|
|
|
| 31 |
self.db.flush()
|
| 32 |
return doc
|
| 33 |
|
| 34 |
+
def get_by_id(self, doc_id: str) -> MedicalDocument | None:
|
| 35 |
return self.db.query(MedicalDocument).filter(MedicalDocument.id == doc_id).first()
|
| 36 |
|
| 37 |
+
def list_all(self, limit: int = 100) -> list[MedicalDocument]:
|
| 38 |
return (
|
| 39 |
self.db.query(MedicalDocument)
|
| 40 |
.order_by(MedicalDocument.created_at.desc())
|
src/routers/analyze.py
CHANGED
|
@@ -12,8 +12,8 @@ import logging
|
|
| 12 |
import time
|
| 13 |
import uuid
|
| 14 |
from concurrent.futures import ThreadPoolExecutor
|
| 15 |
-
from datetime import
|
| 16 |
-
from typing import Any
|
| 17 |
|
| 18 |
from fastapi import APIRouter, HTTPException, Request
|
| 19 |
|
|
@@ -30,7 +30,7 @@ router = APIRouter(prefix="/analyze", tags=["analysis"])
|
|
| 30 |
_executor = ThreadPoolExecutor(max_workers=4)
|
| 31 |
|
| 32 |
|
| 33 |
-
def _score_disease_heuristic(biomarkers:
|
| 34 |
"""Rule-based disease scoring (NOT ML prediction)."""
|
| 35 |
scores = {
|
| 36 |
"Diabetes": 0.0,
|
|
@@ -39,7 +39,7 @@ def _score_disease_heuristic(biomarkers: Dict[str, float]) -> Dict[str, Any]:
|
|
| 39 |
"Thrombocytopenia": 0.0,
|
| 40 |
"Thalassemia": 0.0
|
| 41 |
}
|
| 42 |
-
|
| 43 |
# Diabetes indicators
|
| 44 |
glucose = biomarkers.get("Glucose")
|
| 45 |
hba1c = biomarkers.get("HbA1c")
|
|
@@ -49,7 +49,7 @@ def _score_disease_heuristic(biomarkers: Dict[str, float]) -> Dict[str, Any]:
|
|
| 49 |
scores["Diabetes"] += 0.2
|
| 50 |
if hba1c is not None and hba1c >= 6.5:
|
| 51 |
scores["Diabetes"] += 0.5
|
| 52 |
-
|
| 53 |
# Anemia indicators
|
| 54 |
hemoglobin = biomarkers.get("Hemoglobin")
|
| 55 |
mcv = biomarkers.get("Mean Corpuscular Volume", biomarkers.get("MCV"))
|
|
@@ -59,7 +59,7 @@ def _score_disease_heuristic(biomarkers: Dict[str, float]) -> Dict[str, Any]:
|
|
| 59 |
scores["Anemia"] += 0.2
|
| 60 |
if mcv is not None and mcv < 80:
|
| 61 |
scores["Anemia"] += 0.2
|
| 62 |
-
|
| 63 |
# Heart disease indicators
|
| 64 |
cholesterol = biomarkers.get("Cholesterol")
|
| 65 |
troponin = biomarkers.get("Troponin")
|
|
@@ -70,32 +70,32 @@ def _score_disease_heuristic(biomarkers: Dict[str, float]) -> Dict[str, Any]:
|
|
| 70 |
scores["Heart Disease"] += 0.6
|
| 71 |
if ldl is not None and ldl > 190:
|
| 72 |
scores["Heart Disease"] += 0.2
|
| 73 |
-
|
| 74 |
# Thrombocytopenia indicators
|
| 75 |
platelets = biomarkers.get("Platelets")
|
| 76 |
if platelets is not None and platelets < 150000:
|
| 77 |
scores["Thrombocytopenia"] += 0.6
|
| 78 |
if platelets is not None and platelets < 50000:
|
| 79 |
scores["Thrombocytopenia"] += 0.3
|
| 80 |
-
|
| 81 |
# Thalassemia indicators
|
| 82 |
if mcv is not None and hemoglobin is not None and mcv < 80 and hemoglobin < 12.0:
|
| 83 |
scores["Thalassemia"] += 0.4
|
| 84 |
-
|
| 85 |
# Find top prediction
|
| 86 |
top_disease = max(scores, key=scores.get)
|
| 87 |
confidence = min(scores[top_disease], 1.0)
|
| 88 |
-
|
| 89 |
if confidence == 0.0:
|
| 90 |
top_disease = "Undetermined"
|
| 91 |
-
|
| 92 |
# Normalize probabilities
|
| 93 |
total = sum(scores.values())
|
| 94 |
if total > 0:
|
| 95 |
probabilities = {k: v / total for k, v in scores.items()}
|
| 96 |
else:
|
| 97 |
probabilities = {k: 1.0 / len(scores) for k in scores}
|
| 98 |
-
|
| 99 |
return {
|
| 100 |
"disease": top_disease,
|
| 101 |
"confidence": confidence,
|
|
@@ -105,16 +105,16 @@ def _score_disease_heuristic(biomarkers: Dict[str, float]) -> Dict[str, Any]:
|
|
| 105 |
|
| 106 |
async def _run_guild_analysis(
|
| 107 |
request: Request,
|
| 108 |
-
biomarkers:
|
| 109 |
-
patient_ctx:
|
| 110 |
-
extracted_biomarkers:
|
| 111 |
) -> AnalysisResponse:
|
| 112 |
"""Execute the ClinicalInsightGuild and build the response envelope."""
|
| 113 |
request_id = f"req_{uuid.uuid4().hex[:12]}"
|
| 114 |
t0 = time.time()
|
| 115 |
|
| 116 |
ragbot = getattr(request.app.state, "ragbot_service", None)
|
| 117 |
-
if ragbot is None
|
| 118 |
raise HTTPException(status_code=503, detail="Analysis service unavailable. Please wait for initialization.")
|
| 119 |
|
| 120 |
# Generate disease prediction
|
|
@@ -122,15 +122,16 @@ async def _run_guild_analysis(
|
|
| 122 |
|
| 123 |
try:
|
| 124 |
# Run sync function in thread pool
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 125 |
loop = asyncio.get_running_loop()
|
| 126 |
result = await loop.run_in_executor(
|
| 127 |
_executor,
|
| 128 |
-
lambda: ragbot.
|
| 129 |
-
biomarkers=biomarkers,
|
| 130 |
-
patient_context=patient_ctx,
|
| 131 |
-
model_prediction=model_prediction,
|
| 132 |
-
extracted_biomarkers=extracted_biomarkers
|
| 133 |
-
)
|
| 134 |
)
|
| 135 |
except Exception as exc:
|
| 136 |
logger.exception("Guild analysis failed: %s", exc)
|
|
@@ -142,20 +143,15 @@ async def _run_guild_analysis(
|
|
| 142 |
elapsed = (time.time() - t0) * 1000
|
| 143 |
|
| 144 |
# Build response from result
|
| 145 |
-
|
| 146 |
-
|
| 147 |
-
|
| 148 |
-
|
| 149 |
-
conversational_summary = result.get('conversational_summary')
|
| 150 |
-
else:
|
| 151 |
-
prediction = getattr(result, 'prediction', None)
|
| 152 |
-
analysis = getattr(result, 'analysis', None)
|
| 153 |
-
conversational_summary = getattr(result, 'conversational_summary', None)
|
| 154 |
|
| 155 |
return AnalysisResponse(
|
| 156 |
status="success",
|
| 157 |
request_id=request_id,
|
| 158 |
-
timestamp=datetime.now(
|
| 159 |
extracted_biomarkers=extracted_biomarkers,
|
| 160 |
input_biomarkers=biomarkers,
|
| 161 |
patient_context=patient_ctx,
|
|
|
|
| 12 |
import time
|
| 13 |
import uuid
|
| 14 |
from concurrent.futures import ThreadPoolExecutor
|
| 15 |
+
from datetime import UTC, datetime
|
| 16 |
+
from typing import Any
|
| 17 |
|
| 18 |
from fastapi import APIRouter, HTTPException, Request
|
| 19 |
|
|
|
|
| 30 |
_executor = ThreadPoolExecutor(max_workers=4)
|
| 31 |
|
| 32 |
|
| 33 |
+
def _score_disease_heuristic(biomarkers: dict[str, float]) -> dict[str, Any]:
|
| 34 |
"""Rule-based disease scoring (NOT ML prediction)."""
|
| 35 |
scores = {
|
| 36 |
"Diabetes": 0.0,
|
|
|
|
| 39 |
"Thrombocytopenia": 0.0,
|
| 40 |
"Thalassemia": 0.0
|
| 41 |
}
|
| 42 |
+
|
| 43 |
# Diabetes indicators
|
| 44 |
glucose = biomarkers.get("Glucose")
|
| 45 |
hba1c = biomarkers.get("HbA1c")
|
|
|
|
| 49 |
scores["Diabetes"] += 0.2
|
| 50 |
if hba1c is not None and hba1c >= 6.5:
|
| 51 |
scores["Diabetes"] += 0.5
|
| 52 |
+
|
| 53 |
# Anemia indicators
|
| 54 |
hemoglobin = biomarkers.get("Hemoglobin")
|
| 55 |
mcv = biomarkers.get("Mean Corpuscular Volume", biomarkers.get("MCV"))
|
|
|
|
| 59 |
scores["Anemia"] += 0.2
|
| 60 |
if mcv is not None and mcv < 80:
|
| 61 |
scores["Anemia"] += 0.2
|
| 62 |
+
|
| 63 |
# Heart disease indicators
|
| 64 |
cholesterol = biomarkers.get("Cholesterol")
|
| 65 |
troponin = biomarkers.get("Troponin")
|
|
|
|
| 70 |
scores["Heart Disease"] += 0.6
|
| 71 |
if ldl is not None and ldl > 190:
|
| 72 |
scores["Heart Disease"] += 0.2
|
| 73 |
+
|
| 74 |
# Thrombocytopenia indicators
|
| 75 |
platelets = biomarkers.get("Platelets")
|
| 76 |
if platelets is not None and platelets < 150000:
|
| 77 |
scores["Thrombocytopenia"] += 0.6
|
| 78 |
if platelets is not None and platelets < 50000:
|
| 79 |
scores["Thrombocytopenia"] += 0.3
|
| 80 |
+
|
| 81 |
# Thalassemia indicators
|
| 82 |
if mcv is not None and hemoglobin is not None and mcv < 80 and hemoglobin < 12.0:
|
| 83 |
scores["Thalassemia"] += 0.4
|
| 84 |
+
|
| 85 |
# Find top prediction
|
| 86 |
top_disease = max(scores, key=scores.get)
|
| 87 |
confidence = min(scores[top_disease], 1.0)
|
| 88 |
+
|
| 89 |
if confidence == 0.0:
|
| 90 |
top_disease = "Undetermined"
|
| 91 |
+
|
| 92 |
# Normalize probabilities
|
| 93 |
total = sum(scores.values())
|
| 94 |
if total > 0:
|
| 95 |
probabilities = {k: v / total for k, v in scores.items()}
|
| 96 |
else:
|
| 97 |
probabilities = {k: 1.0 / len(scores) for k in scores}
|
| 98 |
+
|
| 99 |
return {
|
| 100 |
"disease": top_disease,
|
| 101 |
"confidence": confidence,
|
|
|
|
| 105 |
|
| 106 |
async def _run_guild_analysis(
|
| 107 |
request: Request,
|
| 108 |
+
biomarkers: dict[str, float],
|
| 109 |
+
patient_ctx: dict[str, Any],
|
| 110 |
+
extracted_biomarkers: dict[str, float] | None = None,
|
| 111 |
) -> AnalysisResponse:
|
| 112 |
"""Execute the ClinicalInsightGuild and build the response envelope."""
|
| 113 |
request_id = f"req_{uuid.uuid4().hex[:12]}"
|
| 114 |
t0 = time.time()
|
| 115 |
|
| 116 |
ragbot = getattr(request.app.state, "ragbot_service", None)
|
| 117 |
+
if ragbot is None:
|
| 118 |
raise HTTPException(status_code=503, detail="Analysis service unavailable. Please wait for initialization.")
|
| 119 |
|
| 120 |
# Generate disease prediction
|
|
|
|
| 122 |
|
| 123 |
try:
|
| 124 |
# Run sync function in thread pool
|
| 125 |
+
from src.state import PatientInput
|
| 126 |
+
patient_input = PatientInput(
|
| 127 |
+
biomarkers=biomarkers,
|
| 128 |
+
patient_context=patient_ctx,
|
| 129 |
+
model_prediction=model_prediction
|
| 130 |
+
)
|
| 131 |
loop = asyncio.get_running_loop()
|
| 132 |
result = await loop.run_in_executor(
|
| 133 |
_executor,
|
| 134 |
+
lambda: ragbot.run(patient_input)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 135 |
)
|
| 136 |
except Exception as exc:
|
| 137 |
logger.exception("Guild analysis failed: %s", exc)
|
|
|
|
| 143 |
elapsed = (time.time() - t0) * 1000
|
| 144 |
|
| 145 |
# Build response from result
|
| 146 |
+
prediction = result.get('model_prediction')
|
| 147 |
+
analysis = result.get('final_response', {})
|
| 148 |
+
# Try to extract the conversational_summary if it's there
|
| 149 |
+
conversational_summary = analysis.get('conversational_summary') if isinstance(analysis, dict) else str(analysis)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 150 |
|
| 151 |
return AnalysisResponse(
|
| 152 |
status="success",
|
| 153 |
request_id=request_id,
|
| 154 |
+
timestamp=datetime.now(UTC).isoformat(),
|
| 155 |
extracted_biomarkers=extracted_biomarkers,
|
| 156 |
input_biomarkers=biomarkers,
|
| 157 |
patient_context=patient_ctx,
|
src/routers/ask.py
CHANGED
|
@@ -12,13 +12,12 @@ import json
|
|
| 12 |
import logging
|
| 13 |
import time
|
| 14 |
import uuid
|
| 15 |
-
from
|
| 16 |
-
from typing import AsyncGenerator
|
| 17 |
|
| 18 |
from fastapi import APIRouter, HTTPException, Request
|
| 19 |
from fastapi.responses import StreamingResponse
|
| 20 |
|
| 21 |
-
from src.schemas.schemas import AskRequest, AskResponse
|
| 22 |
|
| 23 |
logger = logging.getLogger(__name__)
|
| 24 |
router = APIRouter(tags=["ask"])
|
|
@@ -81,12 +80,12 @@ async def _stream_rag_response(
|
|
| 81 |
- error: Error information
|
| 82 |
"""
|
| 83 |
t0 = time.time()
|
| 84 |
-
|
| 85 |
try:
|
| 86 |
# Send initial status
|
| 87 |
yield f"event: status\ndata: {json.dumps({'stage': 'guardrail', 'message': 'Validating query...'})}\n\n"
|
| 88 |
await asyncio.sleep(0) # Allow event loop to flush
|
| 89 |
-
|
| 90 |
# Run the RAG pipeline (synchronous, but we yield progress)
|
| 91 |
loop = asyncio.get_running_loop()
|
| 92 |
result = await loop.run_in_executor(
|
|
@@ -97,16 +96,16 @@ async def _stream_rag_response(
|
|
| 97 |
patient_context=patient_context,
|
| 98 |
)
|
| 99 |
)
|
| 100 |
-
|
| 101 |
# Send retrieval metadata
|
| 102 |
yield f"event: metadata\ndata: {json.dumps({'documents_retrieved': len(result.get('retrieved_documents', [])), 'documents_relevant': len(result.get('relevant_documents', [])), 'guardrail_score': result.get('guardrail_score')})}\n\n"
|
| 103 |
await asyncio.sleep(0)
|
| 104 |
-
|
| 105 |
# Stream the answer token by token for smooth UI
|
| 106 |
answer = result.get("final_answer", "")
|
| 107 |
if answer:
|
| 108 |
yield f"event: status\ndata: {json.dumps({'stage': 'generating', 'message': 'Generating response...'})}\n\n"
|
| 109 |
-
|
| 110 |
# Simulate streaming by chunking the response
|
| 111 |
words = answer.split()
|
| 112 |
chunk_size = 3 # Send 3 words at a time
|
|
@@ -116,11 +115,11 @@ async def _stream_rag_response(
|
|
| 116 |
chunk += " "
|
| 117 |
yield f"event: token\ndata: {json.dumps({'text': chunk})}\n\n"
|
| 118 |
await asyncio.sleep(0.02) # Small delay for visual streaming effect
|
| 119 |
-
|
| 120 |
# Send completion
|
| 121 |
elapsed = (time.time() - t0) * 1000
|
| 122 |
yield f"event: done\ndata: {json.dumps({'request_id': request_id, 'processing_time_ms': round(elapsed, 1), 'status': 'success'})}\n\n"
|
| 123 |
-
|
| 124 |
except Exception as exc:
|
| 125 |
logger.exception("Streaming RAG failed: %s", exc)
|
| 126 |
yield f"event: error\ndata: {json.dumps({'error': str(exc), 'request_id': request_id})}\n\n"
|
|
@@ -154,9 +153,9 @@ async def ask_medical_question_stream(body: AskRequest, request: Request):
|
|
| 154 |
rag_service = getattr(request.app.state, "rag_service", None)
|
| 155 |
if rag_service is None:
|
| 156 |
raise HTTPException(status_code=503, detail="RAG service unavailable")
|
| 157 |
-
|
| 158 |
request_id = f"req_{uuid.uuid4().hex[:12]}"
|
| 159 |
-
|
| 160 |
return StreamingResponse(
|
| 161 |
_stream_rag_response(
|
| 162 |
rag_service,
|
|
@@ -172,3 +171,17 @@ async def ask_medical_question_stream(body: AskRequest, request: Request):
|
|
| 172 |
"X-Request-ID": request_id,
|
| 173 |
},
|
| 174 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 12 |
import logging
|
| 13 |
import time
|
| 14 |
import uuid
|
| 15 |
+
from collections.abc import AsyncGenerator
|
|
|
|
| 16 |
|
| 17 |
from fastapi import APIRouter, HTTPException, Request
|
| 18 |
from fastapi.responses import StreamingResponse
|
| 19 |
|
| 20 |
+
from src.schemas.schemas import AskRequest, AskResponse, FeedbackRequest, FeedbackResponse
|
| 21 |
|
| 22 |
logger = logging.getLogger(__name__)
|
| 23 |
router = APIRouter(tags=["ask"])
|
|
|
|
| 80 |
- error: Error information
|
| 81 |
"""
|
| 82 |
t0 = time.time()
|
| 83 |
+
|
| 84 |
try:
|
| 85 |
# Send initial status
|
| 86 |
yield f"event: status\ndata: {json.dumps({'stage': 'guardrail', 'message': 'Validating query...'})}\n\n"
|
| 87 |
await asyncio.sleep(0) # Allow event loop to flush
|
| 88 |
+
|
| 89 |
# Run the RAG pipeline (synchronous, but we yield progress)
|
| 90 |
loop = asyncio.get_running_loop()
|
| 91 |
result = await loop.run_in_executor(
|
|
|
|
| 96 |
patient_context=patient_context,
|
| 97 |
)
|
| 98 |
)
|
| 99 |
+
|
| 100 |
# Send retrieval metadata
|
| 101 |
yield f"event: metadata\ndata: {json.dumps({'documents_retrieved': len(result.get('retrieved_documents', [])), 'documents_relevant': len(result.get('relevant_documents', [])), 'guardrail_score': result.get('guardrail_score')})}\n\n"
|
| 102 |
await asyncio.sleep(0)
|
| 103 |
+
|
| 104 |
# Stream the answer token by token for smooth UI
|
| 105 |
answer = result.get("final_answer", "")
|
| 106 |
if answer:
|
| 107 |
yield f"event: status\ndata: {json.dumps({'stage': 'generating', 'message': 'Generating response...'})}\n\n"
|
| 108 |
+
|
| 109 |
# Simulate streaming by chunking the response
|
| 110 |
words = answer.split()
|
| 111 |
chunk_size = 3 # Send 3 words at a time
|
|
|
|
| 115 |
chunk += " "
|
| 116 |
yield f"event: token\ndata: {json.dumps({'text': chunk})}\n\n"
|
| 117 |
await asyncio.sleep(0.02) # Small delay for visual streaming effect
|
| 118 |
+
|
| 119 |
# Send completion
|
| 120 |
elapsed = (time.time() - t0) * 1000
|
| 121 |
yield f"event: done\ndata: {json.dumps({'request_id': request_id, 'processing_time_ms': round(elapsed, 1), 'status': 'success'})}\n\n"
|
| 122 |
+
|
| 123 |
except Exception as exc:
|
| 124 |
logger.exception("Streaming RAG failed: %s", exc)
|
| 125 |
yield f"event: error\ndata: {json.dumps({'error': str(exc), 'request_id': request_id})}\n\n"
|
|
|
|
| 153 |
rag_service = getattr(request.app.state, "rag_service", None)
|
| 154 |
if rag_service is None:
|
| 155 |
raise HTTPException(status_code=503, detail="RAG service unavailable")
|
| 156 |
+
|
| 157 |
request_id = f"req_{uuid.uuid4().hex[:12]}"
|
| 158 |
+
|
| 159 |
return StreamingResponse(
|
| 160 |
_stream_rag_response(
|
| 161 |
rag_service,
|
|
|
|
| 171 |
"X-Request-ID": request_id,
|
| 172 |
},
|
| 173 |
)
|
| 174 |
+
|
| 175 |
+
|
| 176 |
+
@router.post("/feedback", response_model=FeedbackResponse)
|
| 177 |
+
async def submit_feedback(body: FeedbackRequest, request: Request):
|
| 178 |
+
"""Submit user feedback for an analysis or RAG response."""
|
| 179 |
+
tracer = getattr(request.app.state, "tracer", None)
|
| 180 |
+
if tracer:
|
| 181 |
+
tracer.score(
|
| 182 |
+
trace_id=body.request_id,
|
| 183 |
+
name="user-feedback",
|
| 184 |
+
value=body.score,
|
| 185 |
+
comment=body.comment
|
| 186 |
+
)
|
| 187 |
+
return FeedbackResponse(request_id=body.request_id)
|
src/routers/health.py
CHANGED
|
@@ -7,7 +7,7 @@ Provides /health and /health/ready with per-service checks.
|
|
| 7 |
from __future__ import annotations
|
| 8 |
|
| 9 |
import time
|
| 10 |
-
from datetime import
|
| 11 |
|
| 12 |
from fastapi import APIRouter, Request
|
| 13 |
|
|
@@ -23,7 +23,7 @@ async def health_check(request: Request) -> HealthResponse:
|
|
| 23 |
uptime = time.time() - getattr(app_state, "start_time", time.time())
|
| 24 |
return HealthResponse(
|
| 25 |
status="healthy",
|
| 26 |
-
timestamp=datetime.now(
|
| 27 |
version=getattr(app_state, "version", "2.0.0"),
|
| 28 |
uptime_seconds=round(uptime, 2),
|
| 29 |
)
|
|
@@ -39,9 +39,10 @@ async def readiness_check(request: Request) -> HealthResponse:
|
|
| 39 |
|
| 40 |
# --- PostgreSQL ---
|
| 41 |
try:
|
| 42 |
-
from src.database import get_engine
|
| 43 |
from sqlalchemy import text
|
| 44 |
-
|
|
|
|
|
|
|
| 45 |
if engine is not None:
|
| 46 |
t0 = time.time()
|
| 47 |
with engine.connect() as conn:
|
|
@@ -86,9 +87,10 @@ async def readiness_check(request: Request) -> HealthResponse:
|
|
| 86 |
ollama = getattr(app_state, "ollama_client", None)
|
| 87 |
if ollama is not None:
|
| 88 |
t0 = time.time()
|
| 89 |
-
|
| 90 |
latency = (time.time() - t0) * 1000
|
| 91 |
-
|
|
|
|
| 92 |
else:
|
| 93 |
services.append(ServiceHealth(name="ollama", status="unavailable"))
|
| 94 |
except Exception as exc:
|
|
@@ -126,7 +128,7 @@ async def readiness_check(request: Request) -> HealthResponse:
|
|
| 126 |
|
| 127 |
return HealthResponse(
|
| 128 |
status=overall,
|
| 129 |
-
timestamp=datetime.now(
|
| 130 |
version=getattr(app_state, "version", "2.0.0"),
|
| 131 |
uptime_seconds=round(uptime, 2),
|
| 132 |
services=services,
|
|
|
|
| 7 |
from __future__ import annotations
|
| 8 |
|
| 9 |
import time
|
| 10 |
+
from datetime import UTC, datetime
|
| 11 |
|
| 12 |
from fastapi import APIRouter, Request
|
| 13 |
|
|
|
|
| 23 |
uptime = time.time() - getattr(app_state, "start_time", time.time())
|
| 24 |
return HealthResponse(
|
| 25 |
status="healthy",
|
| 26 |
+
timestamp=datetime.now(UTC).isoformat(),
|
| 27 |
version=getattr(app_state, "version", "2.0.0"),
|
| 28 |
uptime_seconds=round(uptime, 2),
|
| 29 |
)
|
|
|
|
| 39 |
|
| 40 |
# --- PostgreSQL ---
|
| 41 |
try:
|
|
|
|
| 42 |
from sqlalchemy import text
|
| 43 |
+
|
| 44 |
+
from src.database import _engine
|
| 45 |
+
engine = _engine()
|
| 46 |
if engine is not None:
|
| 47 |
t0 = time.time()
|
| 48 |
with engine.connect() as conn:
|
|
|
|
| 87 |
ollama = getattr(app_state, "ollama_client", None)
|
| 88 |
if ollama is not None:
|
| 89 |
t0 = time.time()
|
| 90 |
+
health_info = ollama.health()
|
| 91 |
latency = (time.time() - t0) * 1000
|
| 92 |
+
is_healthy = isinstance(health_info, dict) and health_info.get("status") == "ok"
|
| 93 |
+
services.append(ServiceHealth(name="ollama", status="ok" if is_healthy else "degraded", latency_ms=round(latency, 1)))
|
| 94 |
else:
|
| 95 |
services.append(ServiceHealth(name="ollama", status="unavailable"))
|
| 96 |
except Exception as exc:
|
|
|
|
| 128 |
|
| 129 |
return HealthResponse(
|
| 130 |
status=overall,
|
| 131 |
+
timestamp=datetime.now(UTC).isoformat(),
|
| 132 |
version=getattr(app_state, "version", "2.0.0"),
|
| 133 |
uptime_seconds=round(uptime, 2),
|
| 134 |
services=services,
|