Spaces:

samwell
/

medrax2

Paused

App Files Files Community

VictorLJZ committed on Aug 7, 2025

Commit

aff69d7

2 Parent(s): 1516987 7b3e756

Merge pull request #23 from bowang-lab/victor/benchmarking

Browse files

Files changed (9) hide show

.gitignore +3 -1
benchmarking/benchmarks/rexvqa_benchmark.py +6 -6
benchmarking/llm_providers/medrax_provider.py +8 -8
main.py +27 -21
medrax/docs/system_prompts.txt +5 -6
medrax/tools/__init__.py +0 -1
medrax/tools/medgemma.py +0 -225
medrax/tools/medgemma_client.py +0 -145
pyproject.toml +0 -3

.gitignore CHANGED Viewed

@@ -179,4 +179,6 @@ model-weights/
 .DS_Store
-benchmarking/data/

 .DS_Store
+benchmarking/data/
+model_cache/
+medgemma/

benchmarking/benchmarks/rexvqa_benchmark.py CHANGED Viewed

@@ -34,20 +34,20 @@ class ReXVQABenchmark(Benchmark):
             data_dir (str): Directory to store/cache downloaded data
             **kwargs: Additional configuration parameters
                 split (str): Dataset split to use (default: 'test')
-                cache_dir (str): Directory for caching HuggingFace datasets
                 trust_remote_code (bool): Whether to trust remote code (default: False)
                 max_questions (int): Maximum number of questions to load (default: None, load all)
                 images_dir (str): Directory containing extracted PNG images (default: None)
         """
         self.split = kwargs.get("split", "test")
-        self.cache_dir = kwargs.get("cache_dir", None)
         self.trust_remote_code = kwargs.get("trust_remote_code", False)
         self.max_questions = kwargs.get("max_questions", None)
-        self.images_dir = "benchmarking/data/rexvqa/images/deid_png"
         self.image_dataset = None
         self.image_mapping = {}  # Maps study_id to image data
         super().__init__(data_dir, **kwargs)
     @staticmethod
     def download_rexgradient_images(output_dir: str = "benchmarking/data/rexvqa", repo_id: str = "rajpurkarlab/ReXGradient-160K"):
@@ -166,8 +166,8 @@ class ReXVQABenchmark(Benchmark):
         """Load ReXVQA data from local JSON file."""
         try:
             # Check for images and test_vqa_data.json, download if missing
-            self.download_test_vqa_data_json()
-            self.download_rexgradient_images()
             # Construct path to the JSON file
             json_file_path = os.path.join("benchmarking", "data", "rexvqa", "metadata", "test_vqa_data.json")
@@ -197,7 +197,7 @@ class ReXVQABenchmark(Benchmark):
                 self.image_dataset = load_dataset(
                     "rajpurkarlab/ReXGradient-160K",
                     split="test",
-                    cache_dir=self.cache_dir,
                     trust_remote_code=self.trust_remote_code
                 )
                 print(f"Loaded {len(self.image_dataset)} image metadata entries from ReXGradient-160K")

             data_dir (str): Directory to store/cache downloaded data
             **kwargs: Additional configuration parameters
                 split (str): Dataset split to use (default: 'test')
                 trust_remote_code (bool): Whether to trust remote code (default: False)
                 max_questions (int): Maximum number of questions to load (default: None, load all)
                 images_dir (str): Directory containing extracted PNG images (default: None)
         """
         self.split = kwargs.get("split", "test")
         self.trust_remote_code = kwargs.get("trust_remote_code", False)
         self.max_questions = kwargs.get("max_questions", None)
         self.image_dataset = None
         self.image_mapping = {}  # Maps study_id to image data
         super().__init__(data_dir, **kwargs)
+        # Set images_dir after parent initialization
+        self.images_dir = f"{self.data_dir}/images/deid_png"
     @staticmethod
     def download_rexgradient_images(output_dir: str = "benchmarking/data/rexvqa", repo_id: str = "rajpurkarlab/ReXGradient-160K"):
         """Load ReXVQA data from local JSON file."""
         try:
             # Check for images and test_vqa_data.json, download if missing
+            self.download_test_vqa_data_json(self.data_dir)
+            self.download_rexgradient_images(self.data_dir)
             # Construct path to the JSON file
             json_file_path = os.path.join("benchmarking", "data", "rexvqa", "metadata", "test_vqa_data.json")
                 self.image_dataset = load_dataset(
                     "rajpurkarlab/ReXGradient-160K",
                     split="test",
+                    cache_dir=self.data_dir,
                     trust_remote_code=self.trust_remote_code
                 )
                 print(f"Loaded {len(self.image_dataset)} image metadata entries from ReXGradient-160K")

benchmarking/llm_providers/medrax_provider.py CHANGED Viewed

@@ -33,15 +33,15 @@ class MedRAXProvider(LLMProvider):
             print("Starting server...")
             selected_tools = [
-                "ChestXRayReportGeneratorTool",  # For generating medical reports from X-rays
-                "MedicalRAGTool",  # For retrieval-augmented generation with medical knowledge
-                "WebBrowserTool",  # For web browsing and search capabilities
                 "TorchXRayVisionClassifierTool",  # For classifying chest X-ray images using TorchXRayVision
                 "ArcPlusClassifierTool",  # For advanced chest X-ray classification using ArcPlus
-                "DuckDuckGoSearchTool",  # For privacy-focused web search using DuckDuckGo
-                "XRayVQATool",  # For visual question answering on X-rays
                 "XRayPhraseGroundingTool",  # For locating described features in X-rays
-                "MedGemmaVQATool"
             ]
             rag_config = RAGConfig(
@@ -64,11 +64,11 @@ class MedRAXProvider(LLMProvider):
             agent, tools_dict = initialize_agent(
                 prompt_file="medrax/docs/system_prompts.txt",
                 tools_to_use=selected_tools,
-                model_dir="/model-weights",
                 temp_dir="temp",  # Change this to the path of the temporary directory
                 device="cuda:0",
                 model=self.model_name,  # Change this to the model you want to use, e.g. gpt-4.1-2025-04-14, gemini-2.5-pro
-                temperature=0.3,
                 top_p=0.95,
                 model_kwargs=model_kwargs,
                 rag_config=rag_config,

             print("Starting server...")
             selected_tools = [
                 "TorchXRayVisionClassifierTool",  # For classifying chest X-ray images using TorchXRayVision
                 "ArcPlusClassifierTool",  # For advanced chest X-ray classification using ArcPlus
+                "ChestXRayReportGeneratorTool",  # For generating medical reports from X-rays
                 "XRayPhraseGroundingTool",  # For locating described features in X-rays
+                "MedGemmaVQATool",
+                # "XRayVQATool",  # For visual question answering on X-rays
+                # "MedicalRAGTool",  # For retrieval-augmented generation with medical knowledge
+                # "WebBrowserTool",  # For web browsing and search capabilities
+                # "DuckDuckGoSearchTool",  # For privacy-focused web search using DuckDuckGo
             ]
             rag_config = RAGConfig(
             agent, tools_dict = initialize_agent(
                 prompt_file="medrax/docs/system_prompts.txt",
                 tools_to_use=selected_tools,
+                model_dir="/scratch/ssd004/scratch/victorli/model-weights",
                 temp_dir="temp",  # Change this to the path of the temporary directory
                 device="cuda:0",
                 model=self.model_name,  # Change this to the model you want to use, e.g. gpt-4.1-2025-04-14, gemini-2.5-pro
+                temperature=1.0,
                 top_p=0.95,
                 model_kwargs=model_kwargs,
                 rag_config=rag_config,

main.py CHANGED Viewed

@@ -10,6 +10,7 @@ with different model weights, tools, and parameters.
 """
 import warnings
 from typing import Dict, List, Optional, Any
 from dotenv import load_dotenv
 from transformers import logging
@@ -33,11 +34,11 @@ _ = load_dotenv()
 def initialize_agent(
     prompt_file: str,
     tools_to_use: Optional[List[str]] = None,
-    model_dir: str = "/model-weights",
     temp_dir: str = "temp",
     device: str = "cpu",
-    model: str = "gpt-4.1-2025-04-14",
-    temperature: float = 0.7,
     top_p: float = 0.95,
     rag_config: Optional[RAGConfig] = None,
     model_kwargs: Dict[str, Any] = {},
@@ -67,7 +68,7 @@ def initialize_agent(
     prompt = prompts[system_prompt]
     # Define the URL of the MedGemma FastAPI service.
-    MEDGEMMA_API_URL = os.getenv("MEDGEMMA_API_URL", "http://127.0.0.1:8002")
     all_tools = {
         "TorchXRayVisionClassifierTool": lambda: TorchXRayVisionClassifierTool(device=device),
@@ -88,24 +89,29 @@ def initialize_agent(
         "DicomProcessorTool": lambda: DicomProcessorTool(temp_dir=temp_dir),
         "MedicalRAGTool": lambda: RAGTool(config=rag_config),
         "WebBrowserTool": lambda: WebBrowserTool(),
         "MedSAM2Tool": lambda: MedSAM2Tool(
             device=device, cache_dir=model_dir, temp_dir=temp_dir
         ),
         "MedGemmaVQATool": lambda: MedGemmaAPIClientTool(cache_dir=model_dir, device=device, api_url=MEDGEMMA_API_URL)
-    }
-    try:
-        tools_dict["PythonSandboxTool"] = create_python_sandbox()
-    except Exception as e:
-        print(f"Error creating PythonSandboxTool: {e}")
-        print("Skipping PythonSandboxTool")
     # Initialize only selected tools or all if none specified
     tools_dict: Dict[str, BaseTool] = {}
-    tools_to_use = tools_to_use or all_tools.keys()
     for tool_name in tools_to_use:
         if tool_name in all_tools:
             tools_dict[tool_name] = all_tools[tool_name]()
     # Set up checkpointing for conversation state
     checkpointer = MemorySaver()
@@ -145,20 +151,20 @@ if __name__ == "__main__":
     selected_tools = [
         "ImageVisualizerTool",  # For displaying images in the UI
         # "DicomProcessorTool",  # For processing DICOM medical image files
         "TorchXRayVisionClassifierTool",  # For classifying chest X-ray images using TorchXRayVision
         "ArcPlusClassifierTool",  # For advanced chest X-ray classification using ArcPlus
-        "ChestXRaySegmentationTool",  # For segmenting anatomical regions in chest X-rays
-        "ChestXRayReportGeneratorTool",  # For generating medical reports from X-rays
         "XRayVQATool",  # For visual question answering on X-rays
         # "LlavaMedTool",  # For multimodal medical image understanding
         "XRayPhraseGroundingTool",  # For locating described features in X-rays
-        # "ChestXRayGeneratorTool",  # For generating synthetic chest X-rays
         # "MedSAM2Tool",  # For advanced medical image segmentation using MedSAM2
         # "WebBrowserTool",  # For web browsing and search capabilities
         # "MedicalRAGTool",  # For retrieval-augmented generation with medical knowledge
         # "PythonSandboxTool",  # Add the Python sandbox tool
-        "MedGemmaVQATool" # Google MedGemma VQA tool
-        "DuckDuckGoSearchTool",  # For privacy-focused web search using DuckDuckGo
     ]
     # Setup the MedGemma environment if the MedGemmaVQATool is selected
@@ -187,11 +193,11 @@ if __name__ == "__main__":
     agent, tools_dict = initialize_agent(
         prompt_file="medrax/docs/system_prompts.txt",
         tools_to_use=selected_tools,
-        model_dir="/model-weights",
         temp_dir="temp",  # Change this to the path of the temporary directory
-        device="cuda:0",
-        model="gpt-4.1-2025-04-14",  # Change this to the model you want to use, e.g. gpt-4.1-2025-04-14, gemini-2.5-pro
-        temperature=0.7,
         top_p=0.95,
         model_kwargs=model_kwargs,
         rag_config=rag_config,

 """
 import warnings
+import os
 from typing import Dict, List, Optional, Any
 from dotenv import load_dotenv
 from transformers import logging
 def initialize_agent(
     prompt_file: str,
     tools_to_use: Optional[List[str]] = None,
+    model_dir: str = "model-weights",
     temp_dir: str = "temp",
     device: str = "cpu",
+    model: str = "gemini-2.5-pro",
+    temperature: float = 1.0,
     top_p: float = 0.95,
     rag_config: Optional[RAGConfig] = None,
     model_kwargs: Dict[str, Any] = {},
     prompt = prompts[system_prompt]
     # Define the URL of the MedGemma FastAPI service.
+    MEDGEMMA_API_URL = os.getenv("MEDGEMMA_API_URL", "http://172.17.8.141:8002")
     all_tools = {
         "TorchXRayVisionClassifierTool": lambda: TorchXRayVisionClassifierTool(device=device),
         "DicomProcessorTool": lambda: DicomProcessorTool(temp_dir=temp_dir),
         "MedicalRAGTool": lambda: RAGTool(config=rag_config),
         "WebBrowserTool": lambda: WebBrowserTool(),
+        "DuckDuckGoSearchTool": lambda: DuckDuckGoSearchTool(),
         "MedSAM2Tool": lambda: MedSAM2Tool(
             device=device, cache_dir=model_dir, temp_dir=temp_dir
         ),
         "MedGemmaVQATool": lambda: MedGemmaAPIClientTool(cache_dir=model_dir, device=device, api_url=MEDGEMMA_API_URL)
+    }
     # Initialize only selected tools or all if none specified
     tools_dict: Dict[str, BaseTool] = {}
+    if tools_to_use is None:
+        tools_to_use = []
     for tool_name in tools_to_use:
+        if tool_name == "PythonSandboxTool":
+            try:
+                tools_dict["PythonSandboxTool"] = create_python_sandbox()
+            except Exception as e:
+                print(f"Error creating PythonSandboxTool: {e}")
+                print("Skipping PythonSandboxTool")
         if tool_name in all_tools:
             tools_dict[tool_name] = all_tools[tool_name]()
     # Set up checkpointing for conversation state
     checkpointer = MemorySaver()
     selected_tools = [
         "ImageVisualizerTool",  # For displaying images in the UI
         # "DicomProcessorTool",  # For processing DICOM medical image files
+        # "ChestXRayGeneratorTool",  # For generating synthetic chest X-rays
+        "ChestXRayReportGeneratorTool",  # For generating medical reports from X-rays
         "TorchXRayVisionClassifierTool",  # For classifying chest X-ray images using TorchXRayVision
         "ArcPlusClassifierTool",  # For advanced chest X-ray classification using ArcPlus
+        "MedGemmaVQATool" # Google MedGemma VQA tool
         "XRayVQATool",  # For visual question answering on X-rays
         # "LlavaMedTool",  # For multimodal medical image understanding
         "XRayPhraseGroundingTool",  # For locating described features in X-rays
+        "ChestXRaySegmentationTool",  # For segmenting anatomical regions in chest X-rays
         # "MedSAM2Tool",  # For advanced medical image segmentation using MedSAM2
         # "WebBrowserTool",  # For web browsing and search capabilities
+        "DuckDuckGoSearchTool",  # For privacy-focused web search using DuckDuckGo
         # "MedicalRAGTool",  # For retrieval-augmented generation with medical knowledge
         # "PythonSandboxTool",  # Add the Python sandbox tool
     ]
     # Setup the MedGemma environment if the MedGemmaVQATool is selected
     agent, tools_dict = initialize_agent(
         prompt_file="medrax/docs/system_prompts.txt",
         tools_to_use=selected_tools,
+        model_dir="model-weights",
         temp_dir="temp",  # Change this to the path of the temporary directory
+        device="cpu",
+        model="gemini-2.5-pro",  # Change this to the model you want to use, e.g. gpt-4.1-2025-04-14, gemini-2.5-pro
+        temperature=1.0,
         top_p=0.95,
         model_kwargs=model_kwargs,
         rag_config=rag_config,

medrax/docs/system_prompts.txt CHANGED Viewed

@@ -17,10 +17,9 @@ Examples:
 - "Based on clinical guidelines [3], the recommended treatment approach is..."
 [CHESTAGENTBENCH_PROMPT]
-You are an expert medical AI assistant who can answer any medical questions and analyze medical images similar to a doctor.
-Solve using your own vision and reasoning and use tools (if available) to complement your reasoning.
-You can make multiple tool calls in parallel or in sequence as needed for comprehensive answers.
-Think critically about and criticize the tool outputs.
-If you need to look up some information before asking a follow up question, you are allowed to do that.
 When encountering a multiple-choice question, your final response should end with "Final answer: \boxed{A}" from list of possible choices A, B, C, D, E, F.
-It is extremely important that you strictly answer in the format mentioned above.

 - "Based on clinical guidelines [3], the recommended treatment approach is..."
 [CHESTAGENTBENCH_PROMPT]
+You are an expert medical assistant who can answer medical questions and analyze medical images with world-class accuracy.
+Use your state-of-the-art reasoning and critical thinking skills to answer the questions that you are asked.
+You may use tools (if available) to complement your reasoning and you are allowed to make multiple tool calls in parallel or in sequence as needed for comprehensive answers.
+Think critically about how to best use the tools available to you and scrutinize the tool outputs.
 When encountering a multiple-choice question, your final response should end with "Final answer: \boxed{A}" from list of possible choices A, B, C, D, E, F.
+It is extremely important that you answer strictly in the format described above.

medrax/tools/__init__.py CHANGED Viewed

@@ -11,4 +11,3 @@ from .utils import *
 from .rag import *
 from .browsing import *
 from .python_tool import *
-from .medsam2 import *

 from .rag import *
 from .browsing import *
 from .python_tool import *

medrax/tools/medgemma.py DELETED Viewed

@@ -1,225 +0,0 @@
-from fastapi import FastAPI, File, UploadFile, Form, HTTPException
-from pydantic import BaseModel, Field
-from typing import List, Optional, Any, Dict, Tuple
-from pathlib import Path
-import torch
-from PIL import Image
-from transformers import pipeline, BitsAndBytesConfig
-import asyncio
-import uvicorn
-import os
-import uuid
-import traceback
-import sys
-import transformers
-print("--- ENVIRONMENT CHECK ---")
-print(f"Python Executable: {sys.executable}")
-print(f"PyTorch version: {torch.__version__}")
-print(f"Transformers version: {transformers.__version__}")
-print("-----------------------")
-# --- Configuration ---
-CACHE_DIR = "./model_cache"
-UPLOAD_DIR = "./uploaded_images"
-# Create directories if they don't exist
-os.makedirs(CACHE_DIR, exist_ok=True)
-os.makedirs(UPLOAD_DIR, exist_ok=True)
-# --- Pydantic Models for API ---
-class VQAInput(BaseModel):
-    prompt: str = Field(..., description="Question or instruction about the medical images")
-    system_prompt: Optional[str] = Field(
-        "You are an expert radiologist.",
-        description="System prompt to set the context for the model",
-    )
-    max_new_tokens: int = Field(
-        300, description="Maximum number of tokens to generate in the response"
-    )
-class VQAResponse(BaseModel):
-    response: str
-    metadata: Dict[str, Any]
-class ErrorResponse(BaseModel):
-    error: str
-    metadata: Dict[str, Any]
-# --- MedGemma Model Handling ---
-class MedGemmaModel:
-    _instance = None
-    def __new__(cls, *args, **kwargs):
-        if not cls._instance:
-            cls._instance = super(MedGemmaModel, cls).__new__(cls)
-        return cls._instance
-    def __init__(self,
-                 model_name: str = "google/medgemma-4b-it",
-                 device: Optional[str] = "cuda",
-                 dtype: torch.dtype = torch.bfloat16,
-                 load_in_4bit: bool = False):
-        if hasattr(self, 'pipe') and self.pipe is not None:
-            return
-        self.device = device if device and torch.cuda.is_available() else "cpu"
-        self.dtype = dtype
-        self.pipe = None
-        model_kwargs = {"torch_dtype": self.dtype, "cache_dir": CACHE_DIR}
-        if load_in_4bit:
-            model_kwargs["quantization_config"] = BitsAndBytesConfig(load_in_4bit=True)
-        model_kwargs["device_map"] = {"": self.device}
-        try:
-            self.pipe = pipeline("image-text-to-text",
-                                 model=model_name,
-                                 model_kwargs=model_kwargs,
-                                 trust_remote_code=True,
-                                 use_cache=True)
-        except Exception as e:
-            raise RuntimeError(f"Failed to initialize MedGemma pipeline: {str(e)}")
-    def _prepare_messages(
-        self, image_paths: List[str], prompt: str, system_prompt: str
-    ) -> Tuple[List[Dict[str, Any]], List[Image.Image]]:
-        images = []
-        for path in image_paths:
-            if not Path(path).is_file():
-                raise FileNotFoundError(f"Image file not found: {path}")
-            image = Image.open(path)
-            if image.mode != "RGB":
-                image = image.convert("RGB")
-            images.append(image)
-        messages = [
-            {"role": "system", "content": [{"type": "text", "text": system_prompt}]},
-            {
-                "role": "user",
-                "content": [{"type": "text", "text": prompt}]
-                + [{"type": "image", "image": img} for img in images],
-            },
-        ]
-        return messages, images
-    async def aget_response(self, image_paths: List[str], prompt: str, system_prompt: str, max_new_tokens: int) -> str:
-        loop = asyncio.get_event_loop()
-        messages, _ = await loop.run_in_executor(None, self._prepare_messages, image_paths, prompt, system_prompt)
-        def _generate():
-            return self.pipe(
-                text=messages,
-                max_new_tokens=max_new_tokens,
-                do_sample=False,
-            )
-        output = await loop.run_in_executor(None, _generate)
-        if (
-            isinstance(output, list)
-            and output
-            and isinstance(output[0].get("generated_text"), list)
-        ):
-            generated_text = output[0]["generated_text"]
-            if generated_text:
-                return generated_text[-1].get("content", "").strip()
-        return "No response generated"
-# --- FastAPI Application ---
-app = FastAPI(title="MedGemma VQA API",
-              description="API for medical visual question answering using Google's MedGemma model.")
-medgemma_model: Optional[MedGemmaModel] = None
-@app.on_event("startup")
-async def startup_event():
-    """Load the MedGemma model at application startup."""
-    global medgemma_model
-    try:
-        medgemma_model = MedGemmaModel()
-        print("MedGemma model loaded successfully.")
-    except RuntimeError as e:
-        print(f"Error loading MedGemma model: {e}")
-        # Depending on the desired behavior, you might want to exit the application
-        # if the model fails to load.
-        # exit(1)
-@app.post("/analyze-images/",
-            response_model=VQAResponse,
-            responses={500: {"model": ErrorResponse},
-                       404: {"model": ErrorResponse}},
-            summary="Analyze one or more medical images")
-async def analyze_images(
-    images: List[UploadFile] = File(..., description="List of medical image files to analyze (JPG or PNG)."),
-    prompt: str = Form(..., description="Question or instruction about the medical images."),
-    system_prompt: Optional[str] = Form("You are an expert radiologist.", description="System prompt to set the context for the model."),
-    max_new_tokens: int = Form(100, description="Maximum number of tokens to generate in the response.")
-):
-    """
-    Upload one or more medical images and a prompt to get an analysis from the MedGemma model.
-    """
-    if medgemma_model is None or medgemma_model.pipe is None:
-        raise HTTPException(status_code=503, detail="Model is not available. Please try again later.")
-    image_paths = []
-    for image in images:
-        if image.content_type not in ["image/jpeg", "image/png"]:
-            raise HTTPException(status_code=400, detail=f"Unsupported image format: {image.content_type}. Only JPG and PNG are supported.")
-        # Generate a unique filename to avoid overwrites
-        unique_filename = f"{uuid.uuid4()}_{image.filename}"
-        file_path = os.path.join(UPLOAD_DIR, unique_filename)
-        try:
-            with open(file_path, "wb") as buffer:
-                buffer.write(await image.read())
-            image_paths.append(file_path)
-        except Exception as e:
-            raise HTTPException(status_code=500, detail=f"Failed to save uploaded image: {str(e)}")
-    try:
-        response_text = await medgemma_model.aget_response(image_paths, prompt, system_prompt, max_new_tokens)
-        metadata = {
-            "image_paths": image_paths,
-            "prompt": prompt,
-            "system_prompt": system_prompt,
-            "max_new_tokens": max_new_tokens,
-            "num_images": len(image_paths),
-            "analysis_status": "completed",
-        }
-        return VQAResponse(response=response_text, metadata=metadata)
-    except FileNotFoundError as e:
-        raise HTTPException(status_code=404, detail=f"Image file not found: {str(e)}")
-    except Exception as e:
-        print("--- AN EXCEPTION OCCURRED IN THE ENDPOINT ---")
-        traceback.print_exc()
-        # Catch potential CUDA out-of-memory errors and other exceptions
-        error_message = "An unexpected error occurred during analysis."
-        if "CUDA out of memory" in str(e):
-            error_message = "GPU memory exhausted. Try reducing image resolution or max_new_tokens."
-        metadata = {
-            "image_paths": image_paths,
-            "prompt": prompt,
-            "analysis_status": "failed",
-            "error_details": str(e),
-        }
-        raise HTTPException(status_code=500, detail=error_message)
-    finally:
-        # Clean up saved images
-        for path in image_paths:
-            try:
-                os.remove(path)
-            except OSError:
-                # Log this error if needed, but don't let it crash the request
-                pass
-if __name__ == "__main__":
-    uvicorn.run(app, host="0.0.0.0", port=8002)

medrax/tools/medgemma_client.py DELETED Viewed

@@ -1,145 +0,0 @@
-import httpx
-from typing import Dict, List, Optional, Type, Any
-from langchain_core.tools import BaseTool
-from langchain_core.callbacks import (
-    AsyncCallbackManagerForToolRun,
-    CallbackManagerForToolRun,
-)
-from pydantic import BaseModel, Field
-import os
-# This input schema should be identical to the one in your original tool
-class MedGemmaVQAInput(BaseModel):
-    """Input schema for the MedGemma VQA Tool. The agent provides local paths to images."""
-    image_paths: List[str] = Field(
-        ...,
-        description="List of paths to medical image files to analyze. These are local paths accessible to the agent.",
-    )
-    prompt: str = Field(..., description="Question or instruction about the medical images")
-    system_prompt: Optional[str] = Field(
-        "You are an expert radiologist.",
-        description="System prompt to set the context for the model",
-    )
-    max_new_tokens: int = Field(
-        300, description="Maximum number of tokens to generate in the response"
-    )
-class MedGemmaAPIClientTool(BaseTool):
-    """
-    A client tool to interact with a remote MedGemma VQA FastAPI service.
-    This tool takes local image paths, reads them, and sends them to the API endpoint
-    for analysis.
-    """
-    name: str = "medgemma_medical_vqa_service"
-    description: str = (
-        "Sends medical images and a prompt to a specialized MedGemma VQA service for analysis. "
-        "Use this for expert-level reasoning, diagnosis assistance, and detailed image interpretation "
-        "across modalities like chest X-rays, dermatology, etc. Input must be local image paths and a prompt."
-    )
-    args_schema: Type[BaseModel] = MedGemmaVQAInput
-    api_url: str  # The URL of the running FastAPI service
-    def _run(
-        self,
-        image_paths: List[str],
-        prompt: str,
-        system_prompt: str = "You are an expert radiologist.",
-        max_new_tokens: int = 300,
-        run_manager: Optional[CallbackManagerForToolRun] = None,
-    ) -> str:
-        """Execute the tool synchronously."""
-        # httpx is a modern HTTP client that supports sync and async
-        timeout_config = httpx.Timeout(300.0, connect=10.0)
-        client = httpx.Client(timeout=timeout_config)
-        # Prepare the multipart form data
-        files_to_send = []
-        opened_files = []
-        try:
-            for path in image_paths:
-                f = open(path, "rb")
-                opened_files.append(f)
-                # The key 'images' must match the parameter name in the FastAPI endpoint
-                files_to_send.append(("images", (os.path.basename(path), f, "image/jpeg")))
-            data = {
-                "prompt": prompt,
-                "system_prompt": system_prompt,
-                "max_new_tokens": max_new_tokens,
-            }
-            response = client.post(
-                f"{self.api_url}/analyze-images/",
-                data=data,
-                files=files_to_send,
-            )
-            response.raise_for_status()  # Raise an exception for bad status codes (4xx or 5xx)
-            # The agent expects a string response from a tool
-            return response.json()["response"]
-        # --- KEY FIX 3: More specific exception handling for clearer errors ---
-        except httpx.TimeoutException:
-            return f"Error: The request to the MedGemma API timed out after {timeout_config.read} seconds. The server might be overloaded or the model is taking too long to load. Try again later."
-        except httpx.ConnectError:
-            return f"Error: Could not connect to the MedGemma API. Check if the server address '{self.api_url}' is correct and running."
-        except httpx.HTTPStatusError as e:
-            return f"Error: The MedGemma API returned an error (Status {e.response.status_code}): {e.response.text}"
-        except Exception as e:
-            return f"An unexpected error occurred in the MedGemma client tool: {str(e)}"
-        finally:
-            # Important: Ensure all opened files are closed.
-            for f in opened_files:
-                f.close()
-    async def _arun(
-        self,
-        image_paths: List[str],
-        prompt: str,
-        system_prompt: str = "You are an expert radiologist.",
-        max_new_tokens: int = 300,
-        run_manager: Optional[AsyncCallbackManagerForToolRun] = None,
-    ) -> str:
-        """Execute the tool asynchronously."""
-        async with httpx.AsyncClient() as client:
-            files_to_send = []
-            opened_files = []
-            try:
-                # Note: File I/O is blocking, for a truly async app you might use aiofiles
-                # But for this use case, this is generally acceptable.
-                for path in image_paths:
-                    f = open(path, "rb")
-                    opened_files.append(f)
-                    files_to_send.append(("images", (os.path.basename(path), f, "image/jpeg")))
-                data = {
-                    "prompt": prompt,
-                    "system_prompt": system_prompt,
-                    "max_new_tokens": max_new_tokens,
-                }
-                response = await client.post(
-                    f"{self.api_url}/analyze-images/",
-                    data=data,
-                    files=files_to_send,
-                    timeout=120.0
-                )
-                response.raise_for_status()
-                return response.json()["response"]
-            except httpx.HTTPStatusError as e:
-                return f"Error calling MedGemma API: {e.response.status_code} - {e.response.text}"
-            except Exception as e:
-                return f"An unexpected error occurred: {str(e)}"
-            finally:
-                for f in opened_files:
-                    f.close()
-if __name__ == "__main__":
-    client_tool = MedGemmaAPIClientTool(api_url="http://localhost:8002")
-    result = client_tool.run({
-        "image_paths": ["demo/chest/pneumonia1.jpg"],
-        "prompt": "What abnormality do you see?"
-    })
-    print(result)

pyproject.toml CHANGED Viewed

@@ -57,7 +57,6 @@ dependencies = [
     "torch>=2.2.0",
     "torchvision>=0.10.0",
     "scikit-image>=0.18.0",
-    "gradio>=5.0.0",
     "opencv-python>=4.8.0",
     "matplotlib>=3.8.0",
     "diffusers>=0.20.0",
@@ -65,13 +64,11 @@ dependencies = [
     "pylibjpeg>=1.0.0",
     "jupyter>=1.0.0",
     "albumentations>=1.0.0",
-    "pyarrow>=10.0.0",
     "chromadb>=0.0.10",
     "pinecone-client>=3.2.2",
     "langchain-pinecone>=0.0.1",
     "langchain-google-genai>=0.1.0",
     "ray>=2.9.0",
-    "langchain-sandbox>=0.0.6",
     "seaborn>=0.12.0",
     "huggingface_hub>=0.17.0",
     "iopath>=0.1.10",

     "torch>=2.2.0",
     "torchvision>=0.10.0",
     "scikit-image>=0.18.0",
     "opencv-python>=4.8.0",
     "matplotlib>=3.8.0",
     "diffusers>=0.20.0",
     "pylibjpeg>=1.0.0",
     "jupyter>=1.0.0",
     "albumentations>=1.0.0",
     "chromadb>=0.0.10",
     "pinecone-client>=3.2.2",
     "langchain-pinecone>=0.0.1",
     "langchain-google-genai>=0.1.0",
     "ray>=2.9.0",
     "seaborn>=0.12.0",
     "huggingface_hub>=0.17.0",
     "iopath>=0.1.10",