mosaic-zero / tests /test_fixtures.py
raylim's picture
Add GitHub Actions workflows and comprehensive test suite
4780d8d unverified
"""Shared fixtures and utilities for UI and CLI tests.
This module provides reusable fixtures for testing the Mosaic Gradio UI and CLI,
including mock file objects, settings DataFrames, cancer subtype mappings, and
utility functions for test setup/teardown.
"""
import tempfile
from pathlib import Path
from unittest.mock import Mock
import pandas as pd
import numpy as np
import pytest
from PIL import Image
# ============================================================================
# File and Path Fixtures
# ============================================================================
@pytest.fixture
def test_slide_path():
"""Path to actual test slide for integration tests."""
return Path("tests/testdata/948176.svs")
@pytest.fixture
def temp_output_dir():
"""Temporary directory for test outputs."""
with tempfile.TemporaryDirectory(prefix="mosaic_test_") as tmpdir:
yield Path(tmpdir)
@pytest.fixture
def mock_user_dir(temp_output_dir):
"""Mock user directory (same as temp_output_dir for simplicity)."""
return temp_output_dir
# ============================================================================
# Mock File Upload Fixtures
# ============================================================================
@pytest.fixture
def sample_files_single():
"""Mock single file upload."""
mock_file = Mock()
mock_file.name = "test_slide_1.svs"
return [mock_file]
@pytest.fixture
def sample_files_multiple():
"""Mock multiple file uploads (3 files)."""
files = []
for i in range(1, 4):
mock_file = Mock()
mock_file.name = f"test_slide_{i}.svs"
files.append(mock_file)
return files
def create_mock_file(filename):
"""Create a mock file object with specified filename.
Args:
filename: Name for the mock file
Returns:
Mock object with .name attribute
"""
mock_file = Mock()
mock_file.name = filename
return mock_file
# ============================================================================
# Settings DataFrame Fixtures
# ============================================================================
@pytest.fixture
def sample_settings_df():
"""Sample settings DataFrame with 3 slides."""
return pd.DataFrame(
{
"Slide": ["slide1.svs", "slide2.svs", "slide3.svs"],
"Site Type": ["Primary", "Metastatic", "Primary"],
"Sex": ["Unknown", "Female", "Male"],
"Tissue Site": ["Lung", "Liver", "Unknown"],
"Cancer Subtype": ["Unknown", "Lung Adenocarcinoma (LUAD)", "Unknown"],
"IHC Subtype": ["", "", ""],
"Segmentation Config": ["Biopsy", "Resection", "TCGA"],
}
)
def create_settings_df(n_rows, **kwargs):
"""Generate a test settings DataFrame with specified number of rows.
Args:
n_rows: Number of rows to generate
**kwargs: Column overrides (e.g., site_type="Metastatic")
Returns:
DataFrame with SETTINGS_COLUMNS
"""
defaults = {
"Slide": [f"slide_{i}.svs" for i in range(1, n_rows + 1)],
"Site Type": ["Primary"] * n_rows,
"Sex": ["Unknown"] * n_rows,
"Tissue Site": ["Unknown"] * n_rows,
"Cancer Subtype": ["Unknown"] * n_rows,
"IHC Subtype": [""] * n_rows,
"Segmentation Config": ["Biopsy"] * n_rows,
}
# Override with any provided kwargs
for key, value in kwargs.items():
column_name = key.replace("_", " ").title()
if column_name in defaults:
if isinstance(value, list):
defaults[column_name] = value
else:
defaults[column_name] = [value] * n_rows
return pd.DataFrame(defaults)
# ============================================================================
# CSV File Fixtures
# ============================================================================
@pytest.fixture
def sample_csv_valid():
"""Temporary CSV file with valid settings."""
with tempfile.NamedTemporaryFile(mode="w", suffix=".csv", delete=False) as f:
f.write(
"Slide,Site Type,Sex,Tissue Site,Cancer Subtype,IHC Subtype,Segmentation Config\n"
)
f.write("slide1.svs,Primary,Unknown,Lung,Unknown,,Biopsy\n")
f.write(
"slide2.svs,Metastatic,Female,Liver,Lung Adenocarcinoma (LUAD),,Resection\n"
)
f.write("slide3.svs,Primary,Male,Unknown,Unknown,,TCGA\n")
f.flush()
yield f.name
Path(f.name).unlink(missing_ok=True)
@pytest.fixture
def sample_csv_invalid():
"""Temporary CSV file with invalid values (for validation testing)."""
with tempfile.NamedTemporaryFile(mode="w", suffix=".csv", delete=False) as f:
f.write(
"Slide,Site Type,Sex,Tissue Site,Cancer Subtype,IHC Subtype,Segmentation Config\n"
)
f.write(
"slide1.svs,InvalidSite,InvalidSex,InvalidTissue,InvalidSubtype,InvalidIHC,InvalidConfig\n"
)
f.write(
"slide2.svs,Primary,Unknown,Lung,BRCA,HR+/HER2+,Biopsy\n"
) # Valid breast cancer
f.flush()
yield f.name
Path(f.name).unlink(missing_ok=True)
@pytest.fixture
def sample_csv_minimal():
"""Temporary CSV file with only required columns (missing optional columns)."""
with tempfile.NamedTemporaryFile(mode="w", suffix=".csv", delete=False) as f:
f.write("Slide,Site Type,Cancer Subtype\n")
f.write("slide1.svs,Primary,Unknown\n")
f.write("slide2.svs,Metastatic,LUAD\n")
f.flush()
yield f.name
Path(f.name).unlink(missing_ok=True)
# ============================================================================
# Cancer Subtype Mapping Fixtures
# ============================================================================
@pytest.fixture
def mock_cancer_subtype_maps():
"""Mock cancer subtype mappings for testing."""
cancer_subtype_name_map = {
"Unknown": "UNK",
"Lung Adenocarcinoma (LUAD)": "LUAD",
"Breast Invasive Carcinoma (BRCA)": "BRCA",
"Colorectal Adenocarcinoma (COAD)": "COAD",
"Prostate Adenocarcinoma (PRAD)": "PRAD",
}
reversed_cancer_subtype_name_map = {
"UNK": "Unknown",
"LUAD": "Lung Adenocarcinoma (LUAD)",
"BRCA": "Breast Invasive Carcinoma (BRCA)",
"COAD": "Colorectal Adenocarcinoma (COAD)",
"PRAD": "Prostate Adenocarcinoma (PRAD)",
}
cancer_subtypes = ["LUAD", "BRCA", "COAD", "PRAD"]
return cancer_subtype_name_map, reversed_cancer_subtype_name_map, cancer_subtypes
# ============================================================================
# Mock Analysis Results Fixtures
# ============================================================================
@pytest.fixture
def mock_analyze_slide_results():
"""Mock results from analyze_slide function."""
# Create a simple test mask image
mask = Image.new("RGB", (100, 100), color="red")
# Create Aeon results DataFrame
aeon_results = pd.DataFrame(
{
"Cancer Subtype": ["LUAD"],
"Confidence": [0.95],
}
)
# Create Paladin results DataFrame (NOTE: No "Slide" column - that gets added by CLI/UI)
paladin_results = pd.DataFrame(
{
"Cancer Subtype": ["LUAD", "LUAD", "LUAD"],
"Biomarker": ["TP53", "KRAS", "EGFR"],
"Score": [0.85, 0.72, 0.63],
}
)
return (mask, aeon_results, paladin_results)
@pytest.fixture
def mock_model_cache():
"""Mock ModelCache with test models."""
from unittest.mock import Mock
cache = Mock()
cache.ctranspath_model = Mock()
cache.optimus_model = Mock()
cache.marker_classifier = Mock()
cache.aeon_model = Mock()
cache.paladin_models = {}
cache.device = Mock()
cache.cleanup = Mock()
return cache
# ============================================================================
# CLI Argument Fixtures
# ============================================================================
@pytest.fixture
def cli_args_single():
"""Mock argparse Namespace for single-slide mode."""
from argparse import Namespace
return Namespace(
debug=False,
server_name="0.0.0.0",
server_port=None,
share=False,
slide_path="tests/testdata/948176.svs",
slide_csv=None,
output_dir="test_output",
site_type="Primary",
sex="Unknown",
tissue_site="Unknown",
cancer_subtype="Unknown",
ihc_subtype="",
segmentation_config="Biopsy",
num_workers=4,
)
@pytest.fixture
def cli_args_batch(sample_csv_valid):
"""Mock argparse Namespace for batch mode."""
from argparse import Namespace
return Namespace(
debug=False,
server_name="0.0.0.0",
server_port=None,
share=False,
slide_path=None,
slide_csv=sample_csv_valid,
output_dir="test_output",
site_type="Primary",
sex="Unknown",
tissue_site="Unknown",
cancer_subtype="Unknown",
ihc_subtype="",
segmentation_config="Biopsy",
num_workers=4,
)
# ============================================================================
# Utility Functions
# ============================================================================
def verify_csv_output(path, expected_columns):
"""Validate CSV file structure.
Args:
path: Path to CSV file
expected_columns: List of expected column names
Returns:
DataFrame loaded from CSV
Raises:
AssertionError: If CSV is invalid or missing columns
"""
assert Path(path).exists(), f"CSV file not found: {path}"
df = pd.read_csv(path)
assert not df.empty, f"CSV file is empty: {path}"
missing_cols = set(expected_columns) - set(df.columns)
assert not missing_cols, f"Missing columns in CSV: {missing_cols}"
return df
def mock_gradio_components():
"""Context manager to mock Gradio component classes.
Usage:
with mock_gradio_components() as mocks:
# Gradio components are mocked
result = function_that_returns_gr_components()
# Verify mocks
assert mocks['Dataframe'].called
"""
from unittest.mock import patch, Mock
mocks = {
"Dataframe": Mock(return_value=Mock()),
"File": Mock(return_value=Mock()),
"DownloadButton": Mock(return_value=Mock()),
"Dropdown": Mock(return_value=Mock()),
"Gallery": Mock(return_value=Mock()),
"Error": Exception, # gr.Error is an exception
"Warning": Mock(),
}
patches = []
for name, mock_obj in mocks.items():
patch_obj = patch(f"mosaic.ui.app.gr.{name}", mock_obj)
patches.append(patch_obj)
# Start all patches
for p in patches:
p.start()
try:
yield mocks
finally:
# Stop all patches
for p in patches:
p.stop()