Spaces:

Boopster
/

reachy_mini_minder

Running

App Files Files Community

reachy_mini_minder / tests /test_pattern_detector.py

Boopster

feat: Implement pattern detection and integrate graph query engine with session insights and new tools.

2880ca9 3 days ago

raw

history blame contribute delete

9.05 kB

	"""Tests for the PatternDetector and Insight formatting."""

	import pytest
	from unittest.mock import MagicMock

	from reachy_mini_conversation_app.pattern_detector import (
	PatternDetector,
	Insight,
	format_insights_for_prompt,
	)


	class TestInsight:
	"""Test the Insight dataclass."""

	def test_to_dict(self):
	insight = Insight(
	pattern_type="correlation",
	summary="Test summary",
	detail="Test detail",
	confidence=0.75,
	entities=["med1", "headache"],
	period_days=30,
	)
	d = insight.to_dict()
	assert d["pattern_type"] == "correlation"
	assert d["confidence"] == 0.75
	assert "med1" in d["entities"]

	def test_default_entities_and_period(self):
	insight = Insight(
	pattern_type="test",
	summary="s",
	detail="d",
	confidence=0.5,
	)
	assert insight.entities == []
	assert insight.period_days == 30


	class TestFormatInsightsForPrompt:
	"""Test formatting insights for system prompt injection."""

	def test_empty_insights_returns_empty(self):
	assert format_insights_for_prompt([]) == ""

	def test_single_insight_format(self):
	insights = [
	Insight(
	pattern_type="correlation",
	summary="Headache appeared on 5 days.",
	detail="detail",
	confidence=0.8,
	)
	]
	result = format_insights_for_prompt(insights)
	assert "Recent Health Insights" in result
	assert "Correlation" in result
	assert "80%" in result
	assert "Headache appeared on 5 days." in result

	def test_multiple_insights_numbered(self):
	insights = [
	Insight(
	pattern_type="correlation", summary="s1", detail="d1", confidence=0.9
	),
	Insight(
	pattern_type="frequency_change",
	summary="s2",
	detail="d2",
	confidence=0.7,
	),
	]
	result = format_insights_for_prompt(insights)
	assert "1." in result
	assert "2." in result

	def test_observational_language_guidance(self):
	"""Prompt should instruct the model to use observational language."""
	insights = [
	Insight(pattern_type="test", summary="s", detail="d", confidence=0.5),
	]
	result = format_insights_for_prompt(insights)
	assert "observational" in result.lower() or "I noticed" in result


	class TestPatternDetectorRunAnalysis:
	"""Test the run_analysis orchestration."""

	def test_returns_empty_when_disconnected(self):
	mock_graph = MagicMock()
	mock_graph.is_connected = False

	detector = PatternDetector(mock_graph)
	insights = detector.run_analysis("Elena", days=30)
	assert insights == []

	def test_returns_empty_when_no_graph(self):
	detector = PatternDetector(None)
	insights = detector.run_analysis("Elena", days=30)
	assert insights == []

	def test_continues_on_individual_detector_failure(self):
	"""If one detector fails, the others should still run."""
	mock_graph = MagicMock()
	mock_graph.is_connected = True
	# execute_read will raise on first call, return empty on subsequent
	mock_graph.execute_read.side_effect = [
	Exception("Neo4j error"), # medication_symptom_correlation
	[], # frequency_changes headache
	[], # frequency_changes migraine
	[], # frequency_changes confusion
	[], # missed_medication_impact
	[], # temporal_patterns
	]

	detector = PatternDetector(mock_graph)
	# Should not raise, just log warnings
	insights = detector.run_analysis("Elena", days=30)
	assert isinstance(insights, list)

	def test_sorts_by_confidence_descending(self):
	"""Insights should be sorted by confidence (highest first)."""
	mock_graph = MagicMock()
	mock_graph.is_connected = True
	# Mock medication_symptom_correlation to return data
	mock_graph.execute_read.side_effect = [
	# medication_symptom_correlation
	[
	{
	"medication": "Med A",
	"symptom": "headache",
	"co_occurrence_count": 10,
	"distinct_days": 8,
	},
	{
	"medication": "Med B",
	"symptom": "fatigue",
	"co_occurrence_count": 3,
	"distinct_days": 3,
	},
	],
	# All other detectors return empty
	[],
	[],
	[],
	[],
	[],
	]

	detector = PatternDetector(mock_graph)
	insights = detector.run_analysis("Elena", days=30)

	if len(insights) >= 2:
	assert insights[0].confidence >= insights[1].confidence

	def test_caps_at_five_insights(self):
	"""Should return at most 5 insights."""
	mock_graph = MagicMock()
	mock_graph.is_connected = True
	# Return lots of correlations
	mock_graph.execute_read.side_effect = [
	[
	{
	"medication": f"Med{i}",
	"symptom": f"sym{i}",
	"co_occurrence_count": 5,
	"distinct_days": 5,
	}
	for i in range(10)
	],
	[],
	[],
	[],
	[],
	[],
	]

	detector = PatternDetector(mock_graph)
	insights = detector.run_analysis("Elena", days=30)
	assert len(insights) <= 5


	class TestPatternDetectorInsightLanguage:
	"""Verify insights never use causal language."""

	def test_correlation_summary_is_neutral(self):
	mock_graph = MagicMock()
	mock_graph.is_connected = True
	mock_graph.execute_read.side_effect = [
	[
	{
	"medication": "Topiramate",
	"symptom": "headache",
	"co_occurrence_count": 5,
	"distinct_days": 5,
	}
	],
	[],
	[],
	[],
	[],
	[],
	]

	detector = PatternDetector(mock_graph)
	insights = detector.run_analysis("Elena", days=30)

	for insight in insights:
	summary_lower = insight.summary.lower()
	assert (
	"caused" not in summary_lower
	), f"Causal language in: {insight.summary}"
	assert (
	"triggered" not in summary_lower
	), f"Causal language in: {insight.summary}"
	assert (
	"because" not in summary_lower
	), f"Causal language in: {insight.summary}"


	class TestPatternDetectorFrequencyChanges:
	"""Test the frequency change detector."""

	def test_detects_increase(self):
	mock_graph = MagicMock()
	mock_graph.is_connected = True
	mock_graph.execute_read.return_value = [
	{"period": "prior", "event_count": 2},
	{"period": "recent", "event_count": 6},
	]

	detector = PatternDetector(mock_graph)
	insights = detector.detect_frequency_changes("Elena", "headache", days=30)

	assert len(insights) == 1
	assert "increased" in insights[0].summary.lower()

	def test_detects_decrease(self):
	mock_graph = MagicMock()
	mock_graph.is_connected = True
	mock_graph.execute_read.return_value = [
	{"period": "prior", "event_count": 10},
	{"period": "recent", "event_count": 3},
	]

	detector = PatternDetector(mock_graph)
	insights = detector.detect_frequency_changes("Elena", "headache", days=30)

	assert len(insights) == 1
	assert "decreased" in insights[0].summary.lower()

	def test_ignores_small_changes(self):
	"""Changes under 25% should not generate insights."""
	mock_graph = MagicMock()
	mock_graph.is_connected = True
	mock_graph.execute_read.return_value = [
	{"period": "prior", "event_count": 10},
	{"period": "recent", "event_count": 11},
	]

	detector = PatternDetector(mock_graph)
	insights = detector.detect_frequency_changes("Elena", "headache", days=30)
	assert len(insights) == 0

	def test_handles_insufficient_data(self):
	"""Should return nothing with fewer than MIN_SAMPLE_SIZE events."""
	mock_graph = MagicMock()
	mock_graph.is_connected = True
	mock_graph.execute_read.return_value = [
	{"period": "recent", "event_count": 1},
	]

	detector = PatternDetector(mock_graph)
	insights = detector.detect_frequency_changes("Elena", "headache", days=30)
	assert len(insights) == 0