Spaces:

MapoTofu9
/

why-agent

Sleeping

App Files Files Community

why-agent / tests /test_tools.py

MapoTofu9

deploy: HF Spaces

5d30bdc about 2 months ago

Raw

History Blame Contribute Delete

36 kB

	"""Smoke tests for agent/tools/schemas.py, run_sql.py, and inspect_schema.py.

	Tests verify shape and error-handling behaviour. Real in-memory DuckDB is used
	for run_sql; inspect_schema tests use a minimal in-memory YAML fixture.
	"""

	import duckdb
	import pytest

	from agent.tools.compare_periods import compare_periods
	from agent.tools.decompose_metric import decompose_metric
	from agent.tools.inspect_schema import inspect_schema
	from agent.tools.run_sql import build_connection, run_sql
	from agent.tools.schemas import (
	ComparePeriodsInput,
	DecomposeMetricInput,
	InspectSchemaInput,
	RunSqlInput,
	RunSqlOutput,
	TimeWindow,
	)

	# ---------------------------------------------------------------------------
	# Shared YAML fixture for inspect_schema tests
	# ---------------------------------------------------------------------------

	_MINIMAL_YAML = """\
	tables:
	items:
	file: items.parquet
	grain: "One row per item."
	description: "Grocery catalog."
	columns:
	id:
	type: BIGINT
	description: "Primary key."
	price:
	type: DOUBLE
	description: "Price in USD."
	joins:
	- "items.id = item_nutrition.item_id"
	orders:
	file: orders.parquet
	grain: "One row per order."
	description: "Order records."
	columns:
	id:
	type: BIGINT
	description: "Order ID."

	metrics:
	avg_price:
	description: "Mean price."
	sql: "SELECT AVG(price) AS value FROM items"
	time_column: null
	order_count:
	description: "Number of orders."
	sql: "SELECT COUNT(*) FROM orders"
	time_column: orders.created_at

	dimensions:
	store:
	description: "Store name."
	sql: "items.store"
	cardinality: 2

	joins:
	- name: items_to_orders
	left: items.id
	right: orders.item_id
	join_kind: inner
	notes: "Each order references one item."
	"""


	@pytest.fixture
	def sl_path(tmp_path: pytest.TempPathFactory) -> str:
	"""Write the minimal YAML to a temp file; return its path as a string."""
	p = tmp_path / "semantic_layer.yml"
	p.write_text(_MINIMAL_YAML)
	return str(p)


	# ---------------------------------------------------------------------------
	# compare_periods fixtures
	# ---------------------------------------------------------------------------

	_CP_YAML = """\
	tables:
	events:
	file: events.parquet
	grain: "One row per event."
	description: "Timestamped events with amounts."
	columns:
	ts:
	type: TIMESTAMP
	description: "Event time."
	amount:
	type: DOUBLE
	description: "Amount."
	category:
	type: VARCHAR
	description: "Category label."

	metrics:
	static_total:
	description: "Total amount across all events (static, no time filter)."
	sql: "SELECT SUM(amount) AS value FROM events"
	time_column: null

	windowed_count:
	description: "Count of events in a time window."
	sql: \|
	SELECT COUNT(*) AS value FROM events
	WHERE ts >= :start AND ts < :end
	time_column: events.ts

	windowed_sum:
	description: "Sum of amounts in a time window."
	sql: \|
	SELECT COALESCE(SUM(amount), 0.0) AS value FROM events
	WHERE ts >= :start AND ts < :end
	time_column: events.ts

	dimensions:
	category:
	description: "Event category."
	sql: "events.category"
	cardinality: 2
	"""


	@pytest.fixture
	def sl_cp(tmp_path: pytest.TempPathFactory) -> str:
	p = tmp_path / "cp_layer.yml"
	p.write_text(_CP_YAML)
	return str(p)


	@pytest.fixture
	def conn_cp() -> duckdb.DuckDBPyConnection:
	"""In-memory DuckDB with 4 events: 1 in Jan 2026, 3 in Feb 2026."""
	c = duckdb.connect()
	c.execute("""
	CREATE TABLE events AS SELECT * FROM (VALUES
	(TIMESTAMP '2026-01-10 00:00:00', 10.0, 'A'),
	(TIMESTAMP '2026-02-05 00:00:00', 20.0, 'B'),
	(TIMESTAMP '2026-02-10 00:00:00', 30.0, 'A'),
	(TIMESTAMP '2026-02-20 00:00:00', 40.0, 'B')
	) t(ts, amount, category)
	""")
	return c


	# ---------------------------------------------------------------------------
	# Fixtures
	# ---------------------------------------------------------------------------


	@pytest.fixture
	def conn() -> duckdb.DuckDBPyConnection:
	"""In-memory DuckDB with a small products table."""
	c = duckdb.connect()
	c.execute("""
	CREATE TABLE products AS
	SELECT * FROM (VALUES
	(1, 'Apple', 1.50, 'Fruit'),
	(2, 'Banana', 0.75, 'Fruit'),
	(3, 'Milk', 3.20, 'Dairy'),
	(4, 'Cheese', 8.99, 'Dairy'),
	(5, 'Bread', 2.50, 'Bakery')
	) t(id, name, price, category)
	""")
	return c


	# ---------------------------------------------------------------------------
	# RunSqlInput schema
	# ---------------------------------------------------------------------------


	class TestRunSqlInput:
	def test_valid_input(self) -> None:
	inp = RunSqlInput(query="SELECT 1", max_rows=50)
	assert inp.query == "SELECT 1"
	assert inp.max_rows == 50

	def test_default_max_rows(self) -> None:
	inp = RunSqlInput(query="SELECT 1")
	assert inp.max_rows == 100

	def test_max_rows_lower_bound_rejected(self) -> None:
	with pytest.raises(Exception):
	RunSqlInput(query="SELECT 1", max_rows=0)

	def test_max_rows_upper_bound_rejected(self) -> None:
	with pytest.raises(Exception):
	RunSqlInput(query="SELECT 1", max_rows=1001)


	# ---------------------------------------------------------------------------
	# RunSqlOutput schema
	# ---------------------------------------------------------------------------


	class TestRunSqlOutput:
	def test_success_output_has_no_error(self) -> None:
	out = RunSqlOutput(rows=[{"id": 1}], truncated=False, row_count=1, execution_ms=5.2)
	assert out.error is None
	assert out.hint is None

	def test_error_output_carries_hint(self) -> None:
	out = RunSqlOutput(
	rows=[],
	truncated=False,
	row_count=0,
	execution_ms=0.0,
	error="bad query",
	hint="check column names",
	)
	assert out.error == "bad query"
	assert out.hint == "check column names"


	# ---------------------------------------------------------------------------
	# TimeWindow schema
	# ---------------------------------------------------------------------------


	class TestTimeWindow:
	def test_valid_window(self) -> None:
	w = TimeWindow(start="2026-01-01", end="2026-02-01")
	assert w.start == "2026-01-01"
	assert w.end == "2026-02-01"

	def test_rejects_non_iso_string(self) -> None:
	with pytest.raises(Exception, match="ISO date"):
	TimeWindow(start="tomorrow", end="2026-02-01")

	def test_rejects_invalid_date(self) -> None:
	with pytest.raises(Exception):
	TimeWindow(start="2026-13-01", end="2026-02-01")


	# ---------------------------------------------------------------------------
	# InspectSchemaInput schema
	# ---------------------------------------------------------------------------


	class TestInspectSchemaInput:
	def test_defaults_to_no_table(self) -> None:
	assert InspectSchemaInput().table is None

	def test_accepts_table_name(self) -> None:
	assert InspectSchemaInput(table="items").table == "items"


	# ---------------------------------------------------------------------------
	# ComparePeriodsInput schema
	# ---------------------------------------------------------------------------


	class TestComparePeriodsInput:
	def test_valid_without_segment(self) -> None:
	inp = ComparePeriodsInput(
	metric="avg_price",
	before=TimeWindow(start="2026-01-01", end="2026-02-01"),
	after=TimeWindow(start="2026-02-01", end="2026-03-01"),
	)
	assert inp.segment is None

	def test_valid_with_segment(self) -> None:
	inp = ComparePeriodsInput(
	metric="avg_price",
	before=TimeWindow(start="2026-01-01", end="2026-02-01"),
	after=TimeWindow(start="2026-02-01", end="2026-03-01"),
	segment={"store": "WHOLE_FOODS"},
	)
	assert inp.segment == {"store": "WHOLE_FOODS"}


	# ---------------------------------------------------------------------------
	# DecomposeMetricInput schema
	# ---------------------------------------------------------------------------


	class TestDecomposeMetricInput:
	def test_valid_input(self) -> None:
	inp = DecomposeMetricInput(
	metric="avg_price",
	dimensions=["store", "category"],
	time_window=TimeWindow(start="2026-01-01", end="2026-04-01"),
	)
	assert len(inp.dimensions) == 2


	# ---------------------------------------------------------------------------
	# run_sql behaviour
	# ---------------------------------------------------------------------------


	class TestRunSql:
	def test_returns_expected_shape(self, conn: duckdb.DuckDBPyConnection) -> None:
	result = run_sql(RunSqlInput(query="SELECT id, name FROM products"), conn)

	assert isinstance(result, RunSqlOutput)
	assert result.error is None
	assert result.row_count == 5
	assert result.truncated is False
	assert result.execution_ms >= 0
	assert "id" in result.rows[0]
	assert "name" in result.rows[0]

	def test_truncation_at_max_rows(self, conn: duckdb.DuckDBPyConnection) -> None:
	result = run_sql(RunSqlInput(query="SELECT * FROM products", max_rows=3), conn)

	assert result.truncated is True
	assert result.row_count == 3
	assert len(result.rows) == 3

	def test_no_truncation_when_rows_fit(self, conn: duckdb.DuckDBPyConnection) -> None:
	result = run_sql(RunSqlInput(query="SELECT * FROM products", max_rows=100), conn)

	assert result.truncated is False

	def test_rejects_drop(self, conn: duckdb.DuckDBPyConnection) -> None:
	result = run_sql(RunSqlInput(query="DROP TABLE products"), conn)

	assert result.error is not None
	assert result.hint is not None
	assert result.row_count == 0

	def test_rejects_insert(self, conn: duckdb.DuckDBPyConnection) -> None:
	result = run_sql(RunSqlInput(query="INSERT INTO products VALUES (6, 'X', 1.0, 'Y')"), conn)

	assert result.error is not None

	def test_with_cte(self, conn: duckdb.DuckDBPyConnection) -> None:
	result = run_sql(
	RunSqlInput(
	query="WITH cheap AS (SELECT * FROM products WHERE price < 2) SELECT * FROM cheap"
	),
	conn,
	)

	assert result.error is None
	assert result.row_count == 2 # Apple (1.50) and Banana (0.75)

	def test_allows_leading_line_comments_before_select(
	self, conn: duckdb.DuckDBPyConnection
	) -> None:
	result = run_sql(
	RunSqlInput(
	query="-- check cheap products\nSELECT id, name FROM products WHERE price < 2"
	),
	conn,
	)

	assert result.error is None
	assert result.row_count == 2

	def test_allows_leading_block_comments_before_with(
	self, conn: duckdb.DuckDBPyConnection
	) -> None:
	result = run_sql(
	RunSqlInput(
	query=(
	"/* build a small subset */\n"
	"WITH cheap AS (SELECT * FROM products WHERE price < 2) SELECT * FROM cheap"
	)
	),
	conn,
	)

	assert result.error is None
	assert result.row_count == 2

	def test_rejects_write_statement_after_leading_comment(
	self, conn: duckdb.DuckDBPyConnection
	) -> None:
	result = run_sql(RunSqlInput(query="-- not actually safe\nDROP TABLE products"), conn)

	assert result.error is not None
	assert result.row_count == 0

	def test_bad_table_returns_error_dict(self, conn: duckdb.DuckDBPyConnection) -> None:
	result = run_sql(RunSqlInput(query="SELECT * FROM nonexistent"), conn)

	assert result.error is not None
	assert result.hint is not None
	assert result.rows == []

	def test_execution_ms_non_negative(self, conn: duckdb.DuckDBPyConnection) -> None:
	result = run_sql(RunSqlInput(query="SELECT 1"), conn)

	assert result.execution_ms >= 0

	def test_rows_are_dicts_with_correct_values(self, conn: duckdb.DuckDBPyConnection) -> None:
	result = run_sql(RunSqlInput(query="SELECT id, price FROM products WHERE id = 1"), conn)

	assert len(result.rows) == 1
	assert result.rows[0]["id"] == 1
	assert result.rows[0]["price"] == pytest.approx(1.50)

	def test_rejects_semicolon_injection(self, conn: duckdb.DuckDBPyConnection) -> None:
	result = run_sql(
	RunSqlInput(query="WITH x AS (SELECT 1) SELECT * FROM x; DROP TABLE products"),
	conn,
	)

	assert result.error is not None

	def test_no_conn_uses_parquet_dir(self, tmp_path: pytest.TempPathFactory) -> None:
	# Write a tiny parquet file, point build_connection at it, run a query.
	import pyarrow as pa
	import pyarrow.parquet as pq

	table = pa.table({"id": [1, 2], "val": ["a", "b"]})
	pq.write_table(table, tmp_path / "things.parquet")

	conn = build_connection(str(tmp_path))
	result = run_sql(RunSqlInput(query="SELECT COUNT(*) AS n FROM things"), conn)

	assert result.error is None
	assert result.rows[0]["n"] == 2


	# ---------------------------------------------------------------------------
	# inspect_schema behaviour
	# ---------------------------------------------------------------------------


	class TestInspectSchema:
	def test_list_all_returns_tables_metrics_dimensions(self, sl_path: str) -> None:
	result = inspect_schema(InspectSchemaInput(), sl_path)

	assert result.error is None
	assert result.tables is not None
	assert result.metrics is not None
	assert result.dimensions is not None
	assert result.table is None

	def test_list_all_table_names(self, sl_path: str) -> None:
	result = inspect_schema(InspectSchemaInput(), sl_path)

	assert set(result.tables) == {"items", "orders"}

	def test_list_all_metric_names(self, sl_path: str) -> None:
	result = inspect_schema(InspectSchemaInput(), sl_path)

	assert set(result.metrics) == {"avg_price", "order_count"}

	def test_list_all_dimension_names(self, sl_path: str) -> None:
	result = inspect_schema(InspectSchemaInput(), sl_path)

	assert result.dimensions == ["store"]

	def test_describe_table_returns_summary(self, sl_path: str) -> None:
	result = inspect_schema(InspectSchemaInput(table="items"), sl_path)

	assert result.error is None
	assert result.table is not None
	assert result.table.name == "items"
	assert result.table.description == "Grocery catalog."
	assert result.table.grain == "One row per item."
	assert result.tables is None
	assert result.metrics is None

	def test_describe_table_columns_shape(self, sl_path: str) -> None:
	result = inspect_schema(InspectSchemaInput(table="items"), sl_path)

	cols = result.table.columns
	assert len(cols) == 2
	assert cols[0].name == "id"
	assert cols[0].type == "BIGINT"
	assert cols[1].name == "price"

	def test_describe_table_joins(self, sl_path: str) -> None:
	result = inspect_schema(InspectSchemaInput(table="items"), sl_path)

	assert result.table.joins == ["items.id = item_nutrition.item_id"]

	def test_table_with_no_joins(self, sl_path: str) -> None:
	result = inspect_schema(InspectSchemaInput(table="orders"), sl_path)

	assert result.table.joins == []

	def test_unknown_table_returns_error(self, sl_path: str) -> None:
	result = inspect_schema(InspectSchemaInput(table="nonexistent"), sl_path)

	assert result.error is not None
	assert result.hint is not None
	assert "nonexistent" in result.error

	def test_missing_yaml_returns_error(self, tmp_path: pytest.TempPathFactory) -> None:
	result = inspect_schema(InspectSchemaInput(), str(tmp_path / "missing.yml"))

	assert result.error is not None
	assert result.hint is not None

	def test_null_yaml_values_do_not_raise(self, tmp_path: pytest.TempPathFactory) -> None:
	# `tables: null` in YAML — must not crash with AttributeError on .keys()
	p = tmp_path / "null.yml"
	p.write_text("tables:\nmetrics:\ndimensions:\n")
	result = inspect_schema(InspectSchemaInput(), str(p))

	assert result.error is None
	assert result.tables == []
	assert result.metrics == []
	assert result.dimensions == []

	def test_malformed_column_returns_error(self, tmp_path: pytest.TempPathFactory) -> None:
	# Column entry missing 'type' — must return {error, hint}, not raise
	p = tmp_path / "bad.yml"
	p.write_text(
	"tables:\n t:\n grain: g\n description: d\n columns:\n - name: x\n"
	)
	result = inspect_schema(InspectSchemaInput(table="t"), str(p))

	assert result.error is not None
	assert result.hint is not None

	def test_env_var_default_path(self, sl_path: str, monkeypatch: pytest.MonkeyPatch) -> None:
	monkeypatch.setenv("SEMANTIC_LAYER_PATH", sl_path)
	result = inspect_schema(InspectSchemaInput()) # no path arg — uses env var

	assert result.error is None
	assert "items" in result.tables

	def test_catalog_includes_joins(self, sl_path: str) -> None:
	result = inspect_schema(InspectSchemaInput(), sl_path)

	assert result.joins is not None
	assert len(result.joins) == 1
	j = result.joins[0]
	assert j.left_col == "items.id"
	assert j.right_col == "orders.item_id"
	assert j.join_kind == "INNER"
	assert "INNER JOIN" in j.sql
	assert "items.id" in j.sql
	assert "orders.item_id" in j.sql

	def test_catalog_no_joins_returns_empty_list(self, tmp_path) -> None:
	p = tmp_path / "nojoin.yml"
	p.write_text("tables:\nmetrics:\ndimensions:\n")
	result = inspect_schema(InspectSchemaInput(), str(p))

	assert result.joins == []

	def test_table_lookup_does_not_include_joins_field(self, sl_path: str) -> None:
	# joins are only in the catalog response, not per-table responses
	result = inspect_schema(InspectSchemaInput(table="items"), sl_path)

	assert result.joins is None

	def test_malformed_join_missing_left_is_skipped(self, tmp_path) -> None:
	p = tmp_path / "badjoin.yml"
	p.write_text(
	"tables:\nmetrics:\ndimensions:\n"
	"joins:\n - name: bad\n right: orders.item_id\n join_kind: inner\n"
	)
	result = inspect_schema(InspectSchemaInput(), str(p))

	assert result.joins == []

	def test_malformed_join_unqualified_right_is_skipped(self, tmp_path) -> None:
	p = tmp_path / "badjoin2.yml"
	p.write_text(
	"tables:\nmetrics:\ndimensions:\n"
	"joins:\n - name: bad\n left: items.id\n right: item_id\n join_kind: inner\n"
	)
	result = inspect_schema(InspectSchemaInput(), str(p))

	assert result.joins == []

	def test_catalog_includes_gotchas_for_critical_and_high(self, tmp_path) -> None:
	p = tmp_path / "gotchas.yml"
	p.write_text(
	"tables:\nmetrics:\ndimensions:\n"
	"gotchas:\n"
	" - name: watch_nulls\n severity: critical\n description: Always IS NOT TRUE.\n"
	" - name: medium_note\n severity: medium\n description: Less important.\n"
	)
	result = inspect_schema(InspectSchemaInput(), str(p))

	assert result.gotchas is not None
	# 1 YAML gotcha + 3 hardcoded SQL correctness rules
	assert len(result.gotchas) == 4
	yaml_gotcha = result.gotchas[0]
	assert "CRITICAL" in yaml_gotcha
	assert "watch_nulls" in yaml_gotcha

	def test_catalog_no_gotchas_returns_none(self, sl_path: str) -> None:
	# No YAML gotchas, but hardcoded SQL rules are always included
	result = inspect_schema(InspectSchemaInput(), sl_path)

	assert result.gotchas is not None
	assert all("sql_" in g for g in result.gotchas)

	def test_catalog_includes_dimension_notes(self, tmp_path) -> None:
	p = tmp_path / "dimnotes.yml"
	p.write_text(
	"tables:\nmetrics:\n"
	"dimensions:\n"
	" key_dim:\n"
	" description: The most important dimension.\n"
	" primary_for_demo: true\n"
	" notes: Always check this first.\n"
	" plain_dim:\n"
	" description: Just a regular dim.\n"
	)
	result = inspect_schema(InspectSchemaInput(), str(p))

	assert result.dimension_notes is not None
	assert "key_dim" in result.dimension_notes
	assert "PRIMARY DEMO DIMENSION" in result.dimension_notes["key_dim"]
	assert "plain_dim" in result.dimension_notes

	def test_derived_dimension_sql_included_in_notes(self, tmp_path) -> None:
	p = tmp_path / "derived.yml"
	p.write_text(
	"tables:\nmetrics:\n"
	"dimensions:\n"
	" is_holiday_window:\n"
	" derived: true\n"
	" description: Is the message within 3 days of a holiday?\n"
	' sql: "messages.date BETWEEN holidays.date - INTERVAL 3 DAY AND holidays.date"\n'
	" notes: Requires LEFT JOIN to holidays.\n"
	)
	result = inspect_schema(InspectSchemaInput(), str(p))

	assert result.dimension_notes is not None
	notes = result.dimension_notes["is_holiday_window"]
	assert "messages.date BETWEEN holidays.date" in notes
	assert "SQL:" in notes

	def test_non_derived_dimension_has_no_sql_label(self, tmp_path) -> None:
	p = tmp_path / "nonderived.yml"
	p.write_text(
	"tables:\nmetrics:\n"
	"dimensions:\n"
	" channel:\n"
	" description: Email or push channel.\n"
	" sql: messages.channel\n"
	)
	result = inspect_schema(InspectSchemaInput(), str(p))

	assert result.dimension_notes is not None
	# non-derived dimension should not expose raw SQL expression in notes
	assert "SQL:" not in (result.dimension_notes.get("channel") or "")

	def test_derived_dimension_without_sql_field_no_crash(self, tmp_path) -> None:
	p = tmp_path / "derived_nosql.yml"
	p.write_text(
	"tables:\nmetrics:\n"
	"dimensions:\n"
	" computed_flag:\n"
	" derived: true\n"
	" description: Some derived flag with no sql yet.\n"
	)
	result = inspect_schema(InspectSchemaInput(), str(p))

	assert result.error is None
	assert result.dimension_notes is not None
	assert "computed_flag" in result.dimension_notes
	assert "SQL:" not in result.dimension_notes["computed_flag"]

	def test_derived_dimension_sql_on_real_layer(self) -> None:
	import pathlib

	result = inspect_schema(
	InspectSchemaInput(),
	str(pathlib.Path(__file__).parent.parent / "data" / "semantic_layer_6w.yml"),
	)

	assert result.dimension_notes is not None
	notes = result.dimension_notes.get("is_holiday_window", "")
	assert "SQL:" in notes
	assert "holidays.date" in notes


	# ---------------------------------------------------------------------------
	# compare_periods behaviour
	# ---------------------------------------------------------------------------

	_JAN = TimeWindow(start="2026-01-01", end="2026-02-01")
	_FEB = TimeWindow(start="2026-02-01", end="2026-03-01")
	_EMPTY = TimeWindow(start="2025-01-01", end="2025-02-01")


	class TestComparePeriods:
	def test_static_metric_no_time_column_returns_error(
	self, conn_cp: duckdb.DuckDBPyConnection, sl_cp: str
	) -> None:
	# static_total has time_column: null — compare_periods must reject it
	# rather than silently returning the same global value for both windows.
	result = compare_periods(
	ComparePeriodsInput(metric="static_total", before=_JAN, after=_FEB), conn_cp, sl_cp
	)

	assert result.error is not None
	assert result.hint is not None
	assert "time_column" in result.error
	assert result.abs_delta is None
	assert result.before_value is None

	def test_windowed_count_positive_delta(
	self, conn_cp: duckdb.DuckDBPyConnection, sl_cp: str
	) -> None:
	# Jan: 1 event, Feb: 3 events → delta = +2
	result = compare_periods(
	ComparePeriodsInput(metric="windowed_count", before=_JAN, after=_FEB), conn_cp, sl_cp
	)

	assert result.error is None
	assert result.before_value == pytest.approx(1.0)
	assert result.after_value == pytest.approx(3.0)
	assert result.abs_delta == pytest.approx(2.0)
	assert result.pct_delta == pytest.approx(200.0)

	def test_windowed_sum_positive_delta(
	self, conn_cp: duckdb.DuckDBPyConnection, sl_cp: str
	) -> None:
	# Jan: 10.0, Feb: 20+30+40=90.0 → delta = +80
	result = compare_periods(
	ComparePeriodsInput(metric="windowed_sum", before=_JAN, after=_FEB), conn_cp, sl_cp
	)

	assert result.error is None
	assert result.before_value == pytest.approx(10.0)
	assert result.after_value == pytest.approx(90.0)
	assert result.abs_delta == pytest.approx(80.0)
	assert result.pct_delta == pytest.approx(800.0)

	def test_pct_delta_none_when_before_zero(
	self, conn_cp: duckdb.DuckDBPyConnection, sl_cp: str
	) -> None:
	# _EMPTY window has no events → windowed_sum = 0.0
	result = compare_periods(
	ComparePeriodsInput(metric="windowed_sum", before=_EMPTY, after=_JAN), conn_cp, sl_cp
	)

	assert result.error is None
	assert result.before_value == pytest.approx(0.0)
	assert result.pct_delta is None

	def test_output_shape_has_all_fields(
	self, conn_cp: duckdb.DuckDBPyConnection, sl_cp: str
	) -> None:
	result = compare_periods(
	ComparePeriodsInput(metric="windowed_count", before=_JAN, after=_FEB), conn_cp, sl_cp
	)

	assert hasattr(result, "before_value")
	assert hasattr(result, "after_value")
	assert hasattr(result, "abs_delta")
	assert hasattr(result, "pct_delta")

	def test_unknown_metric_returns_error(
	self, conn_cp: duckdb.DuckDBPyConnection, sl_cp: str
	) -> None:
	result = compare_periods(
	ComparePeriodsInput(metric="nonexistent", before=_JAN, after=_FEB), conn_cp, sl_cp
	)

	assert result.error is not None
	assert result.hint is not None
	assert "nonexistent" in result.error

	def test_missing_yaml_returns_error(
	self, conn_cp: duckdb.DuckDBPyConnection, tmp_path: pytest.TempPathFactory
	) -> None:
	result = compare_periods(
	ComparePeriodsInput(metric="windowed_count", before=_JAN, after=_FEB),
	conn_cp,
	str(tmp_path / "missing.yml"),
	)

	assert result.error is not None
	assert result.hint is not None

	def test_segment_filter_narrows_result(
	self, conn_cp: duckdb.DuckDBPyConnection, sl_cp: str
	) -> None:
	# Feb: category A = 1 event (30.0), category B = 2 events (20+40=60)
	result = compare_periods(
	ComparePeriodsInput(
	metric="windowed_count", before=_JAN, after=_FEB, segment={"category": "A"}
	),
	conn_cp,
	sl_cp,
	)

	assert result.error is None
	# Jan: 1 A event; Feb: 1 A event → delta = 0
	assert result.before_value == pytest.approx(1.0)
	assert result.after_value == pytest.approx(1.0)

	def test_unknown_segment_dimension_returns_error(
	self, conn_cp: duckdb.DuckDBPyConnection, sl_cp: str
	) -> None:
	result = compare_periods(
	ComparePeriodsInput(
	metric="windowed_count", before=_JAN, after=_FEB, segment={"bogus_dim": "x"}
	),
	conn_cp,
	sl_cp,
	)

	assert result.error is not None
	assert result.hint is not None


	# ---------------------------------------------------------------------------
	# decompose_metric fixtures
	# ---------------------------------------------------------------------------

	_DM_YAML = """\
	tables:
	events:
	file: events.parquet
	grain: "One row per event."
	description: "Timestamped events."
	columns:
	ts:
	type: TIMESTAMP
	description: "Event time."
	amount:
	type: DOUBLE
	description: "Amount."
	category:
	type: VARCHAR
	description: "Category."

	metrics:
	windowed_count:
	description: "Count of events in a time window."
	sql: \|
	SELECT COUNT(*) AS value FROM events
	WHERE ts >= :start AND ts < :end
	time_column: events.ts

	static_avg:
	description: "Average amount (static)."
	sql: "SELECT AVG(amount) AS value FROM events"
	time_column: null

	dimensions:
	category:
	description: "Event category."
	sql: "events.category"
	cardinality: 3
	amount_band:
	description: "Coarse amount tier."
	sql: \|
	CASE
	WHEN events.amount < 20 THEN 'low'
	ELSE 'high'
	END
	cardinality: 2
	"""

	_DM_WIN = TimeWindow(start="2026-01-01", end="2026-03-01")


	@pytest.fixture
	def sl_dm(tmp_path: pytest.TempPathFactory) -> str:
	p = tmp_path / "dm_layer.yml"
	p.write_text(_DM_YAML)
	return str(p)


	@pytest.fixture
	def conn_dm() -> duckdb.DuckDBPyConnection:
	"""In-memory DuckDB: 5 events across 3 categories (A×3, B×1, C×1)."""
	c = duckdb.connect()
	c.execute("""
	CREATE TABLE events AS SELECT * FROM (VALUES
	(TIMESTAMP '2026-01-10 00:00:00', 10.0, 'A'),
	(TIMESTAMP '2026-01-15 00:00:00', 15.0, 'A'),
	(TIMESTAMP '2026-01-20 00:00:00', 20.0, 'A'),
	(TIMESTAMP '2026-02-05 00:00:00', 30.0, 'B'),
	(TIMESTAMP '2026-02-28 00:00:00', 40.0, 'C')
	) t(ts, amount, category)
	""")
	return c


	# ---------------------------------------------------------------------------
	# decompose_metric behaviour
	# ---------------------------------------------------------------------------


	class TestDecomposeMetric:
	def test_returns_slices_list(self, conn_dm: duckdb.DuckDBPyConnection, sl_dm: str) -> None:
	result = decompose_metric(
	DecomposeMetricInput(
	metric="windowed_count", dimensions=["category"], time_window=_DM_WIN
	),
	conn_dm,
	sl_dm,
	)

	assert result.error is None
	assert isinstance(result.slices, list)
	assert len(result.slices) > 0

	def test_slice_count_matches_dimension_cardinality(
	self, conn_dm: duckdb.DuckDBPyConnection, sl_dm: str
	) -> None:
	result = decompose_metric(
	DecomposeMetricInput(
	metric="windowed_count", dimensions=["category"], time_window=_DM_WIN
	),
	conn_dm,
	sl_dm,
	)

	# 3 categories: A, B, C
	assert len(result.slices) == 3

	def test_slice_fields_populated(self, conn_dm: duckdb.DuckDBPyConnection, sl_dm: str) -> None:
	result = decompose_metric(
	DecomposeMetricInput(
	metric="windowed_count", dimensions=["category"], time_window=_DM_WIN
	),
	conn_dm,
	sl_dm,
	)

	s = result.slices[0]
	assert s.dimension == "category"
	assert s.value is not None
	assert s.metric_value is not None
	assert s.anomaly_score is not None

	def test_metric_values_correct(self, conn_dm: duckdb.DuckDBPyConnection, sl_dm: str) -> None:
	result = decompose_metric(
	DecomposeMetricInput(
	metric="windowed_count", dimensions=["category"], time_window=_DM_WIN
	),
	conn_dm,
	sl_dm,
	)

	by_val = {s.value: s.metric_value for s in result.slices}
	assert by_val["A"] == pytest.approx(3.0)
	assert by_val["B"] == pytest.approx(1.0)
	assert by_val["C"] == pytest.approx(1.0)

	def test_ranked_highest_anomaly_first(
	self, conn_dm: duckdb.DuckDBPyConnection, sl_dm: str
	) -> None:
	# A has 3 events vs mean of 5/3 ≈ 1.67 — highest deviation
	result = decompose_metric(
	DecomposeMetricInput(
	metric="windowed_count", dimensions=["category"], time_window=_DM_WIN
	),
	conn_dm,
	sl_dm,
	)

	scores = [s.anomaly_score for s in result.slices if s.anomaly_score is not None]
	assert scores == sorted(scores, reverse=True)
	assert result.slices[0].value == "A"

	def test_multiple_dimensions_combined(
	self, conn_dm: duckdb.DuckDBPyConnection, sl_dm: str
	) -> None:
	result = decompose_metric(
	DecomposeMetricInput(
	metric="windowed_count",
	dimensions=["category", "amount_band"],
	time_window=_DM_WIN,
	),
	conn_dm,
	sl_dm,
	)

	assert result.error is None
	# category (3 slices) + amount_band (2 slices) = 5 total
	assert len(result.slices) == 5
	dims_seen = {s.dimension for s in result.slices}
	assert dims_seen == {"category", "amount_band"}

	def test_static_metric_returns_error(
	self, conn_dm: duckdb.DuckDBPyConnection, sl_dm: str
	) -> None:
	# Static metrics (time_column: null) silently ignore the time window —
	# returning a clear error is safer than wrong results the agent can't detect.
	result = decompose_metric(
	DecomposeMetricInput(metric="static_avg", dimensions=["category"], time_window=_DM_WIN),
	conn_dm,
	sl_dm,
	)

	assert result.error is not None
	assert result.hint is not None
	assert "time_column" in result.error

	def test_unknown_metric_returns_error(
	self, conn_dm: duckdb.DuckDBPyConnection, sl_dm: str
	) -> None:
	result = decompose_metric(
	DecomposeMetricInput(
	metric="no_such_metric", dimensions=["category"], time_window=_DM_WIN
	),
	conn_dm,
	sl_dm,
	)

	assert result.error is not None
	assert result.hint is not None
	assert "no_such_metric" in result.error

	def test_unknown_dimension_returns_error(
	self, conn_dm: duckdb.DuckDBPyConnection, sl_dm: str
	) -> None:
	result = decompose_metric(
	DecomposeMetricInput(
	metric="windowed_count", dimensions=["bogus_dim"], time_window=_DM_WIN
	),
	conn_dm,
	sl_dm,
	)

	assert result.error is not None
	assert result.hint is not None

	def test_missing_yaml_returns_error(
	self, conn_dm: duckdb.DuckDBPyConnection, tmp_path: pytest.TempPathFactory
	) -> None:
	result = decompose_metric(
	DecomposeMetricInput(
	metric="windowed_count", dimensions=["category"], time_window=_DM_WIN
	),
	conn_dm,
	str(tmp_path / "missing.yml"),
	)

	assert result.error is not None
	assert result.hint is not None