engram / tests /test_integration_synthetic.py

test: upload 220 tests

2ece486 verified 7 days ago

6.29 kB

	"""
	ENGRAM Protocol — Synthetic Integration Test
	Full pipeline E2E with synthetic tensors — no real model needed.

	Pipeline: create KV → extract state → serialize .eng → load → index → query → retrieve
	"""

	from __future__ import annotations

	from pathlib import Path

	import pytest
	import torch
	from safetensors.torch import load_file

	from kvcos.core.cache_spec import LLAMA_3_1_8B
	from kvcos.core.serializer import EngramSerializer
	from kvcos.core.types import CompressionMethod, StateExtractionMode
	from kvcos.core.manifold_index import ManifoldIndex
	from kvcos.core.retriever import EGRRetriever
	from kvcos.core.state_extractor import MARStateExtractor
	from kvcos.storage.local import LocalStorageBackend
	from tests.conftest import make_synthetic_kv


	class TestFullPipeline:
	    """End-to-end: store → index → query → retrieve using synthetic data.

	    Every test builds its inputs with ``make_synthetic_kv`` against the
	    ``LLAMA_3_1_8B`` spec; the retrieval tests share ``_build_retriever``.
	    """

	    @staticmethod
	    def _build_retriever(data_dir: Path) -> tuple[EGRRetriever, ManifoldIndex]:
	        """Wire a mean-pool extractor, a fresh index and local storage together.

	        Shared by the retrieval tests so their setup cannot drift apart.
	        The leading underscore keeps pytest from collecting it as a test.

	        Args:
	            data_dir: Directory handed to ``LocalStorageBackend``.

	        Returns:
	            The retriever plus the index it was built on, so callers can
	            check ``index.n_entries`` after storing engrams.
	        """
	        extractor = MARStateExtractor(mode=StateExtractionMode.MEAN_POOL)
	        index = ManifoldIndex(dim=extractor.output_dim(LLAMA_3_1_8B))
	        storage = LocalStorageBackend(data_dir=data_dir)
	        return EGRRetriever(extractor, index, storage), index

	    def test_serialize_round_trip(self, tmp_data_dir: Path) -> None:
	        """Step 1-4: Create → serialize → load → verify shape."""
	        keys, values = make_synthetic_kv(LLAMA_3_1_8B, ctx_len=256)
	        assert keys.shape == (32, 8, 256, 128)

	        serializer = EngramSerializer()
	        eng_path = tmp_data_dir / "roundtrip.eng"

	        serializer.serialize(
	            keys=keys,
	            values=values,
	            agent_id="integration-test",
	            task_description="round-trip test",
	            model_id=LLAMA_3_1_8B["model_id"],
	            output_path=eng_path,
	            compression=CompressionMethod.FP16,
	        )
	        assert eng_path.exists()

	        # The written file must also load through the plain safetensors reader.
	        tensors = load_file(str(eng_path))
	        assert "layer_0_keys" in tensors

	        # The third return value (metadata) is not inspected by this test.
	        k_out, v_out, _meta = serializer.deserialize(eng_path)
	        assert k_out.shape == keys.shape
	        assert v_out.shape == values.shape

	    @pytest.mark.parametrize("mode", list(StateExtractionMode))
	    def test_extraction_all_modes(self, mode: StateExtractionMode) -> None:
	        """Step 2: Extract a state vector once per ``StateExtractionMode`` member."""
	        keys, _ = make_synthetic_kv(LLAMA_3_1_8B, ctx_len=256)
	        extractor = MARStateExtractor(mode=mode, rank=128)
	        result = extractor.extract(keys, LLAMA_3_1_8B)

	        # The state vector must be a non-empty 1-D tensor with positive norm.
	        assert result.state_vec.dim() == 1
	        assert result.state_vec.shape[0] > 0
	        assert result.l2_norm > 0
	        assert result.mode == mode

	    def test_index_and_query(self, tmp_data_dir: Path) -> None:
	        """Step 5-6: Index state vector → query with different tensor → get result."""
	        from kvcos.core.manifold_index import IndexEntry

	        keys_a, _ = make_synthetic_kv(LLAMA_3_1_8B, ctx_len=256, seed=42)
	        keys_b, _ = make_synthetic_kv(LLAMA_3_1_8B, ctx_len=256, seed=99)

	        extractor = MARStateExtractor(mode=StateExtractionMode.MEAN_POOL)
	        index = ManifoldIndex(dim=extractor.output_dim(LLAMA_3_1_8B))

	        # Extract and index the first tensor.
	        result_a = extractor.extract(keys_a, LLAMA_3_1_8B)
	        entry = IndexEntry(
	            cache_id="test-cache-a",
	            task_description="indexed engram",
	            model_id=LLAMA_3_1_8B["model_id"],
	            created_at="2026-01-01T00:00:00Z",
	            context_len=256,
	            l2_norm=result_a.l2_norm,
	        )
	        index.add(result_a.state_vec, entry)

	        # Query with the second tensor; the only indexed entry must come back.
	        result_b = extractor.extract(keys_b, LLAMA_3_1_8B)
	        results = index.search(result_b.state_vec, top_k=1)

	        assert len(results) >= 1
	        assert results[0]["cache_id"] == "test-cache-a"

	    def test_full_egr_pipeline(self, tmp_data_dir: Path) -> None:
	        """Step 7: Full EGR retrieval — store → index → query → retrieve."""
	        keys, values = make_synthetic_kv(LLAMA_3_1_8B, ctx_len=256, seed=42)
	        query_keys, _ = make_synthetic_kv(LLAMA_3_1_8B, ctx_len=256, seed=99)

	        retriever, index = self._build_retriever(tmp_data_dir)

	        # Store
	        cache_id = retriever.index_engram(
	            keys=keys,
	            values=values,
	            spec=LLAMA_3_1_8B,
	            agent_id="integration-test",
	            task_description="full pipeline test",
	            model_id=LLAMA_3_1_8B["model_id"],
	            output_dir=tmp_data_dir,
	        )
	        assert isinstance(cache_id, str)
	        assert index.n_entries == 1

	        # Retrieve
	        response = retriever.retrieve(query_keys, LLAMA_3_1_8B, top_k=1)
	        assert len(response.results) >= 1

	        result = response.results[0]
	        assert result.cache_id == cache_id
	        assert result.keys.shape == keys.shape
	        assert result.values.shape == values.shape
	        assert result.similarity != 0.0

	    def test_multi_engram_ranking(self, tmp_data_dir: Path) -> None:
	        """Store 3 engrams, query, verify results are ranked by similarity."""
	        retriever, index = self._build_retriever(tmp_data_dir)

	        for seed in (10, 20, 30):
	            keys, values = make_synthetic_kv(LLAMA_3_1_8B, ctx_len=64, seed=seed)
	            retriever.index_engram(
	                keys=keys,
	                values=values,
	                spec=LLAMA_3_1_8B,
	                agent_id="test",
	                task_description=f"seed-{seed}",
	                model_id=LLAMA_3_1_8B["model_id"],
	                output_dir=tmp_data_dir,
	            )

	        assert index.n_entries == 3

	        # Query with the same seed as the first stored engram.
	        query_keys, _ = make_synthetic_kv(LLAMA_3_1_8B, ctx_len=64, seed=10)
	        response = retriever.retrieve(query_keys, LLAMA_3_1_8B, top_k=3)

	        assert len(response.results) == 3
	        # Results should be sorted by descending similarity
	        sims = [r.similarity for r in response.results]
	        assert sims == sorted(sims, reverse=True)
	        # Closest match should be seed=10 (same as query)
	        assert response.results[0].task_description == "seed-10"