Granis87 committed on
Commit
c3a3710
·
verified ·
1 Parent(s): dbb04e4

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .env.example +116 -0
  2. .gitignore +1 -0
  3. REFACTORING_TODO.md +8 -5
  4. RELEASE_CHECKLIST.md +43 -65
  5. config.yaml +1 -1
  6. data/mnemocore_hnsw.faiss +0 -0
  7. data/mnemocore_hnsw_idmap.json +1 -0
  8. data/mnemocore_hnsw_vectors.npy +3 -0
  9. data/subconscious_evolution.json +2 -2
  10. docs/AGI_MEMORY_BLUEPRINT.md +713 -0
  11. integrations/README.md +233 -0
  12. integrations/aider/aider_wrap.sh +44 -0
  13. integrations/claude_code/CLAUDE_memory_snippet.md +38 -0
  14. integrations/claude_code/hooks/post_tool_store.py +96 -0
  15. integrations/claude_code/hooks/pre_session_inject.py +93 -0
  16. integrations/claude_code/hooks_config_fragment.json +28 -0
  17. integrations/claude_code/mcp_config.json +13 -0
  18. integrations/gemini_cli/GEMINI_memory_snippet.md +35 -0
  19. integrations/gemini_cli/gemini_wrap.sh +47 -0
  20. integrations/mnemo_bridge.py +177 -0
  21. integrations/setup.ps1 +158 -0
  22. integrations/setup.sh +299 -0
  23. integrations/universal/context_inject.sh +29 -0
  24. integrations/universal/store_session.sh +40 -0
  25. mnemocore_verify.py +136 -0
  26. src/mnemocore/agent_interface.py +145 -0
  27. src/mnemocore/api/main.py +365 -1
  28. src/mnemocore/core/agent_profile.py +65 -0
  29. src/mnemocore/core/anticipatory.py +51 -0
  30. src/mnemocore/core/binary_hdv.py +41 -31
  31. src/mnemocore/core/confidence.py +196 -0
  32. src/mnemocore/core/config.py +91 -11
  33. src/mnemocore/core/container.py +24 -0
  34. src/mnemocore/core/contradiction.py +336 -0
  35. src/mnemocore/core/cross_domain.py +211 -0
  36. src/mnemocore/core/emotional_tag.py +124 -0
  37. src/mnemocore/core/engine.py +230 -55
  38. src/mnemocore/core/episodic_store.py +144 -0
  39. src/mnemocore/core/forgetting_curve.py +233 -0
  40. src/mnemocore/core/hnsw_index.py +170 -140
  41. src/mnemocore/core/memory_model.py +132 -0
  42. src/mnemocore/core/meta_memory.py +70 -0
  43. src/mnemocore/core/node.py +20 -1
  44. src/mnemocore/core/prediction_store.py +294 -0
  45. src/mnemocore/core/preference_store.py +53 -0
  46. src/mnemocore/core/procedural_store.py +77 -0
  47. src/mnemocore/core/provenance.py +297 -0
  48. src/mnemocore/core/pulse.py +110 -0
  49. src/mnemocore/core/qdrant_store.py +38 -16
  50. src/mnemocore/core/semantic_consolidation.py +13 -0
.env.example ADDED
@@ -0,0 +1,116 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # MnemoCore Environment Configuration
2
+ # ====================================
3
+ # Copy this file to .env and fill in the values.
4
+ # All variables can be overridden at runtime.
5
+
6
+ # ===========================================
7
+ # REQUIRED: API Security
8
+ # ===========================================
9
+ # API key for authentication (REQUIRED - must be set)
10
+ # Generate a secure key: python -c "import secrets; print(secrets.token_urlsafe(32))"
11
+ HAIM_API_KEY=your-secure-api-key-here
12
+
13
+ # ===========================================
14
+ # Redis Configuration
15
+ # ===========================================
16
+ # Redis connection URL
17
+ # Format: redis://[username:password@]host:port/db
18
+ REDIS_URL=redis://redis:6379/0
19
+
20
+ # Redis stream key for pub/sub events
21
+ REDIS_STREAM_KEY=haim:subconscious
22
+
23
+ # Maximum Redis connections
24
+ REDIS_MAX_CONNECTIONS=10
25
+
26
+ # Redis socket timeout (seconds)
27
+ REDIS_SOCKET_TIMEOUT=5
28
+
29
+ # ===========================================
30
+ # Qdrant Configuration
31
+ # ===========================================
32
+ # Qdrant connection URL
33
+ QDRANT_URL=http://qdrant:6333
34
+
35
+ # Collection names
36
+ QDRANT_COLLECTION_HOT=haim_hot
37
+ QDRANT_COLLECTION_WARM=haim_warm
38
+
39
+ # ===========================================
40
+ # Server Configuration
41
+ # ===========================================
42
+ # Host to bind the server
43
+ HOST=0.0.0.0
44
+
45
+ # Port to listen on
46
+ PORT=8100
47
+
48
+ # Number of uvicorn workers (1 recommended for stateful apps)
49
+ WORKERS=1
50
+
51
+ # ===========================================
52
+ # Logging Configuration
53
+ # ===========================================
54
+ # Log level: DEBUG, INFO, WARNING, ERROR, CRITICAL
55
+ LOG_LEVEL=INFO
56
+
57
+ # Enable structured JSON logging
58
+ STRUCTURED_LOGGING=true
59
+
60
+ # ===========================================
61
+ # Observability (Prometheus)
62
+ # ===========================================
63
+ # Port for Prometheus metrics
64
+ METRICS_PORT=9090
65
+
66
+ # ===========================================
67
+ # Memory Tier Configuration
68
+ # ===========================================
69
+ # Hot tier max memories
70
+ HOT_MAX_MEMORIES=2000
71
+
72
+ # Warm tier max memories
73
+ WARM_MAX_MEMORIES=100000
74
+
75
+ # LTP decay rate
76
+ LTP_DECAY_LAMBDA=0.01
77
+
78
+ # ===========================================
79
+ # GPU Configuration (Optional)
80
+ # ===========================================
81
+ # Enable GPU acceleration
82
+ GPU_ENABLED=false
83
+
84
+ # CUDA device (e.g., cuda:0)
85
+ GPU_DEVICE=cuda:0
86
+
87
+ # ===========================================
88
+ # MCP Bridge Configuration (Optional)
89
+ # ===========================================
90
+ # Enable MCP bridge
91
+ MCP_ENABLED=false
92
+
93
+ # MCP transport: stdio, tcp
94
+ MCP_TRANSPORT=stdio
95
+
96
+ # MCP host and port (for TCP transport)
97
+ MCP_HOST=127.0.0.1
98
+ MCP_PORT=8110
99
+
100
+ # ===========================================
101
+ # CORS Configuration (Optional)
102
+ # ===========================================
103
+ # Allowed CORS origins (comma-separated)
104
+ # CORS_ORIGINS=http://localhost:3000,https://example.com
105
+
106
+ # ===========================================
107
+ # Rate Limiting (Optional)
108
+ # ===========================================
109
+ # Enable rate limiting
110
+ RATE_LIMIT_ENABLED=true
111
+
112
+ # Requests per window
113
+ RATE_LIMIT_REQUESTS=100
114
+
115
+ # Window size in seconds
116
+ RATE_LIMIT_WINDOW=60
.gitignore CHANGED
@@ -38,6 +38,7 @@ ENV/
38
  htmlcov/
39
  .tox/
40
  .nox/
 
41
 
42
  # Data (runtime generated)
43
  data/memory.jsonl
 
38
  htmlcov/
39
  .tox/
40
  .nox/
41
+ .hypothesis/
42
 
43
  # Data (runtime generated)
44
  data/memory.jsonl
REFACTORING_TODO.md CHANGED
@@ -26,7 +26,7 @@ Status för kodoptimering inför kommande funktionalitet.
26
  ---
27
 
28
  ### 2. Ofullständiga features
29
- **Status:** Pending
30
 
31
  **Problem:**
32
  - Flera TODOs i produktionskod som lämnats oimplementerade
@@ -44,8 +44,10 @@ Line 320: # TODO: orchestrate_orch_or() not implemented
44
  ```
45
 
46
  **Åtgärd:**
47
- - Implementera funktionerna
48
- - Eller ta bort dödkod
 
 
49
 
50
  ---
51
 
@@ -165,7 +167,7 @@ Import-stilen följer redan rekommenderad Python-praxis. Ingen åtgärd behövs.
165
  ## Förbättra testtäckning
166
 
167
  ```bash
168
- pytest --cov=src --cov-report=html
169
  ```
170
 
171
  Kör för att identifiera luckor i testtäckningen.
@@ -187,13 +189,14 @@ Kör för att identifiera luckor i testtäckningen.
187
  ## Framsteg
188
 
189
  - [x] Punkt 1: HDV-konsolidering ✅
190
- - [ ] Punkt 2: Ofullständiga features
191
  - [ ] Punkt 3: Felhantering
192
  - [ ] Punkt 4: Singleton-reduktion 📋 Roadmap
193
  - [ ] Punkt 5: Stora funktioner 📋 Roadmap
194
  - [x] Punkt 6: Circuit breakers ✅
195
  - [x] Punkt 7: Hårkodade sökvägar ✅
196
  - [x] Punkt 8: Import-stil ✅ (redan konsekvent)
 
197
 
198
  ---
199
 
 
26
  ---
27
 
28
  ### 2. Ofullständiga features
29
+ **Status:** ✅ Verified / Resolved
30
 
31
  **Problem:**
32
  - Flera TODOs i produktionskod som lämnats oimplementerade
 
44
  ```
45
 
46
  **Åtgärd:**
47
+ - `superposition_query`: Implemented as `_superposition_query` in `HAIMLLMIntegrator`.
48
+ - `orchestrate_orch_or`: Implemented in `HAIMEngine`.
49
+ - LLM Calls: Code now supports generic providers (OpenAI, Gemini via `google.generativeai`, etc) with safe fallbacks (`_mock_llm_response`) if not configured.
50
+ - `_concept_to_memory_id`: Implemented in `MultiAgentHAIM`.
51
 
52
  ---
53
 
 
167
  ## Förbättra testtäckning
168
 
169
  ```bash
170
+ pytest --cov=mnemocore --cov-report=html
171
  ```
172
 
173
  Kör för att identifiera luckor i testtäckningen.
 
189
  ## Framsteg
190
 
191
  - [x] Punkt 1: HDV-konsolidering ✅
192
+ - [x] Punkt 2: Ofullständiga features
193
  - [ ] Punkt 3: Felhantering
194
  - [ ] Punkt 4: Singleton-reduktion 📋 Roadmap
195
  - [ ] Punkt 5: Stora funktioner 📋 Roadmap
196
  - [x] Punkt 6: Circuit breakers ✅
197
  - [x] Punkt 7: Hårkodade sökvägar ✅
198
  - [x] Punkt 8: Import-stil ✅ (redan konsekvent)
199
+ - [x] Test-suite import fixad (src. -> mnemocore.) ✅
200
 
201
  ---
202
 
RELEASE_CHECKLIST.md CHANGED
@@ -1,59 +1,44 @@
1
- # MnemoCore Public Beta Release Checklist
2
 
3
- ## Status: 🟠 ORANGE → 🟢 GREEN
4
 
5
  ---
6
 
7
- ## ✅ Completed
8
 
9
  - [x] LICENSE file (MIT)
10
  - [x] .gitignore created
11
  - [x] data/memory.jsonl removed (no stored memories)
12
  - [x] No leaked API keys or credentials
13
- - [x] 82 unit tests passing
 
 
14
 
15
  ---
16
 
17
- ## 🔧 Code TODOs (Known Limitations)
18
 
19
- These are documented gaps that can ship as "Phase 4 roadmap" items:
20
 
21
- ### 1. `src/core/tier_manager.py:338`
22
- ```python
23
- pass # TODO: Implement full consolidation with Qdrant
24
- ```
25
- **Impact:** Warm→Cold tier consolidation limited
26
- **Workaround:** Hot→Warm works, Cold is filesystem-based
27
- **Fix:** Implement Qdrant batch scroll API for full archival
28
 
29
- ### 2. `src/core/engine.py:192`
30
- ```python
31
- # TODO: Phase 3.5 Qdrant search for WARM/COLD
32
- ```
33
- **Impact:** Query only searches HOT tier currently
34
- **Workaround:** Promote memories before querying
35
- **Fix:** Add async Qdrant similarity search in query()
36
-
37
- ### 3. `src/llm_integration.py:55-57, 128-129`
38
- ```python
39
- # TODO: Call Gemini 3 Pro via OpenClaw API
40
- reconstruction = "TODO: Call Gemini 3 Pro"
41
- ```
42
- **Impact:** LLM reconstruction not functional
43
- **Workaround:** Raw vector similarity works
44
- **Fix:** Implement LLM client or make it pluggable
45
 
46
- ### 4. `src/nightlab/engine.py:339`
47
- ```python
48
- # TODO: Notion API integration
49
- ```
50
- **Impact:** Session documentation not auto-pushed
51
- **Workaround:** Written to local markdown files
52
- **Fix:** Add optional Notion connector
 
 
53
 
54
  ---
55
 
56
- ## 📋 Pre-Release Actions
57
 
58
  ### Before git push:
59
 
@@ -62,7 +47,8 @@ reconstruction = "TODO: Call Gemini 3 Pro"
62
  rm -rf .pytest_cache __pycache__ */__pycache__ *.pyc
63
 
64
  # 2. Verify tests pass
65
- source .venv/bin/activate && python -m pytest tests/ -v
 
66
 
67
  # 3. Verify import works
68
  python -c "from mnemocore.core.engine import HAIMEngine; print('OK')"
@@ -72,54 +58,46 @@ grep -r "sk-" src/ --include="*.py"
72
  grep -r "api_key.*=" src/ --include="*.py" | grep -v "api_key=\"\""
73
 
74
  # 5. Initialize fresh data files
 
 
75
  touch data/memory.jsonl data/codebook.json data/concepts.json data/synapses.json
76
  ```
77
 
78
  ### Update README.md:
79
 
80
- - [ ] Add: "Beta Release - See RELEASE_CHECKLIST.md for known limitations"
81
- - [ ] Add: "Installation" section with `pip install -r requirements.txt`
82
- - [ ] Add: "Quick Start" example
83
- - [ ] Add: "Roadmap" section linking TODOs above
84
 
85
  ---
86
 
87
- ## 🚀 Release Command Sequence
88
 
89
  ```bash
90
- cd /home/dev-robin/Desktop/mnemocore
91
-
92
  # Verify clean state
93
  git status
94
 
95
- # Stage public files (exclude .venv)
96
- git add LICENSE .gitignore RELEASE_CHECKLIST.md
97
- git add src/ tests/ config.yaml requirements.txt pytest.ini
98
- git add README.md studycase.md docker-compose.yml
99
- git add data/.gitkeep # If exists, or create empty dirs
100
 
101
  # Commit
102
- git commit -m "Initial public beta release (MIT)
103
 
104
- Known limitations documented in RELEASE_CHECKLIST.md"
 
 
105
 
106
  # Tag
107
- git tag -a v0.1.0-beta -m "Public Beta Release"
108
 
109
- # Push (when ready)
110
  git push origin main --tags
111
  ```
112
 
113
  ---
114
 
115
- ## Post-Release
116
-
117
- - [ ] Create GitHub repository
118
- - [ ] Add repository topics: `vsa`, `holographic-memory`, `active-inference`, `vector-symbolic-architecture`
119
- - [ ] Enable GitHub Issues for community feedback
120
- - [ ] Publish whitepaper/blog post
121
-
122
- ---
123
-
124
- *Generated: 2026-02-15*
125
-
 
1
+ # MnemoCore Public Beta Release Checklist
2
 
3
+ ## Status: 🟢 GREEN
4
 
5
  ---
6
 
7
+ ## Completed
8
 
9
  - [x] LICENSE file (MIT)
10
  - [x] .gitignore created
11
  - [x] data/memory.jsonl removed (no stored memories)
12
  - [x] No leaked API keys or credentials
13
+ - [x] 377 unit tests passing (Coverage increased from 82)
14
+ - [x] Test suite import paths fixed (`src.` -> `mnemocore.`)
15
+ - [x] Critical TODOs addressed or verified as safe
16
 
17
  ---
18
 
19
+ ## 🔧 Resolved/Verified Items
20
 
21
+ The following items were previously listed as known limitations but have been verified as resolved or robustly handled:
22
 
23
+ 1. **Qdrant Consolidation:** `src/core/tier_manager.py` implements `consolidate_warm_to_cold` with full Qdrant batch scrolling.
24
+ 2. **Qdrant Search:** `src/core/engine.py` query pipeline correctly delegates to `TierManager.search` which queries Qdrant for WARM tier results.
25
+ 3. **LLM Integration:** `src/llm_integration.py` includes `_mock_llm_response` fallbacks when no provider is configured, ensuring stability even without API keys.
 
 
 
 
26
 
27
+ ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
28
 
29
+ ## 📝 Remaining Roadmap Items (Non-Blocking)
30
+
31
+ ### 1. `src/llm_integration.py` - Advanced LLM Features
32
+ - **Status:** Functional with generic providers.
33
+ - **Task:** Implement specific "OpenClaw" or "Gemini 3 Pro" adapters if required in future. Current implementation supports generic OpenAI/Anthropic/Gemini/Ollama clients.
34
+
35
+ ### 2. Full Notion Integration
36
+ - **Status:** Not currently present in `src/mnemocore`.
37
+ - **Task:** Re-introduce `nightlab` or similar module if Notion support is needed in Phase 5.
38
 
39
  ---
40
 
41
+ ## 📋 Pre-Release Actions
42
 
43
  ### Before git push:
44
 
 
47
  rm -rf .pytest_cache __pycache__ */__pycache__ *.pyc
48
 
49
  # 2. Verify tests pass
50
+ # Note: Ensure you are in the environment where mnemocore is installed
51
+ python -m pytest
52
 
53
  # 3. Verify import works
54
  python -c "from mnemocore.core.engine import HAIMEngine; print('OK')"
 
58
  grep -r "api_key.*=" src/ --include="*.py" | grep -v "api_key=\"\""
59
 
60
  # 5. Initialize fresh data files
61
+ # Ensure data directory exists
62
+ mkdir -p data
63
  touch data/memory.jsonl data/codebook.json data/concepts.json data/synapses.json
64
  ```
65
 
66
  ### Update README.md:
67
 
68
+ - [x] Add: "Beta Release - See RELEASE_CHECKLIST.md for known limitations"
69
+ - [x] Add: "Installation" section with `pip install -r requirements.txt`
70
+ - [x] Add: "Quick Start" example
71
+ - [x] Add: "Roadmap" section linking TODOs above
72
 
73
  ---
74
 
75
+ ## 🚀 Release Command Sequence
76
 
77
  ```bash
 
 
78
  # Verify clean state
79
  git status
80
 
81
+ # Stage public files
82
+ git add LICENSE .gitignore RELEASE_CHECKLIST.md REFACTORING_TODO.md
83
+ git add src/ tests/ config.yaml requirements.txt pytest.ini pyproject.toml
84
+ git add README.md docker-compose.yml
85
+ git add data/.gitkeep # If exists
86
 
87
  # Commit
88
+ git commit -m "Release Candidate: All tests passing, critical TODOs resolved.
89
 
90
+ - Fixed test suite import paths (src -> mnemocore)
91
+ - Verified Qdrant consolidation and search implementation
92
+ - Confirmed LLM integration fallbacks"
93
 
94
  # Tag
95
+ git tag -a v0.5.0-beta -m "Public Beta Release"
96
 
97
+ # Push
98
  git push origin main --tags
99
  ```
100
 
101
  ---
102
 
103
+ *Updated: 2026-02-18*
 
 
 
 
 
 
 
 
 
 
config.yaml CHANGED
@@ -86,7 +86,7 @@ haim:
86
 
87
  # MCP (Model Context Protocol) bridge
88
  mcp:
89
- enabled: false
90
  transport: "stdio" # "stdio" recommended for local MCP clients
91
  host: "127.0.0.1"
92
  port: 8110
 
86
 
87
  # MCP (Model Context Protocol) bridge
88
  mcp:
89
+ enabled: true
90
  transport: "stdio" # "stdio" recommended for local MCP clients
91
  host: "127.0.0.1"
92
  port: 8110
data/mnemocore_hnsw.faiss ADDED
Binary file (6.95 kB). View file
 
data/mnemocore_hnsw_idmap.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"id_map": ["test_node_1", "test_node_2", "test_node_0", "test_node_1", "test_node_2", "test_node_3", "test_node_4", "test_node_5", "test_node_6", "test_node_7", "test_node_8", "test_node_9", "f130a982-5936-4943-ac23-e1f4ad997d25", "19c168e1-c1c0-4074-bdc6-fa6c37bf5009", "b7ad4001-e20c-4f6d-8db7-eca98fbde4ea", "f22c991c-6336-4b11-867a-d141724253ff", "db802f41-0c60-4e62-8595-4864058924b2", "835b80bc-c2b1-4ecf-b0af-ec0442ec87bf", "d594c442-d4b5-4246-9c62-0fb605f235ca", "a467b3f5-d899-4b95-9e62-f7012171ec8d", "fdb78500-49fc-4cf3-a269-b023ba8fa11c", "21d4f6d9-72a6-4dd8-b83e-0d09ef57c680", "19f52711-1ae5-4c29-a0be-2618b162dace", "8442e4e6-cf0f-4f54-b35a-0ce6169fd2f3", "70010aa2-0d82-42bc-96f7-9b99374e24cd", "3cdb7cc9-44ce-4328-9d9a-44dc98d088eb", "1f12c17a-b4ef-4f21-b7f3-3df51196e7f6", "ac29dda1-fd96-4880-9141-01bc46ef93b1", "e0644808-6d24-470d-a667-867fe74d78e2", null, "836f116d-f47f-493b-9ac7-47db84e4a4f9", "fc37dc28-9e3a-484f-a65d-8bf46ee95dbb", "1d3fa01a-0710-453e-8738-4c5be348cd1b", "2776ca2a-429b-491d-9b8a-7061c9b14166", "a9cf8418-d188-41a8-b20d-f2431f790414", "eaf66116-a5ab-436a-a6c3-031d303cb6bd", "474ec49c-1f57-42ac-94e7-3d07d233780f", "a1a19beb-a5f8-4b31-9fe7-0db5b00415c6", "bad8ef94-7313-4bbf-a807-739ff8dcb5c2", "2f4bd760-18b2-4dc1-9dcb-3a6adb77ef23", "0c017bbc-e3ca-4ca0-be83-70b76c0b1be1", "3823dfcd-798d-4e59-a09e-113cc4ec6384", "2682da73-2827-4d68-83b5-1d88f92712ae", "280f0ca4-0930-4452-af29-392d2f99ba7b", "521f09c3-ed6c-4d0f-b04d-97362cb4a94d", "f338c239-dcbd-45ab-ab2b-4192084f5492", "2f011bbd-2a40-4666-a566-4117e8c5ed8e", "dae2e9c6-0c36-4536-b2ff-b59f5443c6fe", "d6028558-d803-454f-8a6f-f82463c44f18", "4c64fe2a-4194-494e-81a2-122911f6cd79", null, "n1", "n2", "n1"], "use_hnsw": false, "stale_count": 2}
data/mnemocore_hnsw_vectors.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00400554e796c7717c4def78feb30b5ba5360efed6a37bd35f71738695ac6522
3
+ size 7040
data/subconscious_evolution.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "updated_at": "2026-02-18T18:55:55.471022+00:00",
3
- "cycle_count": 56,
4
  "insights_generated": 0,
5
  "current_cycle_interval": 1,
6
  "schedule": {
 
1
  {
2
+ "updated_at": "2026-02-21T21:14:22.859465+00:00",
3
+ "cycle_count": 168,
4
  "insights_generated": 0,
5
  "current_cycle_interval": 1,
6
  "schedule": {
docs/AGI_MEMORY_BLUEPRINT.md ADDED
@@ -0,0 +1,713 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # MnemoCore AGI Memory Blueprint
2
+ ### Toward a True Cognitive Memory Substrate for Agentic Systems
3
+
4
+ > This document defines the **Phase 5 “AGI Memory” architecture** for MnemoCore – transforming it from a high‑end hyperdimensional memory engine into a **general cognitive substrate** for autonomous AI agents.
5
+
6
+ ---
7
+
8
+ ## 0. Goals & Non‑Goals
9
+
10
+ ### 0.1 Core Goals
11
+
12
+ - Provide a **plug‑and‑play cognitive memory system** that any agent framework can mount as its “mind”:
13
+ - Solves **context window** limits by offloading long‑term structure and recall.
14
+ - Solves **memory management** by autonomous consolidation, forgetting, and self‑repair.
15
+ - Provides **new thoughts, associations and suggestions** rather than only retrieval.
16
+ - Implement an explicit, formal model of:
17
+ - **Working / Short‑Term Memory (WM/STM)**
18
+ - **Episodic Memory**
19
+ - **Semantic Memory**
20
+ - **Procedural / Skill Memory**
21
+ - **Meta‑Memory & Self‑Model**
22
+ - Maintain:
23
+ - `pip install mnemocore` **zero‑infra dev mode** (SQLite / in‑process vector store).
24
+ - Full infra path (Redis, Qdrant, k8s, MCP, OpenClaw live memory integration).[cite:436][cite:437]
25
+ - Provide **clean public APIs** (Python + HTTP + MCP) that:
26
+ - Give agents a minimal but powerful surface: `observe / recall / reflect / propose_change`.
27
+ - Are stable enough to build higher‑level frameworks on (LangGraph, AutoGen, OpenAI Agents, OpenClaw, custom stacks).
28
+
29
+ ### 0.2 Non‑Goals
30
+
31
+ - MnemoCore is **not**:
32
+ - En LLM eller policy‑generator.
33
+ - En komplett agentram – det är **minnet + kognitiva processer**.
34
+ - MnemoCore ska **inte** hårdkoda specifika LLM‑providers.
35
+ - LLM används via abstraherad integration (`SubconsciousAI`, `LLMIntegration`) så att byte av motor är trivialt.
36
+
37
+ ---
38
+
39
+ ## 1. Cognitive Architecture Overview
40
+
41
+ ### 1.1 High‑Level Mental Model
42
+
43
+ Systemet ska exponera en internt konsekvent kognitiv modell:
44
+
45
+ - **Working Memory (WM)**
46
+ - Korttidsbuffert per agent / samtal / uppgift.
47
+ - Håller aktuella mål, senaste steg, delresultat.
48
+ - Living in RAM, med explicit API.
49
+
50
+ - **Episodic Memory (EM)**
51
+ - Sekvens av *episodes*: “agent X gjorde Y i kontext Z och fick utfallet U”.
52
+ - Tidsstämplad, med länkar mellan episoder (kedjor).
53
+ - Riktad mot “vad hände när, i vilken ordning”.
54
+
55
+ - **Semantic Memory (SM)**
56
+ - Abstraherade, konsoliderade representationer (concepts, prototypes).
57
+ - Sammanfattningar av hundratals episoder → en “semantic anchor”.
58
+ - Bra för svar på “vad vet jag generellt om X?”.
59
+
60
+ - **Procedural Memory (PM)**
61
+ - Skills, planer, recept: “för att lösa typ‑X problem, gör följande steg …”.
62
+ - Kan hålla både mänsklig läsbar text och exekverbar kod (snippets, tools).
63
+
64
+ - **Meta‑Memory (MM)**
65
+ - Självmodell för MnemoCore själv: prestanda, reliability, konfiguration, kända svagheter.
66
+ - Driver **självförbättringsloopen**.
67
+
68
+ Alla dessa lever ovanpå din befintliga HDV/VSA‑kärna, tier manager, synapse index, subconscious loop osv.[cite:436][cite:437]
69
+
70
+ ### 1.2 New Core Services
71
+
72
+ Föreslagna nya Python‑moduler (under `src/mnemocore/core`):
73
+
74
+ - `memory_model.py`
75
+ - Typed dataklasser för WM/EM/SM/PM/MM entities.
76
+ - `working_memory.py`
77
+ - WM implementation per agent/task med snabb caching.
78
+ - `episodic_store.py`
79
+ - Episodisk tidsserie, sekvens‑API.
80
+ - `semantic_store.py`
81
+ - Wrapper ovanpå befintlig vektorstore (Qdrant/HDV/HNSW) + consolidation hooks.
82
+ - `procedural_store.py`
83
+ - Lagret för skills, scripts, tool definitions.
84
+ - `meta_memory.py`
85
+ - Självmodell, logik för self‑improvement proposals.
86
+ - `pulse.py`
87
+ - “Heartbeat”‑loop: driver subtle thoughts, consolidation ticks, gap detection, self‑reflection.
88
+ - `agent_profile.py`
89
+ - Persistent profil per agent: preferenser, styrkor/svagheter, quirks.
90
+
91
+ ---
92
+
93
+ ## 2. Data Model
94
+
95
+ ### 2.1 Working Memory (WM)
96
+
97
+ ```python
98
+ # src/mnemocore/core/memory_model.py
99
+
100
+ @dataclass
101
+ class WorkingMemoryItem:
102
+ id: str
103
+ agent_id: str
104
+ created_at: datetime
105
+ ttl_seconds: int
106
+ content: str
107
+ kind: Literal["thought", "observation", "goal", "plan_step", "meta"]
108
+ importance: float #
109
+ tags: list[str]
110
+ hdv: BinaryHDV | None
111
+
112
+ @dataclass
113
+ class WorkingMemoryState:
114
+ agent_id: str
115
+ items: list[WorkingMemoryItem]
116
+ max_items: int
117
+ ```
118
+
119
+ **Invariants:**
120
+
121
+ - WM är *liten* (t.ex. 32–128 items per agent).
122
+ - WM ligger primärt i RAM; kan serialiseras till Redis/SQLite för persistens.
123
+ - Access är O(1)/O(log n); LRU + importance‑vägning vid evicering.
124
+
125
+ ### 2.2 Episodic Memory (EM)
126
+
127
+ ```python
128
+ @dataclass
129
+ class EpisodeEvent:
130
+ timestamp: datetime
131
+ kind: Literal["observation", "action", "thought", "reward", "error"]
132
+ content: str
133
+ metadata: dict[str, Any]
134
+ hdv: BinaryHDV
135
+
136
+ @dataclass
137
+ class Episode:
138
+ id: str
139
+ agent_id: str
140
+ started_at: datetime
141
+ ended_at: datetime | None
142
+ goal: str | None
143
+ context: str | None # project / environment
144
+ events: list[EpisodeEvent]
145
+ outcome: Literal["success", "failure", "partial", "unknown"]
146
+ reward: float | None
147
+ links_prev: list[str] # previous episode IDs
148
+ links_next: list[str] # next episode IDs
149
+ ltp_strength: float
150
+ reliability: float
151
+ ```
152
+
153
+ ### 2.3 Semantic Memory (SM)
154
+
155
+ ```python
156
+ @dataclass
157
+ class SemanticConcept:
158
+ id: str
159
+ label: str # "fastapi-request-validation"
160
+ description: str
161
+ tags: list[str]
162
+ prototype_hdv: BinaryHDV
163
+ support_episode_ids: list[str] # episodes som gav upphov
164
+ reliability: float
165
+ last_updated_at: datetime
166
+ metadata: dict[str, Any]
167
+ ```
168
+
169
+ Kopplas direkt mot consolidation/semantic_consolidation + codebook/immunology.[cite:436][cite:437]
170
+
171
+ ### 2.4 Procedural Memory (PM)
172
+
173
+ ```python
174
+ @dataclass
175
+ class ProcedureStep:
176
+ order: int
177
+ instruction: str
178
+ code_snippet: str | None
179
+ tool_call: dict[str, Any] | None
180
+
181
+ @dataclass
182
+ class Procedure:
183
+ id: str
184
+ name: str
185
+ description: str
186
+ created_by_agent: str | None
187
+ created_at: datetime
188
+ updated_at: datetime
189
+ steps: list[ProcedureStep]
190
+ trigger_pattern: str # "if user asks about X and Y"
191
+ success_count: int
192
+ failure_count: int
193
+ reliability: float
194
+ tags: list[str]
195
+ ```
196
+
197
+ Procedurer kan genereras av LLM (SubconsciousAI), testas i episodiskt minne, och sedan promotas/demotas med reliability‑loop.
198
+
199
+ ### 2.5 Meta‑Memory (MM)
200
+
201
+ ```python
202
+ @dataclass
203
+ class SelfMetric:
204
+ name: str # "hot_tier_hit_rate", "avg_query_latency_ms"
205
+ value: float
206
+ window: str # "5m", "1h", "24h"
207
+ updated_at: datetime
208
+
209
+ @dataclass
210
+ class SelfImprovementProposal:
211
+ id: str
212
+ created_at: datetime
213
+ author: Literal["system", "agent", "human"]
214
+ title: str
215
+ description: str
216
+ rationale: str
217
+ expected_effect: str
218
+ status: Literal["pending", "accepted", "rejected", "implemented"]
219
+ metadata: dict[str, Any]
220
+ ```
221
+
222
+ MM lagras delvis i vanlig storage (SM/PM) men har egen API‑yta.
223
+
224
+ ---
225
+
226
+ ## 3. Service Layer Design
227
+
228
+ ### 3.1 Working Memory Service
229
+
230
+ **Fil:** `src/mnemocore/core/working_memory.py`
231
+
232
+ Ansvar:
233
+
234
+ - Hålla en per‑agent WM‑state.
235
+ - Explicita operationer:
236
+ - `push_item(agent_id, item: WorkingMemoryItem)`
237
+ - `get_state(agent_id) -> WorkingMemoryState`
238
+ - `clear(agent_id)`
239
+ - `prune(agent_id)` – enligt importance + LRU.
240
+ - Integrera med engine/query:
241
+ - Vid varje query: WM får en snapshot av top‑K resultat som “context items”.
242
+ - Vid svar: agent kan markera vilka items som var relevanta.
243
+
244
+ ### 3.2 Episodic Store Service
245
+
246
+ **Fil:** `src/mnemocore/core/episodic_store.py`
247
+
248
+ Ansvar:
249
+
250
+ - Skapa och uppdatera Episodes:
251
+ - `start_episode(agent_id, goal, context) -> episode_id`
252
+ - `append_event(episode_id, kind, content, metadata)`
253
+ - `end_episode(episode_id, outcome, reward)`
254
+ - Query:
255
+ - `get_episode(id)`
256
+ - `get_recent(agent_id, limit, context)`
257
+ - `find_similar_episodes(hdv, top_k)`
258
+ - Koppling till befintlig HDV + tier manager:
259
+ - Varje Episode får en “episode_hdv” (bundle över event‑HDVs).
260
+ - LTP + reliabilitet följer samma formel som övrig LTP.
261
+
262
+ ### 3.3 Semantic Store Service
263
+
264
+ **Fil:** `src/mnemocore/core/semantic_store.py`
265
+
266
+ Ansvar:
267
+
268
+ - Hålla SemanticConcepts + codebook.
269
+ - API:
270
+ - `upsert_concept(concept: SemanticConcept)`
271
+ - `find_nearby_concepts(hdv, top_k)`
272
+ - `get_concept(id)`
273
+ - Hookar mot:
274
+ - `semantic_consolidation.py` → abstraktioner / anchors.
275
+ - `immunology.py` → attractor cleanup.
276
+ - `recursive_synthesizer.py` → djup konceptsyntes.
277
+
278
+ ### 3.4 Procedural Store Service
279
+
280
+ **Fil:** `src/mnemocore/core/procedural_store.py`
281
+
282
+ Ansvar:
283
+
284
+ - Lagra och hämta Procedures.
285
+ - API:
286
+ - `store_procedure(proc: Procedure)`
287
+ - `get_procedure(id)`
288
+ - `find_applicable_procedures(query, agent_id)`
289
+ - `record_procedure_outcome(id, success: bool)`
290
+ - Integrera med:
291
+ - SubconsciousAI → generera nya procedurer från pattern i EM/SM.
292
+ - Reliability‑loopen → promota “verified” skills.
293
+
294
+ ### 3.5 Meta Memory Service
295
+
296
+ **Fil:** `src/mnemocore/core/meta_memory.py`
297
+
298
+ Ansvar:
299
+
300
+ - Hålla SelfMetrics + SelfImprovementProposals.
301
+ - API:
302
+ - `record_metric(metric: SelfMetric)`
303
+ - `list_metrics(filter...)`
304
+ - `create_proposal(...)`
305
+ - `update_proposal_status(id, status)`
306
+ - Integrera med:
307
+ - Pulse → skanna metrics och föreslå ändringar.
308
+ - LLM → generera förslagstexter (“self‑reflection reports”).
309
+
310
+ ---
311
+
312
+ ## 4. Pulse & Subtle Thoughts
313
+
314
+ ### 4.1 Pulse Definition
315
+
316
+ **Fil:** `src/mnemocore/core/pulse.py`
317
+
318
+ “Pulsen” är en central loop (async task, cron, eller k8s CronJob) som:
319
+
320
+ - Kör med konfigurerbart intervall (t.ex. var 10:e sekund–var 5:e minut).
321
+ - Har ett definierat set “ticks”:
322
+
323
+ ```python
324
+ class PulseTick(Enum):
325
+ WM_MAINTENANCE = "wm_maintenance"
326
+ EPISODIC_CHAINING = "episodic_chaining"
327
+ SEMANTIC_REFRESH = "semantic_refresh"
328
+ GAP_DETECTION = "gap_detection"
329
+ INSIGHT_GENERATION = "insight_generation"
330
+ PROCEDURE_REFINEMENT = "procedure_refinement"
331
+ META_SELF_REFLECTION = "meta_self_reflection"
332
+ ```
333
+
334
+ Pulse orchestrerar:
335
+
336
+ - **WM_MAINTENANCE**
337
+ - Prune WM per agent.
338
+ - Lyfta nyligen viktiga items (“keep in focus”).
339
+
340
+ - **EPISODIC_CHAINING**
341
+ - Skapa/länka episodiska sekvenser (prev/next).
342
+ - “Temporala narrativ”.
343
+
344
+ - **SEMANTIC_REFRESH**
345
+ - Uppdatera semantic concepts baserat på nya episoder.
346
+ - Trigga immunology cleanup för drift.
347
+
348
+ - **GAP_DETECTION**
349
+ - Kör `GapDetector` över EM/SM sista N minuter/timmar.
350
+ - Producera strukturerade knowledge gaps.
351
+
352
+ - **INSIGHT_GENERATION**
353
+ - Kör SubconsciousAI/LLM över utvalda kluster.
354
+ - Skapar nya SemanticConcepts, Procedures, eller MetaProposals.
355
+
356
+ - **PROCEDURE_REFINEMENT**
357
+ - Uppdatera reliability över PM.
358
+ - Flagga outdated/farliga procedures.
359
+
360
+ - **META_SELF_REFLECTION**
361
+ - Sammanfattar senaste metriker, gap, failures → SelfImprovementProposals.
362
+
363
+ ### 4.2 Pulse Implementation Sketch
364
+
365
+ ```python
366
+ # src/mnemocore/core/pulse.py
367
+
368
+ class Pulse:
369
+ def __init__(self, container, config):
370
+ self.container = container
371
+ self.config = config
372
+ self._running = False
373
+
374
+ async def start(self):
375
+ self._running = True
376
+ while self._running:
377
+ start = datetime.utcnow()
378
+ await self.tick()
379
+ elapsed = (datetime.utcnow() - start).total_seconds()
380
+ await asyncio.sleep(max(0, self.config.pulse_interval_seconds - elapsed))
381
+
382
+ async def tick(self):
383
+ await self._wm_maintenance()
384
+ await self._episodic_chaining()
385
+ await self._semantic_refresh()
386
+ await self._gap_detection()
387
+ await self._insight_generation()
388
+ await self._procedure_refinement()
389
+ await self._meta_self_reflection()
390
+ ```
391
+
392
+ Konfiguration i `config.yaml`:
393
+
394
+ ```yaml
395
+ haim:
396
+ pulse:
397
+ enabled: true
398
+ interval_seconds: 30
399
+ max_agents_per_tick: 50
400
+ max_episodes_per_tick: 200
401
+ ```
402
+
403
+ ---
404
+
405
+ ## 5. Agent‑Facing APIs (Python & HTTP & MCP)
406
+
407
+ ### 5.1 High‑Level Python API
408
+
409
+ **Fil:** `src/mnemocore/agent_interface.py`
410
+
411
+ Syfte: ge agent‑kod ett ENKELT API:
412
+
413
+ ```python
414
+ class CognitiveMemoryClient:
415
+ def __init__(self, engine: HAIMEngine, wm, episodic, semantic, procedural, meta):
416
+ ...
417
+
418
+ # --- Observation & WM ---
419
+ def observe(self, agent_id: str, content: str, **meta) -> str: ...
420
+ def get_working_context(self, agent_id: str, limit: int = 16) -> list[WorkingMemoryItem]: ...
421
+
422
+ # --- Episodic ---
423
+ def start_episode(self, agent_id: str, goal: str, context: str | None = None) -> str: ...
424
+ def append_event(self, episode_id: str, kind: str, content: str, **meta) -> None: ...
425
+ def end_episode(self, episode_id: str, outcome: str, reward: float | None = None) -> None: ...
426
+
427
+ # --- Semantic / Retrieval ---
428
+ def recall(self, agent_id: str, query: str, context: str | None = None,
429
+ top_k: int = 8, modes: tuple[str, ...] = ("episodic","semantic")) -> list[dict]: ...
430
+
431
+ # --- Procedural ---
432
+ def suggest_procedures(self, agent_id: str, query: str, top_k: int = 5) -> list[Procedure]: ...
433
+ def record_procedure_outcome(self, proc_id: str, success: bool) -> None: ...
434
+
435
+ # --- Meta / Self-awareness ---
436
+ def get_knowledge_gaps(self, agent_id: str, lookback_hours: int = 24) -> list[dict]: ...
437
+ def get_self_improvement_proposals(self) -> list[SelfImprovementProposal]: ...
438
+ ```
439
+
440
+ ### 5.2 HTTP Layer Additions
441
+
442
+ Utöver befintliga `/store`, `/query`, `/feedback`, osv.[cite:437]
443
+
444
+ Nya endpoints:
445
+
446
+ - `POST /wm/observe`
447
+ - `GET /wm/{agent_id}`
448
+ - `POST /episodes/start`
449
+ - `POST /episodes/{id}/event`
450
+ - `POST /episodes/{id}/end`
451
+ - `GET /episodes/{id}`
452
+ - `GET /agents/{agent_id}/episodes`
453
+ - `GET /agents/{agent_id}/context`
454
+ - `GET /agents/{agent_id}/knowledge-gaps`
455
+ - `GET /procedures/search`
456
+ - `POST /procedures/{id}/feedback`
457
+ - `GET /meta/proposals`
458
+ - `POST /meta/proposals`
459
+
460
+ ### 5.3 MCP Tools
461
+
462
+ Utöka `mnemocore.mcp.server` med nya verktyg:
463
+
464
+ - `store_observation`
465
+ - `recall_context`
466
+ - `start_episode`, `end_episode`
467
+ - `query_memory`
468
+ - `get_knowledge_gaps`
469
+ - `get_self_improvement_proposals`
470
+
471
+ Så att Claude/GPT‑agenter kan:
472
+
473
+ - “Titta in” i agentens egen historik.
474
+ - Få WM + relevanta episoder + semantic concepts innan svar.
475
+ - Få gaps och self‑reflection prompts.
476
+
477
+ ---
478
+
479
+ ## 6. Self‑Improvement Loop
480
+
481
+ ### 6.1 Loop Definition
482
+
483
+ Målet: MnemoCore ska **ständigt förbättra sig**:
484
+
485
+ 1. Samlar **metrics** (performance + quality).
486
+ 2. Upptäcker systematiska brister (höga felrates, gap‑clusters).
487
+ 3. Genererar SelfImprovementProposals via LLM.
488
+ 4. Låter människa eller meta‑agent granska & appliera.
489
+
490
+ ### 6.2 Pipeline
491
+
492
+ 1. **Metrics Collection**
493
+ - Utnyttja befintlig `metrics.py` + Prometheus.[cite:436][cite:437]
494
+ - Exempelmetriker:
495
+ - `query_hit_rate`, `retrieval_latency_ms`
496
+ - `feedback_success_rate`, `feedback_failure_rate`
497
+ - `hot_tier_size`, `tier_promotion_rate`
498
+ - `gap_detection_count`, `gap_fill_count`
499
+
500
+ 2. **Issue Detection (Rule‑Based)**
501
+ - Batchjobb (Pulse) kör enkla regler:
502
+ - Om `feedback_failure_rate > X` för en viss tag (t.ex. “fastapi”) → skapa “knowledge area weak” flagg.
503
+ - Om `hot_tier_hit_rate < threshold` → dålig context‑masking eller felaktigt tunade thresholds.
504
+
505
+ 3. **Proposal Generation (LLM)**
506
+ - `SubconsciousAI` får inputs:
507
+ - Metrics, knowledge gaps, failure cases, config snapshot.
508
+ - Prompt genererar:
509
+ - `SelfImprovementProposal.title/description/rationale`.
510
+
511
+ 4. **Review & Execution**
512
+ - API / UI för att lista proposals.
513
+ - Människa/agent accepterar/rejectar.
514
+ - Vid accept:
515
+ - Kan trigga config ändringar (med patch PR).
516
+ - Kan skapa GitHub issues/PR mallar.
517
+
518
+ ### 6.3 API
519
+
520
+ - `GET /meta/proposals`
521
+ - `POST /meta/proposals/{id}/status`
522
+
523
+ ---
524
+
525
+ ## 7. Association & “Subtle Thoughts”
526
+
527
+ ### 7.1 Association Engine
528
+
529
+ Målet: Systemet ska **själv föreslå**:
530
+
531
+ - Analogier (“det här liknar när vi gjorde X i annat projekt”).
532
+ - Relaterade koncept (“du pratar om Y, men Z har varit viktigt tidigare”).
533
+ - Långsiktiga teman och lärdomar.
534
+
535
+ Bygg vidare på:
536
+
537
+ - `synapse_index.py` (hebbian connections).[cite:436]
538
+ - `ripple_context.py` (kaskader).[cite:436]
539
+ - `recursive_synthesizer.py` (konceptsyntes).[cite:436]
540
+
541
+ Nya pattern:
542
+
543
+ - Vid varje Pulse:
544
+ - Hämta senaste N episoder.
545
+ - Kör k‑NN i semantic concept space.
546
+ - Kör ripple over synapses.
547
+ - Generera en uppsättning **CandidateAssociations**:
548
+
549
+ ```python
550
+ @dataclass
551
+ class CandidateAssociation:
552
+ id: str
553
+ agent_id: str
554
+ created_at: datetime
555
+ source_episode_ids: list[str]
556
+ related_concept_ids: list[str]
557
+ suggestion_text: str
558
+ confidence: float
559
+ ```
560
+
561
+ Lagra i SM/EM så att agent/LLM kan hämta “subtle thoughts” innan svar:
562
+
563
+ - `GET /agents/{agent_id}/subtle-thoughts`
564
+
565
+ ---
566
+
567
+ ## 8. Storage Backends & Profiles
568
+
569
+ ### 8.1 Profiles
570
+
571
+ Behåll pip‑enkelheten via profiler:
572
+
573
+ - **Lite Profile** (default, no extra deps):
574
+ - WM: in‑process dict
575
+ - EM: SQLite
576
+ - SM: in‑process HDV + mmap
577
+ - PM/MM: SQLite/JSON
578
+ - **Standard Profile**:
579
+ - WARM: Redis
580
+ - COLD: filesystem
581
+ - **Scale Profile**:
582
+ - WARM: Redis
583
+ - COLD: Qdrant (eller annan vector DB)
584
+ - Optionellt: S3 archive
585
+
586
+ Konfigurationsexempel:
587
+
588
+ ```yaml
589
+ haim:
590
+ profile: "lite" # "lite" | "standard" | "scale"
591
+ ```
592
+
593
+ ---
594
+
595
+ ## 9. OpenClaw & External Agents
596
+
597
+ ### 9.1 Designprincip för integration
598
+
599
+ För OpenClaw / liknande orchestrators:
600
+
601
+ - En agent definieras genom:
602
+ - `agent_id`
603
+ - `capabilities` (tools etc.)
604
+ - MnemoCore ska behandla `agent_id` som primär nyckel för:
605
+ - WM
606
+ - Episoder
607
+ - Preferenser
608
+ - Procedurer som agenten själv skapat
609
+
610
+ ### 9.2 “Live Memory” Pattern
611
+
612
+ - När OpenClaw kör:
613
+ - Varje observation → `observe(agent_id, content, meta)`
614
+ - Varje tool call / action → episod event.
615
+ - Före varje beslut:
616
+ - Hämta:
617
+ - `WM`
618
+ - `recent episodes`
619
+ - `relevant semantic concepts`
620
+ - `subtle thoughts` / associations
621
+ - `knowledge gaps` (om agenten vill använda dessa som frågor).
622
+
623
+ ---
624
+
625
+ ## 10. Testing & Evaluation Plan
626
+
627
+ ### 10.1 Unit & Integration Tests
628
+
629
+ Nya testfiler:
630
+
631
+ - `tests/test_working_memory.py`
632
+ - `tests/test_episodic_store.py`
633
+ - `tests/test_semantic_store.py`
634
+ - `tests/test_procedural_store.py`
635
+ - `tests/test_meta_memory.py`
636
+ - `tests/test_pulse.py`
637
+ - `tests/test_agent_interface.py`
638
+
639
+ Fokus:
640
+
641
+ - Invarianter (max WM size, LTP thresholds, reliability‑update).
642
+ - Episodic chaining korrekt.
643
+ - Semantic consolidation integration med nya SM‑API:t.
644
+ - Pulse tick ordering & time budget.
645
+
646
+ ### 10.2 Behavioural Benchmarks
647
+
648
+ Skapa `benchmarks/AGI_MEMORY_SCENARIOS.md`:
649
+
650
+ - Multi‑session tasks där agent måste:
651
+ - Minnas user preferences över dagar.
652
+ - Lära sig av failed attempts (feedback).
653
+ - Använda analogier över domäner.
654
+
655
+ Mät:
656
+
657
+ - Context reuse rate.
658
+ - Time‑to‑solve vs “no memory” baseline.
659
+ - Antal genererade self‑improvement proposals som faktiskt förbättrar outcomes.
660
+
661
+ ---
662
+
663
+ ## 11. Implementation Roadmap
664
+
665
+ ### Phase 5.0 – Core Structure
666
+
667
+ 1. Introduce `memory_model.py`, `working_memory.py`, `episodic_store.py`, `semantic_store.py`, `procedural_store.py`, `meta_memory.py`, `pulse.py`.
668
+ 2. Wire everything in `container.py` (new providers).
669
+ 3. Add `CognitiveMemoryClient` + minimal tests.
670
+
671
+ ### Phase 5.1 – WM/EM/SM in Engine
672
+
673
+ 4. Integrate WM into engine query/store paths.
674
+ 5. Integrate EM creation in API (store/query/feedback).
675
+ 6. Adapt semantic_consolidation/immunology to new SM service.
676
+
677
+ ### Phase 5.2 – Procedural & Association
678
+
679
+ 7. Implement procedural store + reliability integration.
680
+ 8. Build association engine + subtle thoughts endpoints.
681
+
682
+ ### Phase 5.3 – Self‑Improvement
683
+
684
+ 9. Wire metrics → meta_memory → proposals via SubconsciousAI.
685
+ 10. Add endpoints & optional small UI for proposals.
686
+
687
+ ### Phase 5.4 – Hardening & Agents
688
+
689
+ 11. Harden profiles (lite/standard/scale).
690
+ 12. Build reference integrations (OpenClaw, LangGraph, AutoGen).
691
+
692
+ ---
693
+
694
+ ## 12. Developer Notes
695
+
696
+ - Håll **backwards compatibility** på API där det går:
697
+ - Nya endpoints → prefix `v2` om nödvändigt.
698
+ - Python API kan vara “ny high‑level layer” ovanpå befintlig `HAIMEngine`.
699
+ - All ny funktionalitet **feature‑flaggas i config**:
700
+ - `haim.pulse.enabled`
701
+ - `haim.episodic.enabled`
702
+ - `haim.procedural.enabled`
703
+ - etc.
704
+ - Strikt logging / metrics för allt nytt:
705
+ - `haim_pulse_tick_duration_seconds`
706
+ - `haim_wm_size`
707
+ - `haim_episode_count`
708
+ - `haim_procedure_success_rate`
709
+ - `haim_self_proposals_pending`
710
+
711
+ ---
712
+
713
+ *This blueprint is the contract between MnemoCore, its agents, and its contributors. The intention is to let autonomous AI agents, human developers, and MnemoCore itself co‑evolve toward a truly cognitive memory substrate – one that remembers, forgets, reflects, and grows.*
integrations/README.md ADDED
@@ -0,0 +1,233 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # MnemoCore Integrations
2
+
3
+ Connect MnemoCore's persistent cognitive memory to your AI coding tools.
4
+
5
+ ## Supported tools
6
+
7
+ | Tool | Method | Notes |
8
+ |------|--------|-------|
9
+ | **Claude Code** | MCP server + hooks + CLAUDE.md | Best integration — native tool access |
10
+ | **Gemini CLI** | GEMINI.md + wrapper script | Context injected at session start |
11
+ | **Aider** | Wrapper script (`--system-prompt`) | Context injected at session start |
12
+ | **Any CLI tool** | Universal shell scripts | Pipe context into any tool |
13
+ | **Open-source agents** | REST API (`mnemo_bridge.py`) | Minimal Python dependency |
14
+
15
+ ---
16
+
17
+ ## Quick setup
18
+
19
+ ### Prerequisites
20
+
21
+ 1. MnemoCore running: `uvicorn mnemocore.api.main:app --port 8100`
22
+ 2. `HAIM_API_KEY` environment variable set
23
+ 3. Python 3.10+ with `requests` (`pip install requests`)
24
+
25
+ ### Linux / macOS
26
+
27
+ ```bash
28
+ cd integrations/
29
+ bash setup.sh --all
30
+ ```
31
+
32
+ ### Windows (PowerShell)
33
+
34
+ ```powershell
35
+ cd integrations\
36
+ .\setup.ps1 -All
37
+ ```
38
+
39
+ ### Manual: test the bridge first
40
+
41
+ ```bash
42
+ export MNEMOCORE_URL=http://localhost:8100
43
+ export HAIM_API_KEY=your-key-here
44
+
45
+ python integrations/mnemo_bridge.py health
46
+ python integrations/mnemo_bridge.py context --top-k 5
47
+ python integrations/mnemo_bridge.py store "Fixed import error in engine.py" --tags "bugfix,python"
48
+ ```
49
+
50
+ ---
51
+
52
+ ## Claude Code (recommended)
53
+
54
+ The setup script does three things:
55
+
56
+ ### 1. MCP server — native tool access
57
+
58
+ Registers MnemoCore as an MCP server in `~/.claude/mcp.json`.
59
+ Claude Code gets four tools:
60
+ - `memory_query` — search memories
61
+ - `memory_store` — store a memory
62
+ - `memory_get` / `memory_delete` — manage individual memories
63
+
64
+ Claude will use these automatically when you instruct it to remember things,
65
+ or you can configure CLAUDE.md to trigger them on every session (see below).
66
+
67
+ **Verify:** Run `claude mcp list` — you should see `mnemocore` listed.
68
+
69
+ ### 2. Hooks — automatic background storage
70
+
71
+ Two hooks are installed in `~/.claude/settings.json`:
72
+
73
+ - **PreToolUse** (`pre_session_inject.py`): On the first tool call of a session,
74
+ queries MnemoCore and injects recent context into Claude's awareness.
75
+
76
+ - **PostToolUse** (`post_tool_store.py`): After every `Edit`/`Write` call,
77
+ stores a lightweight memory entry in the background (non-blocking).
78
+
79
+ Hooks never block Claude Code — they degrade silently if MnemoCore is offline.
80
+
81
+ ### 3. CLAUDE.md — behavioral instructions
82
+
83
+ The setup appends memory usage instructions to `CLAUDE.md`.
84
+ This tells Claude *when* to use memory tools proactively.
85
+
86
+ ---
87
+
88
+ ## Gemini CLI
89
+
90
+ ```bash
91
+ # Option A: Use wrapper (injects context automatically)
92
+ alias gemini='bash integrations/gemini_cli/gemini_wrap.sh'
93
+ gemini "Fix the async bug in engine.py"
94
+
95
+ # Option B: Manual context injection
96
+ CONTEXT=$(integrations/universal/context_inject.sh)
97
+ gemini --system-prompt "$CONTEXT" "Fix the async bug in engine.py"
98
+ ```
99
+
100
+ Also add instructions to your `GEMINI.md`:
101
+ ```bash
102
+ cat integrations/gemini_cli/GEMINI_memory_snippet.md >> GEMINI.md
103
+ ```
104
+
105
+ ---
106
+
107
+ ## Aider
108
+
109
+ ```bash
110
+ # Option A: Use wrapper
111
+ alias aider='bash integrations/aider/aider_wrap.sh'
112
+ aider --model claude-3-5-sonnet-20241022 engine.py
113
+
114
+ # Option B: Manual
115
+ CONTEXT=$(integrations/universal/context_inject.sh "async engine")
116
+ aider --system-prompt "$CONTEXT" engine.py
117
+ ```
118
+
119
+ ---
120
+
121
+ ## Universal / Open-source agents
122
+
123
+ Any tool that accepts a system prompt can use MnemoCore:
124
+
125
+ ```bash
126
+ # Get context as markdown
127
+ integrations/universal/context_inject.sh "query text" 6
128
+
129
+ # Use in any command
130
+ MY_CONTEXT=$(integrations/universal/context_inject.sh)
131
+ some-ai-cli --system "$MY_CONTEXT" "do the task"
132
+
133
+ # Store a memory after a session
134
+ integrations/universal/store_session.sh \
135
+ "Discovered that warm tier mmap files grow unbounded without consolidation" \
136
+ "discovery,warm-tier,storage" \
137
+ "mnemocore-project"
138
+ ```
139
+
140
+ ### REST API (Python / any language)
141
+
142
+ ```python
143
+ import os, requests
144
+
145
+ BASE = os.getenv("MNEMOCORE_URL", "http://localhost:8100")
146
+ KEY = os.getenv("HAIM_API_KEY", "")
147
+ HDR = {"X-API-Key": KEY}
148
+
149
+ # Query
150
+ r = requests.post(f"{BASE}/query", json={"query": "async bugs", "top_k": 5}, headers=HDR)
151
+ for m in r.json()["results"]:
152
+ print(m["score"], m["content"])
153
+
154
+ # Store
155
+ requests.post(f"{BASE}/store", json={
156
+ "content": "Found root cause of memory leak in consolidation worker",
157
+ "metadata": {"source": "my-agent", "tags": ["bugfix", "memory"]}
158
+ }, headers=HDR)
159
+ ```
160
+
161
+ ---
162
+
163
+ ## Environment variables
164
+
165
+ | Variable | Default | Description |
166
+ |----------|---------|-------------|
167
+ | `MNEMOCORE_URL` | `http://localhost:8100` | MnemoCore API base URL |
168
+ | `HAIM_API_KEY` | — | API key (same as MnemoCore's `HAIM_API_KEY`) |
169
+ | `MNEMOCORE_TIMEOUT` | `5` | Request timeout in seconds |
170
+ | `MNEMOCORE_CONTEXT_DIR` | `~/.claude/mnemo_context` | Where hook writes context files |
171
+
172
+ ---
173
+
174
+ ## Architecture
175
+
176
+ ```
177
+ ┌─────────────────────────────────────────────────────┐
178
+ │ AI Coding Tool │
179
+ │ (Claude Code / Gemini CLI / Aider / Custom) │
180
+ └──────────────┬──────────────────────┬───────────────┘
181
+ │ MCP tools │ System prompt
182
+ │ (Claude Code only) │ (all tools)
183
+ ▼ ▼
184
+ ┌──────────────────────┐ ┌───────────────────────────┐
185
+ │ mnemocore MCP server│ │ mnemo_bridge.py CLI │
186
+ │ (stdio transport) │ │ (lightweight wrapper) │
187
+ └──────────┬───────────┘ └─────────────┬─────────────┘
188
+ │ │
189
+ └────────────┬───────────────┘
190
+ │ HTTP REST
191
+
192
+ ┌────────────────────────┐
193
+ │ MnemoCore API │
194
+ │ localhost:8100 │
195
+ │ │
196
+ │ ┌──────────────────┐ │
197
+ │ │ HAIMEngine │ │
198
+ │ │ HOT/WARM/COLD │ │
199
+ │ │ HDV vectors │ │
200
+ │ └──────────────────┘ │
201
+ └────────────────────────┘
202
+ ```
203
+
204
+ ---
205
+
206
+ ## Troubleshooting
207
+
208
+ **MnemoCore offline:**
209
+ ```bash
210
+ python integrations/mnemo_bridge.py health
211
+ # → MnemoCore is OFFLINE
212
+ # Start it: uvicorn mnemocore.api.main:app --port 8100
213
+ ```
214
+
215
+ **API key error (401):**
216
+ ```bash
217
+ export HAIM_API_KEY="your-key-from-.env"
218
+ python integrations/mnemo_bridge.py health
219
+ ```
220
+
221
+ **Hook not triggering (Claude Code):**
222
+ ```bash
223
+ # Check settings.json
224
+ cat ~/.claude/settings.json | python -m json.tool | grep -A5 hooks
225
+ ```
226
+
227
+ **MCP server not found (Claude Code):**
228
+ ```bash
229
+ # Verify mcp.json
230
+ cat ~/.claude/mcp.json
231
+ # Check PYTHONPATH includes src/
232
+ cd /path/to/mnemocore && python -m mnemocore.mcp.server --help
233
+ ```
integrations/aider/aider_wrap.sh ADDED
@@ -0,0 +1,44 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env bash
2
+ # aider_wrap.sh — MnemoCore context injector for Aider
3
+ # ======================================================
4
+ # Usage: ./aider_wrap.sh [any aider args...]
5
+ #
6
+ # Injects MnemoCore memory context into Aider's system prompt
7
+ # using the --system-prompt flag (available in Aider 0.40+).
8
+ #
9
+ # Environment variables:
10
+ # MNEMOCORE_URL MnemoCore REST URL (default: http://localhost:8100)
11
+ # HAIM_API_KEY API key for MnemoCore
12
+ # BRIDGE_PY Path to mnemo_bridge.py (auto-detected)
13
+ # AIDER_BIN Path to aider binary (default: aider)
14
+
15
+ set -euo pipefail
16
+
17
+ SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
18
+ BRIDGE_PY="${BRIDGE_PY:-$(realpath "$SCRIPT_DIR/../mnemo_bridge.py")}"
19
+ AIDER_BIN="${AIDER_BIN:-aider}"
20
+
21
+ # ── Fetch context ──────────────────────────────────────────────────────────
22
+ CONTEXT=""
23
+ if python3 "$BRIDGE_PY" health &>/dev/null; then
24
+ CONTEXT="$(python3 "$BRIDGE_PY" context --top-k 6 2>/dev/null || true)"
25
+ fi
26
+
27
+ # ── Run Aider with or without injected context ─────────────────────────────
28
+ if [[ -n "$CONTEXT" ]]; then
29
+ PROMPT_FILE="$(mktemp /tmp/mnemo_aider_XXXXXX.md)"
30
+ trap 'rm -f "$PROMPT_FILE"' EXIT
31
+
32
+ cat > "$PROMPT_FILE" <<'HEREDOC'
33
+ ## MnemoCore: Memory from previous sessions
34
+
35
+ Use the following context from persistent memory to inform your work.
36
+ Do not repeat known decisions. Reference this to avoid re-discovering bugs.
37
+
38
+ HEREDOC
39
+ echo "$CONTEXT" >> "$PROMPT_FILE"
40
+
41
+ exec "$AIDER_BIN" --system-prompt "$PROMPT_FILE" "$@"
42
+ else
43
+ exec "$AIDER_BIN" "$@"
44
+ fi
integrations/claude_code/CLAUDE_memory_snippet.md ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # MnemoCore — Persistent Cognitive Memory
2
+
3
+ You have access to a persistent memory system via MCP tools:
4
+ - `memory_query` — search for relevant memories before starting any task
5
+ - `memory_store` — save important decisions, findings, and bug fixes after completing work
6
+ - `memory_stats` / `memory_health` — check system status
7
+
8
+ ## When to use memory
9
+
10
+ **At session start:** Call `memory_query` with the user's first message to retrieve relevant past context.
11
+
12
+ **After completing a task:** Call `memory_store` to record:
13
+ - What was changed and why (key architectural decisions)
14
+ - Bug fixes and root causes
15
+ - Non-obvious patterns discovered in the codebase
16
+ - User preferences and project conventions
17
+
18
+ **When you find something unexpected:** Store it immediately with relevant tags.
19
+
20
+ ## Storing memories
21
+
22
+ Include useful metadata:
23
+ ```json
24
+ {
25
+ "content": "Fixed async race condition in tier_manager.py by adding asyncio.Lock around promotion logic",
26
+ "metadata": {
27
+ "source": "claude-code",
28
+ "tags": ["bugfix", "async", "tier_manager"],
29
+ "project": "mnemocore"
30
+ }
31
+ }
32
+ ```
33
+
34
+ ## Rules
35
+ - Do NOT store trivial information (e.g., "the user asked me to open a file")
36
+ - DO store non-obvious insights, decisions with reasoning, and recurring patterns
37
+ - Query memory BEFORE reading files when working on a known codebase
38
+ - Store memory AFTER completing non-trivial changes
integrations/claude_code/hooks/post_tool_store.py ADDED
@@ -0,0 +1,96 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python3
2
+ """
3
+ Claude Code PostToolUse hook — MnemoCore auto-store
4
+ ====================================================
5
+ Automatically stores the result of significant file edits into MnemoCore.
6
+
7
+ Configure in ~/.claude/settings.json:
8
+ {
9
+ "hooks": {
10
+ "PostToolUse": [
11
+ {
12
+ "matcher": "Edit|Write",
13
+ "hooks": [
14
+ {
15
+ "type": "command",
16
+ "command": "python /path/to/post_tool_store.py"
17
+ }
18
+ ]
19
+ }
20
+ ]
21
+ }
22
+ }
23
+
24
+ The hook receives a JSON blob on stdin and exits 0 to allow the tool call.
25
+ It stores a lightweight memory entry in the background (non-blocking via
26
+ subprocess) so it never delays Claude Code's response.
27
+ """
28
+
29
+ import json
30
+ import os
31
+ import subprocess
32
+ import sys
33
+ from pathlib import Path
34
+
35
+ BRIDGE = Path(__file__).resolve().parents[2] / "mnemo_bridge.py"
36
+ MIN_CONTENT_LEN = 30 # Ignore trivially short edits
37
+
38
+
39
+ def main() -> int:
40
+ try:
41
+ raw = sys.stdin.read()
42
+ data = json.loads(raw) if raw.strip() else {}
43
+ except json.JSONDecodeError:
44
+ return 0 # Never block Claude Code
45
+
46
+ tool_name = data.get("tool_name", "")
47
+ tool_input = data.get("tool_input", {})
48
+ session_id = data.get("session_id", "")
49
+
50
+ # Only act on file-writing tools
51
+ if tool_name not in {"Edit", "Write", "MultiEdit"}:
52
+ return 0
53
+
54
+ file_path = tool_input.get("file_path", "")
55
+ new_string = tool_input.get("new_string") or tool_input.get("content", "")
56
+
57
+ if not new_string or len(new_string) < MIN_CONTENT_LEN:
58
+ return 0
59
+
60
+ # Build a concise memory entry — just the file + a short excerpt
61
+ excerpt = new_string[:200].replace("\n", " ").strip()
62
+ memory_text = f"Modified {file_path}: {excerpt}"
63
+
64
+ tags = "claude-code,edit"
65
+ if file_path.endswith(".py"):
66
+ tags += ",python"
67
+ elif file_path.endswith((".ts", ".js")):
68
+ tags += ",javascript"
69
+
70
+ ctx = session_id[:16] if session_id else None
71
+
72
+ cmd = [
73
+ sys.executable, str(BRIDGE),
74
+ "store", memory_text,
75
+ "--source", "claude-code-hook",
76
+ "--tags", tags,
77
+ ]
78
+ if ctx:
79
+ cmd += ["--ctx", ctx]
80
+
81
+ env = {**os.environ}
82
+
83
+ # Fire-and-forget: do not block Claude Code
84
+ subprocess.Popen(
85
+ cmd,
86
+ env=env,
87
+ stdout=subprocess.DEVNULL,
88
+ stderr=subprocess.DEVNULL,
89
+ start_new_session=True,
90
+ )
91
+
92
+ return 0
93
+
94
+
95
+ if __name__ == "__main__":
96
+ sys.exit(main())
integrations/claude_code/hooks/pre_session_inject.py ADDED
@@ -0,0 +1,93 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python3
2
+ """
3
+ Claude Code PreToolUse hook — MnemoCore context injection
4
+ ==========================================================
5
+ On the FIRST tool call of a session, queries MnemoCore for recent context
6
+ and writes it to a temporary file that is referenced from CLAUDE.md.
7
+
8
+ This gives Claude Code automatic memory of previous sessions WITHOUT
9
+ requiring any explicit user commands.
10
+
11
+ Configure in ~/.claude/settings.json:
12
+ {
13
+ "hooks": {
14
+ "PreToolUse": [
15
+ {
16
+ "matcher": ".*",
17
+ "hooks": [
18
+ {
19
+ "type": "command",
20
+ "command": "python /path/to/pre_session_inject.py"
21
+ }
22
+ ]
23
+ }
24
+ ]
25
+ }
26
+ }
27
+
28
+ The hook must exit 0 (allow) or 2 (block with message).
29
+ It never blocks — silently degrades if MnemoCore is offline.
30
+ """
31
+
32
+ import json
33
+ import os
34
+ import subprocess
35
+ import sys
36
+ import tempfile
37
+ from pathlib import Path
38
+
39
+ BRIDGE = Path(__file__).resolve().parents[2] / "mnemo_bridge.py"
40
+ CONTEXT_DIR = Path(os.getenv("MNEMOCORE_CONTEXT_DIR", Path.home() / ".claude" / "mnemo_context"))
41
+ DONE_FILE = CONTEXT_DIR / ".session_injected"
42
+
43
+
44
+ def main() -> int:
45
+ try:
46
+ raw = sys.stdin.read()
47
+ data = json.loads(raw) if raw.strip() else {}
48
+ except json.JSONDecodeError:
49
+ return 0
50
+
51
+ session_id = data.get("session_id", "")
52
+
53
+ # Only inject once per session
54
+ done_marker = CONTEXT_DIR / f".injected_{session_id[:16]}"
55
+ if done_marker.exists():
56
+ return 0
57
+
58
+ CONTEXT_DIR.mkdir(parents=True, exist_ok=True)
59
+
60
+ # Query MnemoCore for context
61
+ try:
62
+ result = subprocess.run(
63
+ [sys.executable, str(BRIDGE), "context", "--top-k", "8"],
64
+ capture_output=True,
65
+ text=True,
66
+ timeout=5,
67
+ env={**os.environ},
68
+ )
69
+ context_md = result.stdout.strip()
70
+ except (subprocess.TimeoutExpired, FileNotFoundError):
71
+ context_md = ""
72
+
73
+ if context_md:
74
+ context_file = CONTEXT_DIR / "latest_context.md"
75
+ context_file.write_text(context_md, encoding="utf-8")
76
+
77
+ # Mark session as injected
78
+ done_marker.touch()
79
+
80
+ # Output context as additional system information if available
81
+ if context_md:
82
+ # Claude Code hooks can output JSON to inject content
83
+ output = {
84
+ "type": "system_reminder",
85
+ "content": context_md,
86
+ }
87
+ print(json.dumps(output))
88
+
89
+ return 0
90
+
91
+
92
+ if __name__ == "__main__":
93
+ sys.exit(main())
integrations/claude_code/hooks_config_fragment.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_comment": "Merge this fragment into ~/.claude/settings.json under the 'hooks' key.",
3
+ "_note": "Replace MNEMOCORE_INTEGRATIONS_PATH with the absolute path to integrations/claude_code/hooks/",
4
+ "hooks": {
5
+ "PreToolUse": [
6
+ {
7
+ "matcher": ".*",
8
+ "hooks": [
9
+ {
10
+ "type": "command",
11
+ "command": "python MNEMOCORE_INTEGRATIONS_PATH/pre_session_inject.py"
12
+ }
13
+ ]
14
+ }
15
+ ],
16
+ "PostToolUse": [
17
+ {
18
+ "matcher": "Edit|Write|MultiEdit",
19
+ "hooks": [
20
+ {
21
+ "type": "command",
22
+ "command": "python MNEMOCORE_INTEGRATIONS_PATH/post_tool_store.py"
23
+ }
24
+ ]
25
+ }
26
+ ]
27
+ }
28
+ }
integrations/claude_code/mcp_config.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "mcpServers": {
3
+ "mnemocore": {
4
+ "command": "python",
5
+ "args": ["-m", "mnemocore.mcp.server"],
6
+ "cwd": "${MNEMOCORE_DIR}",
7
+ "env": {
8
+ "HAIM_API_KEY": "${HAIM_API_KEY}",
9
+ "PYTHONPATH": "${MNEMOCORE_DIR}/src"
10
+ }
11
+ }
12
+ }
13
+ }
integrations/gemini_cli/GEMINI_memory_snippet.md ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # MnemoCore — Persistent Cognitive Memory
2
+
3
+ You have access to a persistent memory system via the MnemoCore REST API at `$MNEMOCORE_URL` (default: `http://localhost:8100`).
4
+
5
+ ## Querying memory
6
+
7
+ To recall relevant context, call the API at the start of a task:
8
+
9
+ ```bash
10
+ curl -s -X POST "$MNEMOCORE_URL/query" \
11
+ -H "X-API-Key: $HAIM_API_KEY" \
12
+ -H "Content-Type: application/json" \
13
+ -d '{"query": "DESCRIBE_TASK_HERE", "top_k": 5}'
14
+ ```
15
+
16
+ ## Storing memory
17
+
18
+ After completing significant work, store a memory:
19
+
20
+ ```bash
21
+ curl -s -X POST "$MNEMOCORE_URL/store" \
22
+ -H "X-API-Key: $HAIM_API_KEY" \
23
+ -H "Content-Type: application/json" \
24
+ -d '{
25
+ "content": "WHAT_WAS_DONE_AND_WHY",
26
+ "metadata": {"source": "gemini-cli", "tags": ["relevant", "tags"]}
27
+ }'
28
+ ```
29
+
30
+ ## Guidelines
31
+
32
+ - **Query before starting** any non-trivial task on a known codebase
33
+ - **Store after completing** important changes, bug fixes, or design decisions
34
+ - **Do NOT store** trivial or ephemeral information
35
+ - Include relevant tags: language, component, type (bugfix/feature/refactor)
integrations/gemini_cli/gemini_wrap.sh ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env bash
2
+ # gemini_wrap.sh — MnemoCore context injector for Gemini CLI
3
+ # =============================================================
4
+ # Usage: ./gemini_wrap.sh [any gemini CLI args...]
5
+ #
6
+ # Fetches recent MnemoCore context and prepends it to the system prompt
7
+ # via a temporary file, then delegates to the real `gemini` binary.
8
+ #
9
+ # Environment variables:
10
+ # MNEMOCORE_URL MnemoCore REST URL (default: http://localhost:8100)
11
+ # HAIM_API_KEY API key for MnemoCore
12
+ # BRIDGE_PY Path to mnemo_bridge.py (auto-detected)
13
+ # GEMINI_BIN Path to gemini binary (default: gemini)
14
+
15
+ set -euo pipefail
16
+
17
+ SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
18
+ BRIDGE_PY="${BRIDGE_PY:-$(realpath "$SCRIPT_DIR/../mnemo_bridge.py")}"
19
+ GEMINI_BIN="${GEMINI_BIN:-gemini}"
20
+ MNEMOCORE_URL="${MNEMOCORE_URL:-http://localhost:8100}"
21
+
22
+ # ── Fetch context (silently degrade if offline) ────────────────────────────
23
+ CONTEXT=""
24
+ if python3 "$BRIDGE_PY" health &>/dev/null; then
25
+ CONTEXT="$(python3 "$BRIDGE_PY" context --top-k 6 2>/dev/null || true)"
26
+ fi
27
+
28
+ # ── Build the injected system prompt fragment ──────────────────────────────
29
+ if [[ -n "$CONTEXT" ]]; then
30
+ MEMORY_FILE="$(mktemp /tmp/mnemo_context_XXXXXX.md)"
31
+ trap 'rm -f "$MEMORY_FILE"' EXIT
32
+
33
+ cat > "$MEMORY_FILE" <<'HEREDOC'
34
+ ## Persistent Memory Context (from MnemoCore)
35
+
36
+ The following is relevant context from your memory of previous sessions.
37
+ Use it to avoid re-discovering known patterns, bugs, and decisions.
38
+
39
+ HEREDOC
40
+ echo "$CONTEXT" >> "$MEMORY_FILE"
41
+
42
+ # Gemini CLI supports --system-prompt-file or similar flags.
43
+ # Adjust this to match the actual Gemini CLI interface.
44
+ exec "$GEMINI_BIN" --system-prompt-file "$MEMORY_FILE" "$@"
45
+ else
46
+ exec "$GEMINI_BIN" "$@"
47
+ fi
integrations/mnemo_bridge.py ADDED
@@ -0,0 +1,177 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python3
2
+ """
3
+ MnemoCore Bridge — Universal CLI
4
+ =================================
5
+ Lightweight bridge between MnemoCore REST API and any AI CLI tool.
6
+ No heavy dependencies: only stdlib + requests.
7
+
8
+ Usage:
9
+ python mnemo_bridge.py context [--query TEXT] [--top-k 5] [--ctx CTX_ID]
10
+ python mnemo_bridge.py store TEXT [--source SOURCE] [--tags TAG1,TAG2] [--ctx CTX_ID]
11
+ python mnemo_bridge.py health
12
+
13
+ Environment variables:
14
+ MNEMOCORE_URL Base URL of MnemoCore API (default: http://localhost:8100)
15
+ MNEMOCORE_API_KEY API key (same as HAIM_API_KEY)
16
+ """
17
+
18
+ import argparse
19
+ import json
20
+ import os
21
+ import sys
22
+ from typing import Any, Dict, List, Optional
23
+
24
+ try:
25
+ import requests
26
+ except ImportError:
27
+ print("ERROR: 'requests' package required. Run: pip install requests", file=sys.stderr)
28
+ sys.exit(1)
29
+
30
# ── Config ────────────────────────────────────────────────────────────────────
# Read once at import time; restart the bridge to pick up environment changes.
BASE_URL = os.getenv("MNEMOCORE_URL", "http://localhost:8100").rstrip("/")
# MNEMOCORE_API_KEY takes precedence; HAIM_API_KEY kept for compatibility
# with the server-side variable name.
API_KEY = os.getenv("MNEMOCORE_API_KEY") or os.getenv("HAIM_API_KEY", "")
TIMEOUT = int(os.getenv("MNEMOCORE_TIMEOUT", "5"))  # seconds, per request

HEADERS = {"X-API-Key": API_KEY, "Content-Type": "application/json"}
36
+
37
+
38
+ # ── API helpers ───────────────────────────────────────────────────────────────
39
+
40
def _get(path: str) -> Optional[Dict]:
    """GET ``BASE_URL + path``; return parsed JSON, or None on failure.

    Returns None instead of raising so callers (and the shell wrappers that
    invoke this bridge) can degrade gracefully when MnemoCore is offline.
    """
    try:
        r = requests.get(f"{BASE_URL}{path}", headers=HEADERS, timeout=TIMEOUT)
        r.raise_for_status()
        return r.json()
    except requests.ConnectionError:
        # Server unreachable — silent: callers treat None as "offline".
        return None
    except requests.HTTPError as e:
        print(f"HTTP error: {e}", file=sys.stderr)
        return None
    except requests.RequestException as e:
        # FIX: timeouts and other transport errors previously escaped and
        # crashed the calling wrapper scripts; degrade to None instead.
        print(f"Request error: {e}", file=sys.stderr)
        return None
    except ValueError as e:
        # FIX: response body was not valid JSON (JSONDecodeError subclasses
        # ValueError).
        print(f"Invalid JSON response: {e}", file=sys.stderr)
        return None
50
+
51
+
52
def _post(path: str, payload: Dict) -> Optional[Dict]:
    """POST ``payload`` as JSON to ``BASE_URL + path``; None on failure.

    Mirrors :func:`_get`: never raises, so offline MnemoCore cannot break
    the tool that embeds this bridge.
    """
    try:
        r = requests.post(f"{BASE_URL}{path}", headers=HEADERS,
                          json=payload, timeout=TIMEOUT)
        r.raise_for_status()
        return r.json()
    except requests.ConnectionError:
        # Server unreachable — silent: callers treat None as "offline".
        return None
    except requests.HTTPError as e:
        print(f"HTTP error: {e}", file=sys.stderr)
        return None
    except requests.RequestException as e:
        # FIX: timeouts and other transport errors previously escaped and
        # crashed the calling wrapper scripts; degrade to None instead.
        print(f"Request error: {e}", file=sys.stderr)
        return None
    except ValueError as e:
        # FIX: response body was not valid JSON.
        print(f"Invalid JSON response: {e}", file=sys.stderr)
        return None
63
+
64
+
65
+ # ── Commands ──────────────────────────────────────────────────────────────────
66
+
67
def cmd_health() -> int:
    """Report MnemoCore connectivity; exit code 0 iff status is 'ok'."""
    payload = _get("/health")
    if payload is None:
        print("MnemoCore is OFFLINE (could not connect)", file=sys.stderr)
        return 1
    reported = payload.get("status", "unknown")
    print(f"MnemoCore status: {reported}")
    if reported == "ok":
        return 0
    return 1
75
+
76
+
77
def cmd_store(text: str, source: str, tags: List[str], ctx: Optional[str]) -> int:
    """Persist one memory via POST /store; return a process exit code."""
    meta: Dict[str, Any] = {"source": source}
    if tags:
        meta["tags"] = tags

    body: Dict[str, Any] = {"content": text, "metadata": meta}
    if ctx:
        # Context/project id maps onto the server's agent namespace.
        body["agent_id"] = ctx

    response = _post("/store", body)
    if response is None:
        print("Failed to store memory (MnemoCore offline or error)", file=sys.stderr)
        return 1

    # The API has used both "id" and "memory_id" field names.
    memory_id = response.get("id") or response.get("memory_id", "?")
    print(f"Stored: {memory_id}")
    return 0
94
+
95
+
96
def cmd_context(query: Optional[str], top_k: int, ctx: Optional[str]) -> int:
    """
    Query MnemoCore and emit matching memories as a markdown fragment
    suitable for injection into any AI tool's system prompt.

    Prints nothing (and still exits 0) when the server is offline or the
    query has no hits, so wrapping tools start up undisturbed.
    """
    body: Dict[str, Any] = {
        "query": query or "recent work context decisions bugs fixes",
        "top_k": top_k,
    }
    if ctx:
        body["agent_id"] = ctx

    response = _post("/query", body)
    if response is None:
        # Silently return empty — don't break the calling tool's startup.
        return 0

    hits: List[Dict] = response.get("results", [])
    if not hits:
        return 0

    out = [
        "<!-- MnemoCore: Persistent Memory Context -->",
        "## Relevant memory from previous sessions\n",
    ]
    for hit in hits:
        meta = hit.get("metadata", {})
        labels = meta.get("tags", [])
        tag_str = f" [{', '.join(labels)}]" if labels else ""
        source = meta.get("source", "unknown")
        score = hit.get("score", 0.0)
        content = hit.get("content", "").strip()
        out.append(f"- **[{source}{tag_str}]** (relevance {score:.2f}): {content}")

    out.append("\n<!-- End MnemoCore Context -->")
    print("\n".join(out))
    return 0
134
+
135
+
136
+ # ── Entry point ───────────────────────────────────────────────────────────────
137
+
138
def main() -> int:
    """Parse CLI arguments and dispatch to the matching command handler."""
    parser = argparse.ArgumentParser(
        description="MnemoCore universal CLI bridge",
        formatter_class=argparse.RawDescriptionHelpFormatter,
    )
    sub = parser.add_subparsers(dest="cmd", required=True)

    # health — no extra options
    sub.add_parser("health", help="Check MnemoCore connectivity")

    # store — positional content plus optional labels
    store_parser = sub.add_parser("store", help="Store a memory")
    store_parser.add_argument("text", help="Memory content")
    store_parser.add_argument("--source", default="cli", help="Source label")
    store_parser.add_argument("--tags", default="", help="Comma-separated tags")
    store_parser.add_argument("--ctx", default=None, help="Context/project ID")

    # context — semantic retrieval options
    context_parser = sub.add_parser("context", help="Fetch context as markdown")
    context_parser.add_argument("--query", default=None, help="Semantic query string")
    context_parser.add_argument("--top-k", type=int, default=5, help="Number of results")
    context_parser.add_argument("--ctx", default=None, help="Context/project ID")

    args = parser.parse_args()

    if args.cmd == "health":
        return cmd_health()
    if args.cmd == "store":
        # Split and drop empty fragments ("a,,b" -> ["a", "b"]).
        parsed_tags = [t.strip() for t in args.tags.split(",") if t.strip()]
        return cmd_store(args.text, args.source, parsed_tags, args.ctx)
    if args.cmd == "context":
        return cmd_context(args.query, args.top_k, args.ctx)
    return 1
174
+
175
+
176
# Script entry point — propagate the command's exit status to the shell.
if __name__ == "__main__":
    sys.exit(main())
integrations/setup.ps1 ADDED
@@ -0,0 +1,158 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
# MnemoCore Integration Setup — Windows PowerShell
# =================================================
# One-command setup for Claude Code (MCP) on Windows.
# For full hook/wrapper support, use WSL or Git Bash.
#
# Usage:
#   .\setup.ps1
#   .\setup.ps1 -All
#   .\setup.ps1 -ClaudeCode
#
# NOTE(review): uses the '??' null-coalescing operator below, which requires
# PowerShell 7+ — confirm the target shell is not Windows PowerShell 5.1.

# -Gemini and -Aider are accepted for symmetry with setup.sh but no handler
# consumes them below (only Claude Code setup is implemented on Windows).
param(
    [switch]$All,
    [switch]$ClaudeCode,
    [switch]$Gemini,
    [switch]$Aider
)

# Fail fast: any cmdlet error aborts the script.
$ErrorActionPreference = "Stop"

# Resolve key paths relative to this script's location.
$ScriptDir = Split-Path -Parent $MyInvocation.MyCommand.Path
$MnemoDir = Split-Path -Parent $ScriptDir            # repository root
$BridgePy = Join-Path $ScriptDir "mnemo_bridge.py"   # universal REST bridge
$ClaudeHome = Join-Path $env:USERPROFILE ".claude"
$ClaudeMcp = Join-Path $ClaudeHome "mcp.json"             # MCP server registry
$ClaudeSettings = Join-Path $ClaudeHome "settings.json"   # hooks config
$HooksDir = Join-Path $ScriptDir "claude_code\hooks"

# Colored log helpers; $args expands to the positional message.
function Write-Info { Write-Host "[INFO] $args" -ForegroundColor Cyan }
function Write-Success { Write-Host "[OK] $args" -ForegroundColor Green }
function Write-Warn { Write-Host "[WARN] $args" -ForegroundColor Yellow }
function Write-Err { Write-Host "[ERROR] $args" -ForegroundColor Red }

# ── Prerequisite checks ────────────────────────────────────────────────────

Write-Info "Checking Python requests..."
# NOTE(review): with 2>&1 the capture may be an ErrorRecord/array rather than
# the string "ok" when import fails; -ne "ok" still triggers the install
# branch in that case, which is the intended outcome.
$requestsCheck = python -c "import requests; print('ok')" 2>&1
if ($requestsCheck -ne "ok") {
    Write-Warn "Installing requests..."
    python -m pip install --quiet requests
}
Write-Success "Python requests available"

Write-Info "Checking MnemoCore connectivity..."
$healthCheck = python "$BridgePy" health 2>&1
if ($LASTEXITCODE -eq 0) {
    Write-Success "MnemoCore is online"
} else {
    # Non-fatal: setup proceeds; integrations degrade gracefully offline.
    Write-Warn "MnemoCore offline — start it first:"
    Write-Warn " cd $MnemoDir"
    Write-Warn " uvicorn mnemocore.api.main:app --port 8100"
}

# ── Claude Code MCP Setup ─────────────────────────────────────────────────

function Setup-ClaudeCode {
    Write-Info "Setting up Claude Code integration..."

    # Ensure ~/.claude and the context cache directory exist.
    if (-not (Test-Path $ClaudeHome)) { New-Item -ItemType Directory -Path $ClaudeHome | Out-Null }
    New-Item -ItemType Directory -Path (Join-Path $ClaudeHome "mnemo_context") -Force | Out-Null

    # MCP config: substitute template placeholders, then merge into mcp.json.
    # Forward slashes keep the substituted path valid JSON without escaping.
    $McpTemplate = Get-Content (Join-Path $ScriptDir "claude_code\mcp_config.json") -Raw
    $McpTemplate = $McpTemplate `
        -replace '\$\{MNEMOCORE_DIR\}', $MnemoDir.Replace('\', '/') `
        -replace '\$\{HAIM_API_KEY\}', ($env:HAIM_API_KEY ?? '')

    if (-not (Test-Path $ClaudeMcp)) {
        '{"mcpServers":{}}' | Set-Content $ClaudeMcp
    }

    # Merge (not overwrite): -Force makes re-running this setup idempotent
    # while preserving any other MCP servers the user already registered.
    $Existing = Get-Content $ClaudeMcp -Raw | ConvertFrom-Json
    $New = $McpTemplate | ConvertFrom-Json
    if (-not $Existing.mcpServers) { $Existing | Add-Member -MemberType NoteProperty -Name mcpServers -Value @{} }
    $New.mcpServers.PSObject.Properties | ForEach-Object {
        $Existing.mcpServers | Add-Member -MemberType NoteProperty -Name $_.Name -Value $_.Value -Force
    }
    $Existing | ConvertTo-Json -Depth 10 | Set-Content $ClaudeMcp
    Write-Success "MCP server registered in $ClaudeMcp"

    # Hooks: append our pre/post tool hooks to settings.json, once.
    if (-not (Test-Path $ClaudeSettings)) { '{}' | Set-Content $ClaudeSettings }
    $Settings = Get-Content $ClaudeSettings -Raw | ConvertFrom-Json

    if (-not $Settings.hooks) {
        $Settings | Add-Member -MemberType NoteProperty -Name hooks -Value @{}
    }
    $hooksObj = $Settings.hooks

    # Embedded quotes protect paths with spaces; forward slashes avoid JSON
    # backslash-escaping issues.
    $preCmd = "python `"$($HooksDir.Replace('\','/'))/pre_session_inject.py`""
    $postCmd = "python `"$($HooksDir.Replace('\','/'))/post_tool_store.py`""

    if (-not $hooksObj.PreToolUse) {
        $hooksObj | Add-Member -MemberType NoteProperty -Name PreToolUse -Value @()
    }
    if (-not $hooksObj.PostToolUse) {
        $hooksObj | Add-Member -MemberType NoteProperty -Name PostToolUse -Value @()
    }

    # De-duplicate on the hook command string so reruns don't stack hooks.
    $existingPre = $hooksObj.PreToolUse | ForEach-Object { $_.hooks[0].command }
    if ($preCmd -notin $existingPre) {
        $hooksObj.PreToolUse += @{matcher=".*"; hooks=@(@{type="command"; command=$preCmd})}
    }
    $existingPost = $hooksObj.PostToolUse | ForEach-Object { $_.hooks[0].command }
    if ($postCmd -notin $existingPost) {
        $hooksObj.PostToolUse += @{matcher="Edit|Write|MultiEdit"; hooks=@(@{type="command"; command=$postCmd})}
    }

    $Settings | ConvertTo-Json -Depth 10 | Set-Content $ClaudeSettings
    Write-Success "Hooks installed in $ClaudeSettings"

    # CLAUDE.md snippet — appended at most once, guarded by a marker heading.
    $ClaudeMd = Join-Path $MnemoDir "CLAUDE.md"
    $Snippet = Get-Content (Join-Path $ScriptDir "claude_code\CLAUDE_memory_snippet.md") -Raw
    $Marker = "# MnemoCore — Persistent Cognitive Memory"
    if (Test-Path $ClaudeMd) {
        $Current = Get-Content $ClaudeMd -Raw
        if ($Current -notlike "*$Marker*") {
            Add-Content $ClaudeMd "`n$Snippet"
            Write-Success "Memory instructions appended to CLAUDE.md"
        } else {
            Write-Info "CLAUDE.md already contains MnemoCore instructions"
        }
    } else {
        $Snippet | Set-Content $ClaudeMd
        Write-Success "Created CLAUDE.md with memory instructions"
    }

    Write-Success "Claude Code integration complete"
}

# ── Main ───────────────────────────────────────────────────────────────────

Write-Host ""
Write-Host "╔══════════════════════════════════════════╗" -ForegroundColor Magenta
Write-Host "║ MnemoCore Integration Setup (Win) ║" -ForegroundColor Magenta
Write-Host "╚══════════════════════════════════════════╝" -ForegroundColor Magenta
Write-Host ""

# No switch given → interactive menu. Only options 1 and 4 exist because
# Gemini/Aider setup is bash-only for now (see header).
if (-not ($All -or $ClaudeCode -or $Gemini -or $Aider)) {
    Write-Host "Choose integrations:"
    Write-Host " 1) Claude Code (MCP + hooks + CLAUDE.md) — recommended"
    Write-Host " 4) All"
    $choice = Read-Host "Enter choice"
    switch ($choice) {
        "1" { $ClaudeCode = $true }
        "4" { $All = $true }
    }
}

if ($All -or $ClaudeCode) { Setup-ClaudeCode }

Write-Host ""
Write-Host "╔══════════════════════════════════════════╗" -ForegroundColor Green
Write-Host "║ Setup complete! ║" -ForegroundColor Green
Write-Host "║ ║" -ForegroundColor Green
Write-Host "║ Test: python integrations/mnemo_bridge.py health" -ForegroundColor Green
Write-Host "╚══════════════════════════════════════════╝" -ForegroundColor Green
Write-Host ""
@@ -0,0 +1,299 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
#!/usr/bin/env bash
# MnemoCore Integration Setup
# ============================
# One-command setup for Claude Code, Gemini CLI, Aider, and universal tools.
#
# Usage:
#   ./setup.sh                # Interactive, choose integrations
#   ./setup.sh --all          # Enable all integrations
#   ./setup.sh --claude-code  # Claude Code only
#   ./setup.sh --gemini       # Gemini CLI only
#   ./setup.sh --aider        # Aider only
#
# Prerequisites:
#   - Python 3.10+ with 'requests' package
#   - MnemoCore running (uvicorn mnemocore.api.main:app --port 8100)
#   - HAIM_API_KEY environment variable set

set -euo pipefail

# Paths resolved relative to this script so it works from any CWD.
SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
MNEMOCORE_DIR="$(realpath "$SCRIPT_DIR/..")"   # repository root
BRIDGE_PY="$SCRIPT_DIR/mnemo_bridge.py"        # universal REST bridge
HOOKS_DIR="$SCRIPT_DIR/claude_code/hooks"

# Claude Code user-level config files.
CLAUDE_SETTINGS="$HOME/.claude/settings.json"
CLAUDE_MCP="$HOME/.claude/mcp.json"

# ANSI color codes for the log helpers below.
RED='\033[0;31m'
GREEN='\033[0;32m'
YELLOW='\033[1;33m'
BLUE='\033[0;34m'
NC='\033[0m'

# ── Helpers ────────────────────────────────────────────────────────────────

# Colored, prefixed log lines; error() writes to stderr.
info() { echo -e "${BLUE}[INFO]${NC} $*"; }
success() { echo -e "${GREEN}[OK]${NC} $*"; }
warn() { echo -e "${YELLOW}[WARN]${NC} $*"; }
error() { echo -e "${RED}[ERROR]${NC} $*" >&2; }
40
+
41
check_python() {
    # Ensure the Python 'requests' package is importable; install on demand.
    python3 -c "import requests" &>/dev/null && return 0
    warn "Python 'requests' not installed. Installing..."
    python3 -m pip install --quiet requests
    success "requests installed"
}
48
+
49
check_mnemocore() {
    # Probe the REST API through the bridge; success path returns early.
    info "Checking MnemoCore connectivity..."
    if python3 "$BRIDGE_PY" health &>/dev/null; then
        success "MnemoCore is online"
        return 0
    fi
    warn "MnemoCore is not running. Start it first with:"
    warn " cd $MNEMOCORE_DIR && uvicorn mnemocore.api.main:app --port 8100"
    return 1
}
60
+
61
merge_json() {
    # Merge the JSON object in file $2 into file $1 (creating $1 if missing).
    # One-level-deep merge: nested dicts are update()d, everything else is
    # replaced. Fragment keys starting with "_" are skipped (comment keys).
    local target="$1"
    local fragment="$2"

    if [[ ! -f "$target" ]]; then
        echo '{}' > "$target"
    fi

    # FIX: pass paths as argv with a quoted heredoc instead of interpolating
    # "$target"/"$fragment" into the Python source — the old unquoted heredoc
    # broke (and allowed code injection) on paths containing quotes or '$'.
    # This also matches the style already used in setup_claude_code.
    python3 - "$target" "$fragment" <<'PYEOF'
import json, sys
target, fragment = sys.argv[1], sys.argv[2]
with open(target) as f:
    existing = json.load(f)
with open(fragment) as f:
    new = json.load(f)
# Deep merge (one level)
for k, v in new.items():
    if k.startswith("_"):
        continue
    if k in existing and isinstance(existing[k], dict) and isinstance(v, dict):
        existing[k].update(v)
    else:
        existing[k] = v
with open(target, "w") as f:
    json.dump(existing, f, indent=2)
print("Merged successfully")
PYEOF
}
89
+
90
+ # ── Integration: Claude Code ───────────────────────────────────────────────
91
+
92
setup_claude_code() {
    info "Setting up Claude Code integration..."
    mkdir -p "$HOME/.claude/mnemo_context"

    # 1. MCP Server — fill template placeholders, merge into ~/.claude/mcp.json
    info "  Configuring MCP server..."
    local mcp_tmp
    mcp_tmp="$(mktemp /tmp/mnemo_mcp_XXXXXX.json)"
    # sed substitutes the ${...} placeholders left in the template file.
    sed \
        -e "s|\${MNEMOCORE_DIR}|$MNEMOCORE_DIR|g" \
        -e "s|\${HAIM_API_KEY}|${HAIM_API_KEY:-}|g" \
        "$SCRIPT_DIR/claude_code/mcp_config.json" > "$mcp_tmp"

    if [[ ! -f "$CLAUDE_MCP" ]]; then
        echo '{"mcpServers": {}}' > "$CLAUDE_MCP"
    fi

    # Merge (not overwrite) so other MCP servers already in the file survive.
    python3 - "$CLAUDE_MCP" "$mcp_tmp" <<'PYEOF'
import json, sys
with open(sys.argv[1]) as f:
    existing = json.load(f)
with open(sys.argv[2]) as f:
    new = json.load(f)
existing.setdefault("mcpServers", {}).update(new.get("mcpServers", {}))
with open(sys.argv[1], "w") as f:
    json.dump(existing, f, indent=2)
PYEOF
    rm -f "$mcp_tmp"
    success "  MCP server registered in $CLAUDE_MCP"

    # 2. Hooks — idempotently append pre/post tool hooks to settings.json.
    info "  Installing hooks in $CLAUDE_SETTINGS..."
    if [[ ! -f "$CLAUDE_SETTINGS" ]]; then
        echo '{}' > "$CLAUDE_SETTINGS"
    fi

    # NOTE(review): unquoted heredoc delimiter — the shell would expand any
    # '$' inside this Python block; safe today only because it contains none.
    python3 - "$CLAUDE_SETTINGS" "$HOOKS_DIR" <<PYEOF
import json, sys
settings_path = sys.argv[1]
hooks_dir = sys.argv[2]
with open(settings_path) as f:
    settings = json.load(f)

hooks = settings.setdefault("hooks", {})
pre = hooks.setdefault("PreToolUse", [])
post = hooks.setdefault("PostToolUse", [])

pre_hook = {
    "matcher": ".*",
    "hooks": [{"type": "command", "command": f"python3 {hooks_dir}/pre_session_inject.py"}]
}
post_hook = {
    "matcher": "Edit|Write|MultiEdit",
    "hooks": [{"type": "command", "command": f"python3 {hooks_dir}/post_tool_store.py"}]
}

# Only add if not already present
pre_cmds = [h["hooks"][0]["command"] for h in pre if h.get("hooks")]
post_cmds = [h["hooks"][0]["command"] for h in post if h.get("hooks")]

if pre_hook["hooks"][0]["command"] not in pre_cmds:
    pre.append(pre_hook)
if post_hook["hooks"][0]["command"] not in post_cmds:
    post.append(post_hook)

with open(settings_path, "w") as f:
    json.dump(settings, f, indent=2)
print("Hooks installed")
PYEOF
    success "  Hooks installed in $CLAUDE_SETTINGS"

    # 3. CLAUDE.md snippet — append once, guarded by a marker heading.
    local clause_md="$MNEMOCORE_DIR/CLAUDE.md"
    local snippet="$SCRIPT_DIR/claude_code/CLAUDE_memory_snippet.md"
    local marker="# MnemoCore — Persistent Cognitive Memory"
    if [[ -f "$clause_md" ]] && grep -qF "$marker" "$clause_md"; then
        info "  CLAUDE.md already contains MnemoCore memory instructions"
    else
        # Appending to a missing file creates it, so both cases are covered.
        echo "" >> "$clause_md"
        cat "$snippet" >> "$clause_md"
        success "  Memory instructions appended to $clause_md"
    fi

    success "Claude Code integration complete"
}
177
+
178
+ # ── Integration: Gemini CLI ────────────────────────────────────────────────
179
+
180
setup_gemini() {
    info "Setting up Gemini CLI integration..."

    # Make wrapper executable
    chmod +x "$SCRIPT_DIR/gemini_cli/gemini_wrap.sh"

    # GEMINI.md handling has three cases: marker already present (no-op),
    # file exists without marker (append), file missing (copy snippet).
    local gemini_md="$MNEMOCORE_DIR/GEMINI.md"
    local snippet="$SCRIPT_DIR/gemini_cli/GEMINI_memory_snippet.md"
    local marker="# MnemoCore — Persistent Cognitive Memory"
    if [[ -f "$gemini_md" ]] && grep -qF "$marker" "$gemini_md"; then
        info "  GEMINI.md already contains MnemoCore instructions"
    elif [[ -f "$gemini_md" ]]; then
        echo "" >> "$gemini_md"
        cat "$snippet" >> "$gemini_md"
        success "  Memory instructions appended to $gemini_md"
    else
        cp "$snippet" "$gemini_md"
        success "  Created $gemini_md with memory instructions"
    fi

    success "Gemini CLI integration complete"
    info "  Use: $SCRIPT_DIR/gemini_cli/gemini_wrap.sh [args] instead of 'gemini'"
    info "  Or alias: alias gemini='$SCRIPT_DIR/gemini_cli/gemini_wrap.sh'"
}
+
206
+ # ── Integration: Aider ─────────────────────────────────────────────────────
207
+
208
setup_aider() {
    info "Setting up Aider integration..."
    chmod +x "$SCRIPT_DIR/aider/aider_wrap.sh"

    # Write a sourceable env fragment for the aider wrapper. Values are
    # captured from the *current* environment at setup time (unquoted
    # heredoc expands the ${...:-} defaults here, not when sourced).
    local aider_env="$MNEMOCORE_DIR/.aider.env"
    cat > "$aider_env" <<EOF
# MnemoCore environment for Aider
export MNEMOCORE_URL="${MNEMOCORE_URL:-http://localhost:8100}"
export HAIM_API_KEY="${HAIM_API_KEY:-}"
export BRIDGE_PY="$BRIDGE_PY"
EOF
    success "Aider integration complete"
    info "  Use: $SCRIPT_DIR/aider/aider_wrap.sh [args] instead of 'aider'"
    info "  Or alias: alias aider='$SCRIPT_DIR/aider/aider_wrap.sh'"
}
+
225
+ # ── Integration: Universal scripts ─────────────────────────────────────────
226
+
227
setup_universal() {
    # Always-on plain-shell helpers usable with any AI tool.
    local udir="$SCRIPT_DIR/universal"
    chmod +x "$udir/context_inject.sh" "$udir/store_session.sh"
    success "Universal scripts ready"
    info "  Context: $udir/context_inject.sh [query] [top-k]"
    info "  Store:   $udir/store_session.sh [text] [tags] [ctx]"
}
234
+
235
# ── Main ───────────────────────────────────────────────────────────────────

echo ""
echo "╔══════════════════════════════════════════════════════╗"
echo "║          MnemoCore Integration Setup                 ║"
echo "╚══════════════════════════════════════════════════════╝"
echo ""

# Check prerequisites
check_python
check_mnemocore || true  # Non-fatal — offline check is a warning

# Selection flags; enabled by CLI args or the interactive menu below.
DO_ALL=false
DO_CLAUDE=false
DO_GEMINI=false
DO_AIDER=false

for arg in "$@"; do
    case "$arg" in
        --all) DO_ALL=true ;;
        --claude-code) DO_CLAUDE=true ;;
        --gemini) DO_GEMINI=true ;;
        --aider) DO_AIDER=true ;;
    esac
done

# No flags given → ask interactively; multiple space-separated choices OK.
if ! $DO_ALL && ! $DO_CLAUDE && ! $DO_GEMINI && ! $DO_AIDER; then
    echo "Which integrations do you want to enable?"
    echo "  1) Claude Code   (MCP + hooks + CLAUDE.md)"
    echo "  2) Gemini CLI    (GEMINI.md + wrapper)"
    echo "  3) Aider         (wrapper script)"
    echo "  4) All of the above"
    echo ""
    read -rp "Enter choice(s) [e.g. 1 3 or 4]: " CHOICES

    # CHOICES is intentionally unquoted so each token is handled separately.
    for c in $CHOICES; do
        case "$c" in
            1) DO_CLAUDE=true ;;
            2) DO_GEMINI=true ;;
            3) DO_AIDER=true ;;
            4) DO_ALL=true ;;
        esac
    done
fi

if $DO_ALL; then
    DO_CLAUDE=true; DO_GEMINI=true; DO_AIDER=true
fi

echo ""
# Universal helper scripts are always installed.
setup_universal

# `false && cmd` does not trip `set -e` here: the failing command precedes
# the `&&`, which bash exempts from errexit.
$DO_CLAUDE && setup_claude_code
$DO_GEMINI && setup_gemini
$DO_AIDER && setup_aider

echo ""
echo "╔══════════════════════════════════════════════════════╗"
echo "║  Setup complete! Quick start:                        ║"
echo "║                                                      ║"
echo "║  Test bridge:   python3 integrations/mnemo_bridge.py health"
echo "║  Get context:   integrations/universal/context_inject.sh"
echo "║  Store memory:  integrations/universal/store_session.sh"
echo "╚══════════════════════════════════════════════════════╝"
echo ""
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
#!/usr/bin/env bash
# context_inject.sh — Universal MnemoCore context provider
# =========================================================
# Outputs MnemoCore memory context as plain text/markdown.
# Pipe or include the output into any tool that accepts system prompts.
#
# Usage:
#   ./context_inject.sh                    # General context
#   ./context_inject.sh "bug fix async"    # Focused query
#   ./context_inject.sh "" 10              # Top-10 results
#
# Examples:
#   codex --system "$(./context_inject.sh)" ...
#   openai-cli --system-prompt "$(./context_inject.sh 'auth')"

set -euo pipefail

SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
BRIDGE_PY="${BRIDGE_PY:-$(realpath "$SCRIPT_DIR/../mnemo_bridge.py")}"

QUERY="${1:-}"
TOP_K="${2:-6}"

# Assemble the bridge invocation as an array; --query only when given.
CMD=(python3 "$BRIDGE_PY" context --top-k "$TOP_K")
if [[ -n "$QUERY" ]]; then
    CMD+=(--query "$QUERY")
fi

# Never fail the caller — an offline MnemoCore just yields empty output.
"${CMD[@]}" 2>/dev/null || true
integrations/universal/store_session.sh ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
#!/usr/bin/env bash
# store_session.sh — Store session outcomes into MnemoCore
# =========================================================
# Call this at the end of an AI coding session to persist key findings.
#
# Usage (interactive):
#   ./store_session.sh
#
# Usage (non-interactive / scripted):
#   ./store_session.sh "Fixed race condition in tier_manager.py" "bugfix,async" "my-project"

set -euo pipefail

SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
BRIDGE_PY="${BRIDGE_PY:-$(realpath "$SCRIPT_DIR/../mnemo_bridge.py")}"

# Positional args win; otherwise prompt the user for each field.
if [[ $# -ge 1 ]]; then
    CONTENT="$1"
    TAGS="${2:-cli}"
    CTX="${3:-}"
else
    echo "Enter memory content (what was done/decided/fixed):"
    read -r CONTENT
    echo "Tags (comma-separated, e.g. bugfix,python,auth):"
    read -r TAGS
    echo "Context/project ID (optional, press Enter to skip):"
    read -r CTX
fi

# Empty content is not an error — just nothing to persist.
if [[ -z "$CONTENT" ]]; then
    echo "No content provided, nothing stored." >&2
    exit 0
fi

STORE_ARGS=(store "$CONTENT" --source "manual-session" --tags "$TAGS")
if [[ -n "$CTX" ]]; then
    STORE_ARGS+=(--ctx "$CTX")
fi

python3 "$BRIDGE_PY" "${STORE_ARGS[@]}"
mnemocore_verify.py ADDED
@@ -0,0 +1,136 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import asyncio
2
+ import os
3
+ import shutil
4
+ import pytest
5
+ from pathlib import Path
6
+ import numpy as np
7
+
8
+ # Set dummy test config environment
9
+ os.environ["HAIM_API_KEY"] = "test-key"
10
+
11
+ from mnemocore.core.config import HAIMConfig, PathsConfig, TierConfig
12
+ from mnemocore.core.binary_hdv import TextEncoder, BinaryHDV
13
+ from mnemocore.core.hnsw_index import HNSWIndexManager
14
+ from mnemocore.core.engine import HAIMEngine
15
+ from mnemocore.core.tier_manager import TierManager
16
+ from unittest.mock import patch
17
+
18
@pytest.fixture(autouse=True)
def setup_test_env():
    # Force all components to use test_data_verify as their data dir
    # to prevent polluting/reading the user's real ./data folder
    test_dir = Path("./test_data_verify")
    test_dir.mkdir(exist_ok=True)

    # Minimal config whose every path points into the sandbox directory.
    cfg = HAIMConfig(
        paths=PathsConfig(
            data_dir=str(test_dir),
            warm_mmap_dir=str(test_dir / "warm"),
            cold_archive_dir=str(test_dir / "cold")
        )
    )

    # Patch get_config at each import site (config, hnsw_index, engine) so
    # modules that bound the name at import time still see the sandbox config.
    with patch('mnemocore.core.config.get_config', return_value=cfg), \
         patch('mnemocore.core.hnsw_index.get_config', return_value=cfg), \
         patch('mnemocore.core.engine.get_config', return_value=cfg):
        yield cfg

    # Teardown: remove the sandbox after the patches are unwound.
    if test_dir.exists():
        shutil.rmtree(test_dir)
40
+
41
+
42
def test_text_encoder_normalization():
    """Verify BUG-02: Text normalization fixes identical string variances.

    Two texts differing only in case and punctuation must encode to the
    same hypervector.
    """
    # FIX: was an `async def` with @pytest.mark.asyncio but contained no
    # await — a plain sync test is equivalent and drops the needless
    # dependency on the asyncio plugin for this case.
    encoder = TextEncoder(dimension=1024)
    hdv1 = encoder.encode("Hello World")
    hdv2 = encoder.encode("hello, world!")

    assert (hdv1.data == hdv2.data).all(), "Normalization failed: Different HDVs for identical texts"
50
+
51
def test_hnsw_singleton():
    """Verify BUG-08: HNSWIndexManager is a thread-safe singleton"""
    # Reset the cached instance so construction actually runs for this test.
    HNSWIndexManager._instance = None
    first = HNSWIndexManager(dimension=1024)
    second = HNSWIndexManager(dimension=1024)
    # Identity (not mere equality): both constructions yield one object.
    assert first is second, "HNSWIndexManager is not a singleton"
57
+
58
def test_hnsw_index_add_search():
    """Verify BUG-01 & BUG-03: Vector cache lost / Position mapping"""
    # Fresh singleton so earlier tests can't leak index state in here.
    HNSWIndexManager._instance = None
    index = HNSWIndexManager(dimension=1024)

    # Optional cleanup if it's reused
    index._id_map = []
    index._vector_store = []
    if index._index:
        index._index.reset()

    first_vec = BinaryHDV.random(1024)
    second_vec = BinaryHDV.random(1024)
    index.add("test_node_1", first_vec.data)
    index.add("test_node_2", second_vec.data)

    assert "test_node_1" in index._id_map, "ID Map does not contain node 1"
    assert "test_node_2" in index._id_map, "ID Map does not contain node 2"

    # Searching with the exact stored vector must rank its own id first.
    res = index.search(first_vec.data, top_k=1)
    assert res[0][0] == "test_node_1", f"Incorrect search return: {res}"
81
+
82
@pytest.mark.asyncio
async def test_agent_isolation():
    """Verify BUG-09: Agent namespace isolation via engine and tier manager"""
    # Reset the index singleton so this test builds its own index.
    HNSWIndexManager._instance = None

    test_data_dir = Path("./test_data_verify")
    test_data_dir.mkdir(exist_ok=True)

    # qdrant=None → we run purely local/in-memory for this unit test.
    config = HAIMConfig(
        qdrant=None,
        paths=PathsConfig(
            data_dir=str(test_data_dir),
            warm_mmap_dir=str(test_data_dir / "warm"),
            cold_archive_dir=str(test_data_dir / "cold")
        ),
        # ltp_threshold_min=0.0 prevents newly created memories (LTP=0.5)
        # from being eagerly demoted out of the hot tier.
        tiers_hot=TierConfig(max_memories=1000, ltp_threshold_min=0.0)
    )

    tier_manager = TierManager(config=config, qdrant_store=None)
    engine = HAIMEngine(
        persist_path=str(test_data_dir / "memory.jsonl"),
        config=config,
        tier_manager=tier_manager
    )

    try:
        await engine.initialize()

        # Store two memories, one per agent namespace.
        await engine.store("Secret logic for agent 1", metadata={"agent_id": "agent_alpha"})
        await engine.store("Public logic for agent 2", metadata={"agent_id": "agent_beta"})

        # Unfiltered (global) search must see both memories just stored.
        res_global = await engine.query("logic", top_k=5)
        assert len(res_global) >= 2, f"Global search should return at least 2 memories, got {len(res_global)}"

        # Filtered search must surface only agent_alpha's memories.
        res_isolated = await engine.query("logic", top_k=5, metadata_filter={"agent_id": "agent_alpha"})

        assert len(res_isolated) > 0, "Should find at least 1 memory for agent_alpha"
        for nid, score in res_isolated:
            node = await engine.get_memory(nid)
            assert node.metadata.get("agent_id") == "agent_alpha", "Found leaked memory from another agent namespace!"

    finally:
        await engine.close()
        # Clean up test dir
        if test_data_dir.exists():
            shutil.rmtree(test_data_dir)
134
+
135
# Allow running the suite directly: python mnemocore_verify.py
if __name__ == "__main__":
    pytest.main(["-v", __file__])
src/mnemocore/agent_interface.py ADDED
@@ -0,0 +1,145 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Cognitive Memory Client
3
+ =======================
4
+ The high-level facade for autonomous agents to interact with the MnemoCore AGI Memory Substrate.
5
+ Provides easy methods for observation, episodic sequence tracking, and working memory recall.
6
+ """
7
+
8
+ from typing import List, Optional, Any, Tuple
9
+ import logging
10
+
11
+ from .core.engine import HAIMEngine
12
+ from .core.working_memory import WorkingMemoryService, WorkingMemoryItem
13
+ from .core.episodic_store import EpisodicStoreService
14
+ from .core.semantic_store import SemanticStoreService
15
+ from .core.procedural_store import ProceduralStoreService
16
+ from .core.meta_memory import MetaMemoryService, SelfImprovementProposal
17
+ from .core.memory_model import Procedure
18
+
19
+ logger = logging.getLogger(__name__)
20
+
21
class CognitiveMemoryClient:
    """
    Plug-and-play cognitive memory facade for agent frameworks (LangGraph, AutoGen, OpenClaw, etc.).

    Thin delegation layer: every method forwards to one of the injected memory
    services (working memory, episodic, semantic, procedural, meta) or to the
    backing HAIMEngine. The class holds no state beyond those references.
    """
    def __init__(
        self,
        engine: HAIMEngine,
        wm: WorkingMemoryService,
        episodic: EpisodicStoreService,
        semantic: SemanticStoreService,
        procedural: ProceduralStoreService,
        meta: MetaMemoryService,
    ):
        # All collaborators are injected; this class never constructs them.
        self.engine = engine
        self.wm = wm
        self.episodic = episodic
        # NOTE(review): `semantic` is stored but never referenced by any method
        # below — recall() goes through the engine instead. Confirm intent.
        self.semantic = semantic
        self.procedural = procedural
        self.meta = meta

    # --- Observation & WM ---

    def observe(self, agent_id: str, content: str, kind: str = "observation", importance: float = 0.5, tags: Optional[List[str]] = None, **meta) -> str:
        """
        Push a new observation or thought directly into the agent's short-term Working Memory.

        Returns the generated working-memory item id ("wm_" + 8 hex chars).

        NOTE(review): `**meta` is accepted but silently discarded — it is not
        forwarded to WorkingMemoryItem. Confirm whether it should be stored.
        """
        import uuid
        from datetime import datetime
        item_id = f"wm_{uuid.uuid4().hex[:8]}"

        item = WorkingMemoryItem(
            id=item_id,
            agent_id=agent_id,
            created_at=datetime.utcnow(),  # naive UTC timestamp — TODO confirm tz convention
            ttl_seconds=3600,  # 1 hour default
            content=content,
            kind=kind,  # type: ignore
            importance=importance,
            tags=tags or [],
            hdv=None  # Could encode via engine in future
        )
        self.wm.push_item(agent_id, item)
        logger.debug(f"Agent {agent_id} observed: {content[:30]}...")
        return item_id

    def get_working_context(self, agent_id: str, limit: int = 16) -> List[WorkingMemoryItem]:
        """
        Read the active, un-pruned context out of the agent's working memory buffer.

        Returns the most recent `limit` items (empty list when the agent has
        no working-memory state yet).
        """
        state = self.wm.get_state(agent_id)
        if not state:
            return []

        return state.items[-limit:]

    # --- Episodic ---

    def start_episode(self, agent_id: str, goal: str, context: Optional[str] = None) -> str:
        """Begin a new temporally-linked event sequence; returns the episode id."""
        return self.episodic.start_episode(agent_id, goal=goal, context=context)

    def append_event(self, episode_id: str, kind: str, content: str, **meta) -> None:
        """Log an action or outcome to an ongoing episode.

        Keyword arguments are collected into a dict and passed positionally to
        the episodic store's append_event.
        """
        self.episodic.append_event(episode_id, kind, content, meta)

    def end_episode(self, episode_id: str, outcome: str, reward: Optional[float] = None) -> None:
        """Seal an episode, logging its final success or failure state."""
        self.episodic.end_episode(episode_id, outcome, reward)

    # --- Semantic / Retrieval ---

    async def recall(
        self,
        agent_id: str,
        query: str,
        context: Optional[str] = None,
        top_k: int = 8,
        modes: Tuple[str, ...] = ("episodic", "semantic")
    ) -> List[dict]:
        """
        A unified query interface that checks Working Memory, Episodic History, and the Semantic Vector Store.
        Currently delegates heavily to the backing HAIMEngine, but can be augmented to return semantic concepts.

        Each result dict has keys: "source", "content", "score". Results from
        both modes are merged, sorted by score descending, and truncated to
        `top_k`.
        """
        results = []

        # 1. Broad retrieval via existing HAIM engine (SM / general memories)
        if "semantic" in modes:
            engine_results = await self.engine.query(query, top_k=top_k)
            for mem_id, score in engine_results:
                node = await self.engine.tier_manager.get_memory(mem_id)  # Fix: tier_manager.get_memory is async
                if node:
                    results.append({"source": "semantic/engine", "content": node.content, "score": score})

        # 2. Local episodic retrieval
        if "episodic" in modes:
            recent_eps = self.episodic.get_recent(agent_id, limit=top_k, context=context)
            for ep in recent_eps:
                summary = f"Episode(goal={ep.goal}, outcome={ep.outcome}, events={len(ep.events)})"
                results.append({"source": "episodic", "content": summary, "score": ep.reliability})

        # Sort and trim mixed results
        results.sort(key=lambda x: x.get("score", 0.0), reverse=True)
        return results[:top_k]

    # --- Procedural ---

    def suggest_procedures(self, agent_id: str, query: str, top_k: int = 5) -> List[Procedure]:
        """Fetch executable tool-patterns based on the agent's intent."""
        return self.procedural.find_applicable_procedures(query, agent_id=agent_id, top_k=top_k)

    def record_procedure_outcome(self, proc_id: str, success: bool) -> None:
        """Report on the utility of a chosen procedure."""
        self.procedural.record_procedure_outcome(proc_id, success)

    # --- Meta / Self-awareness ---

    def get_knowledge_gaps(self, agent_id: str, lookback_hours: int = 24) -> List[dict]:
        """Return currently open knowledge gaps identified by the Pulse loop.

        NOTE(review): stub — both parameters are currently ignored and an
        empty list is always returned. Would interact with gap_detector.
        """
        # Stubbed: Would interact with gap_detector
        return []

    def get_self_improvement_proposals(self) -> List[SelfImprovementProposal]:
        """Retrieve system-generated proposals to improve operation or prompt alignment."""
        return self.meta.list_proposals()
+
src/mnemocore/api/main.py CHANGED
@@ -156,9 +156,22 @@ async def lifespan(app: FastAPI):
156
  persist_path="./data/memory.jsonl",
157
  config=config,
158
  tier_manager=tier_manager,
 
 
 
159
  )
160
  await engine.initialize()
161
  app.state.engine = engine
 
 
 
 
 
 
 
 
 
 
162
 
163
  yield
164
 
@@ -377,7 +390,8 @@ async def query_memory(
377
  API_REQUEST_COUNT.labels(method="POST", endpoint="/query", status="200").inc()
378
 
379
  # CPU heavy vector search (offloaded inside engine)
380
- results = await engine.query(req.query, top_k=req.top_k)
 
381
 
382
  formatted = []
383
  for mem_id, score in results:
@@ -476,6 +490,52 @@ async def delete_memory(
476
 
477
  return {"ok": True, "deleted": memory_id}
478
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
479
  # --- Conceptual Endpoints ---
480
 
481
  @app.post(
@@ -627,6 +687,310 @@ async def rlm_query(
627
  }
628
 
629
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
630
  if __name__ == "__main__":
631
  import uvicorn
632
  uvicorn.run(app, host="0.0.0.0", port=8100)
 
156
  persist_path="./data/memory.jsonl",
157
  config=config,
158
  tier_manager=tier_manager,
159
+ working_memory=container.working_memory,
160
+ episodic_store=container.episodic_store,
161
+ semantic_store=container.semantic_store,
162
  )
163
  await engine.initialize()
164
  app.state.engine = engine
165
+ # Also expose the cognitive client to app state for agentic frameworks
166
+ from mnemocore.agent_interface import CognitiveMemoryClient
167
+ app.state.cognitive_client = CognitiveMemoryClient(
168
+ engine=engine,
169
+ wm=container.working_memory,
170
+ episodic=container.episodic_store,
171
+ semantic=container.semantic_store,
172
+ procedural=container.procedural_store,
173
+ meta=container.meta_memory,
174
+ )
175
 
176
  yield
177
 
 
390
  API_REQUEST_COUNT.labels(method="POST", endpoint="/query", status="200").inc()
391
 
392
  # CPU heavy vector search (offloaded inside engine)
393
+ metadata_filter = {"agent_id": req.agent_id} if req.agent_id else None
394
+ results = await engine.query(req.query, top_k=req.top_k, metadata_filter=metadata_filter)
395
 
396
  formatted = []
397
  for mem_id, score in results:
 
490
 
491
  return {"ok": True, "deleted": memory_id}
492
 
493
+ # --- Phase 5: Cognitive Client Endpoints ---
494
+
495
+ class ObserveRequest(BaseModel):
496
+ agent_id: str
497
+ content: str
498
+ kind: str = "observation"
499
+ importance: float = 0.5
500
+ tags: Optional[List[str]] = None
501
+
502
+ @app.post("/wm/observe", dependencies=[Depends(get_api_key)])
503
+ async def observe_context(req: ObserveRequest, request: Request):
504
+ """Push an observation explicitly into Working Memory."""
505
+ client = request.app.state.cognitive_client
506
+ if not client:
507
+ raise HTTPException(status_code=503, detail="Cognitive Client unavailable")
508
+ item_id = client.observe(
509
+ agent_id=req.agent_id,
510
+ content=req.content,
511
+ kind=req.kind,
512
+ importance=req.importance,
513
+ tags=req.tags
514
+ )
515
+ return {"ok": True, "item_id": item_id}
516
+
517
+ @app.get("/wm/context/{agent_id}", dependencies=[Depends(get_api_key)])
518
+ async def get_working_context(agent_id: str, limit: int = 16, request: Request = None):
519
+ """Read active Working Memory context."""
520
+ client = request.app.state.cognitive_client
521
+ items = client.get_working_context(agent_id, limit=limit)
522
+ return {"ok": True, "items": [
523
+ {"id": i.id, "content": i.content, "kind": i.kind, "importance": i.importance}
524
+ for i in items
525
+ ]}
526
+
527
+ class EpisodeStartRequest(BaseModel):
528
+ agent_id: str
529
+ goal: str
530
+ context: Optional[str] = None
531
+
532
+ @app.post("/episodes/start", dependencies=[Depends(get_api_key)])
533
+ async def start_episode(req: EpisodeStartRequest, request: Request):
534
+ """Start a new episode chain."""
535
+ client = request.app.state.cognitive_client
536
+ ep_id = client.start_episode(req.agent_id, goal=req.goal, context=req.context)
537
+ return {"ok": True, "episode_id": ep_id}
538
+
539
  # --- Conceptual Endpoints ---
540
 
541
  @app.post(
 
687
  }
688
 
689
 
690
+ # ─────────────────────────────────────────────────────────────────────────────
691
+ # Phase 5.0 — Agent 1: Trust & Provenance Endpoints
692
+ # ─────────────────────────────────────────────────────────────────────────────
693
+
694
@app.get(
    "/memory/{memory_id}/lineage",
    dependencies=[Depends(get_api_key)],
    tags=["Phase 5.0 — Trust"],
    summary="Get full provenance lineage for a memory",
)
async def get_memory_lineage(
    memory_id: str,
    engine: HAIMEngine = Depends(get_engine),
):
    """
    Return the complete provenance lineage of a memory: its origin (who
    created it, how, when) plus every transformation event recorded on it
    (consolidated, verified, contradicted, archived, …).
    """
    node = await engine.get_memory(memory_id)
    if not node:
        raise MemoryNotFoundError(memory_id)

    record = getattr(node, "provenance", None)
    if record is not None:
        # Provenance exists — serialize and return it.
        return {
            "ok": True,
            "memory_id": memory_id,
            "provenance": record.to_dict(),
        }

    # Memory exists but carries no provenance record.
    return {
        "ok": True,
        "memory_id": memory_id,
        "provenance": None,
        "message": "No provenance record attached to this memory.",
    }
727
+
728
+
729
@app.get(
    "/memory/{memory_id}/confidence",
    dependencies=[Depends(get_api_key)],
    tags=["Phase 5.0 — Trust"],
    summary="Get confidence envelope for a memory",
)
async def get_memory_confidence(
    memory_id: str,
    engine: HAIMEngine = Depends(get_engine),
):
    """
    Return a structured confidence envelope for a memory, combining:
    - Bayesian reliability (BayesianLTP posterior mean)
    - access_count (evidence strength)
    - staleness (days since last verification)
    - source_type trust weight
    - contradiction flag

    Level: high | medium | low | contradicted | stale
    """
    from mnemocore.core.confidence import build_confidence_envelope

    node = await engine.get_memory(memory_id)
    if not node:
        raise MemoryNotFoundError(memory_id)

    # Provenance is optional; the envelope builder tolerates None.
    envelope = build_confidence_envelope(node, getattr(node, "provenance", None))
    return {
        "ok": True,
        "memory_id": memory_id,
        "confidence": envelope,
    }
763
+
764
+
765
+ # ─────────────────────────────────────────────────────────────────────────────
766
+ # Phase 5.0 — Agent 3 stub: Proactive Recall
767
+ # (Full implementation added by Agent 3 workstream)
768
+ # ─────────────────────────────────────────────────────────────────────────────
769
+
770
@app.get(
    "/proactive",
    dependencies=[Depends(get_api_key)],
    tags=["Phase 5.0 — Autonomy"],
    summary="Retrieve contextually relevant memories without explicit query",
)
async def get_proactive_memories(
    agent_id: Optional[str] = None,
    limit: int = 10,
    engine: HAIMEngine = Depends(get_engine),
):
    """
    Proactive recall stub (Phase 5.0 / Agent 3).
    Returns the most recently active high-LTP memories as a stand-in
    until the full ProactiveRecallDaemon is implemented.

    NOTE: `agent_id` is accepted but not yet used for filtering in this stub.
    """
    from mnemocore.core.confidence import build_confidence_envelope

    # Snapshot of HOT-tier nodes, if the engine exposes a tier manager.
    if hasattr(engine, "tier_manager"):
        nodes = await engine.tier_manager.get_hot_snapshot()
    else:
        nodes = []

    # Strongest memories first, capped at `limit`.
    top_nodes = sorted(nodes, key=lambda n: n.ltp_strength, reverse=True)[:limit]

    results = [
        {
            "id": n.id,
            "content": n.content,
            "ltp_strength": round(n.ltp_strength, 4),
            "confidence": build_confidence_envelope(n, getattr(n, "provenance", None)),
            "tier": getattr(n, "tier", "hot"),
        }
        for n in top_nodes
    ]

    return {"ok": True, "proactive_results": results, "count": len(results)}
802
+
803
+
804
+ # ─────────────────────────────────────────────────────────────────────────────
805
+ # Phase 5.0 — Agent 2: Memory Lifecycle Endpoints
806
+ # ─────────────────────────────────────────────────────────────────────────────
807
+
808
@app.get(
    "/contradictions",
    dependencies=[Depends(get_api_key)],
    tags=["Phase 5.0 — Lifecycle"],
    summary="List active contradiction groups requiring resolution",
)
async def list_contradictions(
    unresolved_only: bool = True,
):
    """
    Return all detected contradiction groups from the ContradictionRegistry.
    By default only unresolved contradictions are included.
    """
    from mnemocore.core.contradiction import get_contradiction_detector

    registry = get_contradiction_detector().registry
    found = registry.list_all(unresolved_only=unresolved_only)
    return {
        "ok": True,
        "count": len(found),
        "contradictions": [record.to_dict() for record in found],
    }
829
+
830
+
831
class ResolveContradictionRequest(BaseModel):
    """Payload for POST /contradictions/{group_id}/resolve."""

    note: Optional[str] = None  # optional free-text resolution note stored with the group
833
+
834
+
835
@app.post(
    "/contradictions/{group_id}/resolve",
    dependencies=[Depends(get_api_key)],
    tags=["Phase 5.0 — Lifecycle"],
    summary="Mark a contradiction group as resolved",
)
async def resolve_contradiction(group_id: str, req: ResolveContradictionRequest):
    """Manually resolve a detected contradiction; 404 if the group is unknown."""
    from mnemocore.core.contradiction import get_contradiction_detector

    registry = get_contradiction_detector().registry
    if not registry.resolve(group_id, note=req.note):
        raise HTTPException(status_code=404, detail=f"Contradiction group {group_id!r} not found.")
    return {"ok": True, "resolved_group_id": group_id}
849
+
850
+
851
+ # ─────────────────────────────────────────────────────────────────────────────
852
+ # Phase 5.0 — Agent 3: Autonomous Cognition Endpoints
853
+ # ─────────────────────────────────────────────────────────────────────────────
854
+
855
@app.get(
    "/memory/{memory_id}/emotional-tag",
    dependencies=[Depends(get_api_key)],
    tags=["Phase 5.0 — Autonomy"],
    summary="Get emotional (valence/arousal) tag for a memory",
)
async def get_emotional_tag_ep(
    memory_id: str,
    engine: HAIMEngine = Depends(get_engine),
):
    """Return the valence/arousal emotional metadata for a memory."""
    from mnemocore.core.emotional_tag import get_emotional_tag

    node = await engine.get_memory(memory_id)
    if not node:
        raise MemoryNotFoundError(memory_id)

    tag = get_emotional_tag(node)
    tag_payload = {
        "valence": tag.valence,
        "arousal": tag.arousal,
        "salience": round(tag.salience(), 4),
    }
    return {"ok": True, "memory_id": memory_id, "emotional_tag": tag_payload}
880
+
881
+
882
class EmotionalTagPatchRequest(BaseModel):
    """Payload for PATCH /memory/{memory_id}/emotional-tag.

    NOTE(review): no range validation is applied here — confirm the valid
    valence/arousal ranges against EmotionalTag and add pydantic bounds.
    """

    valence: float  # emotional polarity of the memory
    arousal: float  # emotional intensity of the memory
885
+
886
+
887
@app.patch(
    "/memory/{memory_id}/emotional-tag",
    dependencies=[Depends(get_api_key)],
    tags=["Phase 5.0 — Autonomy"],
    summary="Attach or update emotional tag on a memory",
)
async def patch_emotional_tag(
    memory_id: str,
    req: EmotionalTagPatchRequest,
    engine: HAIMEngine = Depends(get_engine),
):
    """Attach (or overwrite) the valence/arousal tag stored on a memory node."""
    from mnemocore.core.emotional_tag import EmotionalTag, attach_emotional_tag

    node = await engine.get_memory(memory_id)
    if not node:
        raise MemoryNotFoundError(memory_id)

    new_tag = EmotionalTag(valence=req.valence, arousal=req.arousal)
    attach_emotional_tag(node, new_tag)
    return {"ok": True, "memory_id": memory_id, "emotional_tag": new_tag.to_metadata_dict()}
905
+
906
+
907
+ # ─────────────────────────────────────────────────────────────────────────────
908
+ # Phase 5.0 — Agent 4: Prediction Endpoints
909
+ # ─────────────────────────────────────────────────────────────────────────────
910
+
911
# Process-wide lazily constructed PredictionStore singleton.
_prediction_store_instance = None


def _get_prediction_store(engine: HAIMEngine = Depends(get_engine)):
    """FastAPI dependency returning the shared PredictionStore singleton.

    NOTE(review): the ``Depends(get_engine)`` default is only resolved when
    this function is used via FastAPI dependency injection; calling it
    directly would pass the raw ``Depends`` marker object as ``engine``.
    The prediction endpoints below currently bypass this helper and build
    ``PredictionStore()`` without an engine — confirm which wiring is intended.
    NOTE(review): the lazy init is not lock-guarded; two concurrent first
    requests could race and construct two stores.
    """
    from mnemocore.core.prediction_store import PredictionStore
    global _prediction_store_instance
    if _prediction_store_instance is None:
        _prediction_store_instance = PredictionStore(engine=engine)
    return _prediction_store_instance
920
+
921
+
922
class CreatePredictionRequest(BaseModel):
    """Payload for POST /predictions — a new forward-looking prediction."""

    content: str  # the prediction statement itself
    confidence: float = 0.5  # prior confidence in the prediction
    deadline_days: Optional[float] = None  # optional horizon after which the prediction lapses
    related_memory_ids: Optional[List[str]] = None  # memories the prediction is grounded in
    tags: Optional[List[str]] = None  # optional free-form labels
928
+
929
+
930
class VerifyPredictionRequest(BaseModel):
    """Payload for POST /predictions/{pred_id}/verify."""

    success: bool  # True = prediction came true, False = falsified
    notes: Optional[str] = None  # optional free-text verification notes
933
+
934
+
935
@app.post(
    "/predictions",
    dependencies=[Depends(get_api_key)],
    tags=["Phase 5.0 — Prediction"],
    summary="Store a new forward-looking prediction",
)
async def create_prediction(
    req: CreatePredictionRequest,
    store=Depends(_get_prediction_store),
):
    """
    Store a new forward-looking prediction and return its serialized form.

    Fix: resolve the store through the `_get_prediction_store` dependency
    instead of duplicating the lazy-init with `PredictionStore()` (no engine),
    which left the shared singleton engine-less depending on which endpoint
    was hit first.
    """
    pred_id = store.create(
        content=req.content,
        confidence=req.confidence,
        deadline_days=req.deadline_days,
        related_memory_ids=req.related_memory_ids,
        tags=req.tags,
    )
    pred = store.get(pred_id)
    return {"ok": True, "prediction": pred.to_dict()}
955
+
956
+
957
@app.get(
    "/predictions",
    dependencies=[Depends(get_api_key)],
    tags=["Phase 5.0 — Prediction"],
    summary="List all predictions",
)
async def list_predictions(
    status: Optional[str] = None,
    store=Depends(_get_prediction_store),
):
    """
    List all stored predictions, optionally filtered by status.

    Fix: resolve the store through the `_get_prediction_store` dependency
    instead of duplicating the engine-less lazy init (see create_prediction).
    """
    return {
        "ok": True,
        "predictions": [p.to_dict() for p in store.list_all(status=status)],
    }
975
+
976
+
977
@app.post(
    "/predictions/{pred_id}/verify",
    dependencies=[Depends(get_api_key)],
    tags=["Phase 5.0 — Prediction"],
    summary="Verify or falsify a prediction",
)
async def verify_prediction(
    pred_id: str,
    req: VerifyPredictionRequest,
    store=Depends(_get_prediction_store),
):
    """
    Verify or falsify a stored prediction; 404 when the id is unknown.

    Fix: resolve the store through the `_get_prediction_store` dependency
    instead of duplicating the engine-less lazy init (see create_prediction).
    """
    pred = await store.verify(pred_id, success=req.success, notes=req.notes)
    if pred is None:
        raise HTTPException(status_code=404, detail=f"Prediction {pred_id!r} not found.")
    return {"ok": True, "prediction": pred.to_dict()}
992
+
993
+
994
if __name__ == "__main__":
    # Local development entry point; production deployments should run the
    # app through an external ASGI server configuration instead.
    import uvicorn
    uvicorn.run(app, host="0.0.0.0", port=8100)
src/mnemocore/core/agent_profile.py ADDED
@@ -0,0 +1,65 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Agent Profiles
3
+ ==============
4
+ Persistent state encompassing quirks, long-term alignment details, and tooling preferences per individual actor.
5
+ Allows multiple independent agents to interact cleanly without memory namespace collisions.
6
+ """
7
+
8
+ from typing import Dict, List, Optional, Any
9
+ from dataclasses import dataclass, field
10
+ from datetime import datetime
11
+ import threading
12
+ import logging
13
+
14
logger = logging.getLogger(__name__)


@dataclass
class AgentProfile:
    """Persistent identity record for a single agent.

    Captures quirks, long-term alignment details, and tooling preferences so
    multiple independent agents can interact without namespace collisions.
    """

    id: str
    name: str
    description: str
    created_at: datetime
    last_active: datetime
    # Hard bounds over behavior: e.g. "Do not delete files without explicit prompt"
    core_directives: List[str] = field(default_factory=list)
    # Flexible learned preferences, merged incrementally via update_preferences().
    preferences: Dict[str, Any] = field(default_factory=dict)
    # Agent-specific trust metric, clamped to [0.0, 1.0] by adjust_reliability().
    reliability_score: float = 1.0


class AgentProfileService:
    """Thread-safe, in-process registry of AgentProfile records.

    Improvements over the previous revision:
    - Consistent ``Dict[str, Any]`` typing (was mixed ``dict``/``Dict``).
    - One ``datetime.utcnow()`` call per operation instead of up to three,
      so ``created_at`` and ``last_active`` agree on first creation.
    - Explicit return-type annotations.
    """

    def __init__(self) -> None:
        # Local state dict; NOTE(review): should back out to SQLite or Redis
        # for persistence across restarts.
        self._profiles: Dict[str, AgentProfile] = {}
        self._lock = threading.RLock()

    def get_or_create_profile(self, agent_id: str, name: str = "Unknown Agent") -> AgentProfile:
        """Retrieve the identity profile for an agent, constructing it if uninitialized.

        Always refreshes ``last_active``. The ``name`` argument only applies
        on first creation; an existing profile keeps its stored name.
        """
        with self._lock:
            # Naive-UTC timestamp kept for compatibility with existing records.
            now = datetime.utcnow()
            profile = self._profiles.get(agent_id)
            if profile is None:
                profile = AgentProfile(
                    id=agent_id,
                    name=name,
                    description=f"Auto-generated profile for {agent_id}",
                    created_at=now,
                    last_active=now,
                )
                self._profiles[agent_id] = profile

            profile.last_active = now
            return profile

    def update_preferences(self, agent_id: str, new_preferences: Dict[str, Any]) -> None:
        """Merge learned trait or task preferences into an agent's persistent identity."""
        with self._lock:
            # RLock allows the nested acquisition inside get_or_create_profile.
            profile = self.get_or_create_profile(agent_id)
            profile.preferences.update(new_preferences)
            logger.debug(f"Updated preferences for agent {agent_id}.")

    def adjust_reliability(self, agent_id: str, points: float) -> None:
        """Alter the agent's trust rating by ``points``, clamped to [0.0, 1.0]."""
        with self._lock:
            profile = self.get_or_create_profile(agent_id)
            profile.reliability_score = max(0.0, min(1.0, profile.reliability_score + points))
src/mnemocore/core/anticipatory.py ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import List, Optional
2
+ from loguru import logger
3
+
4
+ from .config import AnticipatoryConfig
5
+ from .synapse_index import SynapseIndex
6
+ from .tier_manager import TierManager
7
+ from .topic_tracker import TopicTracker
8
+
9
class AnticipatoryEngine:
    """
    Phase 13.2: Anticipatory Memory.

    Predicts which memories the user is likely to request next based on the
    current topic trajectory and graph structure, and pre-loads them into the
    HOT tier via ``TierManager.anticipate``.
    """
    def __init__(
        self,
        config: AnticipatoryConfig,
        synapse_index: SynapseIndex,
        tier_manager: TierManager,
        topic_tracker: TopicTracker
    ):
        self.config = config
        self.synapse_index = synapse_index
        self.tier_manager = tier_manager
        # NOTE(review): topic_tracker is stored but not yet used by
        # predict_and_preload — presumably reserved for trajectory weighting.
        self.topic_tracker = topic_tracker

    async def predict_and_preload(self, current_node_id: str, top_n: int = 5) -> List[str]:
        """
        Predict surrounding context from the current node and pre-load it.

        Uses the multi-hop network in the SynapseIndex to find likely next
        nodes.

        Args:
            current_node_id: Node the user is currently focused on.
            top_n: Maximum number of predicted neighbors to pre-load.
                Generalized from the previously hard-coded limit of 5;
                the default preserves the old behavior.

        Returns:
            The node ids scheduled for pre-loading (empty when disabled or
            no neighbors are found).
        """
        if not self.config.enabled:
            return []

        # Get neighbors up to predictive depth.
        # A relatively low depth avoids flooding the HOT tier.
        neighbors = self.synapse_index.get_multi_hop_neighbors(
            current_node_id,
            depth=self.config.predictive_depth
        )

        # Keep the top-N highest path weights (computed by the multi-hop
        # traversal), excluding the current node itself.
        ranked = sorted(neighbors.items(), key=lambda x: x[1], reverse=True)[:top_n]
        target_ids = [nid for nid, _weight in ranked if nid != current_node_id]

        if target_ids:
            logger.debug(f"Anticipatory engine pre-loading {len(target_ids)} predicted nodes.")
            await self.tier_manager.anticipate(target_ids)

        return target_ids
src/mnemocore/core/binary_hdv.py CHANGED
@@ -22,6 +22,21 @@ import hashlib
22
  from typing import List, Optional, Tuple
23
 
24
  import numpy as np
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
25
 
26
 
27
  class BinaryHDV:
@@ -138,12 +153,13 @@ class BinaryHDV:
138
  """
139
  Hamming distance: count of differing bits.
140
 
141
- Uses np.unpackbits + sum for correctness.
142
  Range: [0, dimension].
143
  """
144
  assert self.dimension == other.dimension
145
  xor_result = np.bitwise_xor(self.data, other.data)
146
- return int(np.unpackbits(xor_result).sum())
 
147
 
148
  def normalized_distance(self, other: "BinaryHDV") -> float:
149
  """Hamming distance normalized to [0.0, 1.0]."""
@@ -210,7 +226,8 @@ class BinaryHDV:
210
  return cls(data=data, dimension=dimension)
211
 
212
  def __repr__(self) -> str:
213
- popcount = int(np.unpackbits(self.data).sum())
 
214
  return f"BinaryHDV(dim={self.dimension}, popcount={popcount}/{self.dimension})"
215
 
216
  def __eq__(self, other: object) -> bool:
@@ -383,26 +400,37 @@ class TextEncoder:
383
  """
384
  Encode a text string to a binary HDV.
385
 
386
- Tokenization: simple whitespace split + lowercasing.
387
  Each token is bound with its position via XOR(token, permute(position_marker, i)).
388
  All position-bound tokens are bundled via majority vote.
389
  """
390
- tokens = text.lower().split()
 
 
391
  if not tokens:
392
  return BinaryHDV.random(self.dimension)
393
 
394
  if len(tokens) == 1:
395
  return self.get_token_vector(tokens[0])
396
 
397
- # Build position-bound token vectors
398
- bound_vectors = []
399
- for i, token in enumerate(tokens):
400
- token_hdv = self.get_token_vector(token)
401
- # Permute by position index for order encoding
402
- positioned = token_hdv.permute(shift=i)
403
- bound_vectors.append(positioned)
 
 
 
404
 
405
- return majority_bundle(bound_vectors)
 
 
 
 
 
 
406
 
407
  def encode_with_context(
408
  self, text: str, context_hdv: BinaryHDV
@@ -415,21 +443,3 @@ class TextEncoder:
415
  """
416
  content_hdv = self.encode(text)
417
  return content_hdv.xor_bind(context_hdv)
418
-
419
-
420
- # ======================================================================
421
- # Internal helpers
422
- # ======================================================================
423
-
424
- # Cached lookup table for popcount (bits set per byte value 0-255)
425
- _POPCOUNT_TABLE: Optional[np.ndarray] = None
426
-
427
-
428
- def _build_popcount_table() -> np.ndarray:
429
- """Build or return cached popcount lookup table for bytes (0-255)."""
430
- global _POPCOUNT_TABLE
431
- if _POPCOUNT_TABLE is None:
432
- _POPCOUNT_TABLE = np.array(
433
- [bin(i).count("1") for i in range(256)], dtype=np.int32
434
- )
435
- return _POPCOUNT_TABLE
 
22
  from typing import List, Optional, Tuple
23
 
24
  import numpy as np
25
+ import re
26
+
27
+
28
+ # Cached lookup table for popcount (bits set per byte value 0-255)
29
+ _POPCOUNT_TABLE: Optional[np.ndarray] = None
30
+
31
+
32
+ def _build_popcount_table() -> np.ndarray:
33
+ """Build or return cached popcount lookup table for bytes (0-255)."""
34
+ global _POPCOUNT_TABLE
35
+ if _POPCOUNT_TABLE is None:
36
+ _POPCOUNT_TABLE = np.array(
37
+ [bin(i).count("1") for i in range(256)], dtype=np.int32
38
+ )
39
+ return _POPCOUNT_TABLE
40
 
41
 
42
  class BinaryHDV:
 
153
  """
154
  Hamming distance: count of differing bits.
155
 
156
+ Uses lookup table for speed (replacing unpackbits).
157
  Range: [0, dimension].
158
  """
159
  assert self.dimension == other.dimension
160
  xor_result = np.bitwise_xor(self.data, other.data)
161
+ # Optimized: use precomputed popcount table instead of unpacking bits
162
+ return int(_build_popcount_table()[xor_result].sum())
163
 
164
  def normalized_distance(self, other: "BinaryHDV") -> float:
165
  """Hamming distance normalized to [0.0, 1.0]."""
 
226
  return cls(data=data, dimension=dimension)
227
 
228
    def __repr__(self) -> str:
        """Debug representation showing dimension and number of set bits."""
        # Optimized: use precomputed popcount table instead of np.unpackbits
        popcount = int(_build_popcount_table()[self.data].sum())
        return f"BinaryHDV(dim={self.dimension}, popcount={popcount}/{self.dimension})"
232
 
233
  def __eq__(self, other: object) -> bool:
 
400
  """
401
  Encode a text string to a binary HDV.
402
 
403
+ Tokenization: simple whitespace split after normalization.
404
  Each token is bound with its position via XOR(token, permute(position_marker, i)).
405
  All position-bound tokens are bundled via majority vote.
406
  """
407
+ # BUG-02 Fix: strip punctuation and normalize spaces
408
+ normalized = re.sub(r'[^\w\s]', '', text).lower()
409
+ tokens = normalized.split()
410
  if not tokens:
411
  return BinaryHDV.random(self.dimension)
412
 
413
  if len(tokens) == 1:
414
  return self.get_token_vector(tokens[0])
415
 
416
+ # Build position-bound token vectors (#27)
417
+ # Optimized: Batch process data instead of multiple object instantiations
418
+ token_hdvs = [self.get_token_vector(t) for t in tokens]
419
+ packed_data = np.stack([v.data for v in token_hdvs], axis=0)
420
+ all_bits = np.unpackbits(packed_data, axis=1)
421
+
422
+ # Apply position-based permutations (roll)
423
+ for i in range(len(tokens)):
424
+ if i > 0:
425
+ all_bits[i] = np.roll(all_bits[i], i)
426
 
427
+ # Vectorized majority vote (equivalent to majority_bundle)
428
+ sums = all_bits.sum(axis=0)
429
+ threshold = len(tokens) / 2.0
430
+ result_bits = np.zeros(self.dimension, dtype=np.uint8)
431
+ result_bits[sums > threshold] = 1
432
+
433
+ return BinaryHDV(data=np.packbits(result_bits), dimension=self.dimension)
434
 
435
  def encode_with_context(
436
  self, text: str, context_hdv: BinaryHDV
 
443
  """
444
  content_hdv = self.encode(text)
445
  return content_hdv.xor_bind(context_hdv)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
src/mnemocore/core/confidence.py ADDED
@@ -0,0 +1,196 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Confidence Calibration Module (Phase 5.0)
3
+ ==========================================
4
+ Generates structured confidence envelopes for retrieved memories,
5
+ combining all available trust signals into a single queryable object.
6
+
7
+ Signals used:
8
+ - BayesianLTP reliability (mean of Beta posterior)
9
+ - access_count (low count → less evidence)
10
+ - staleness (days since last verification)
11
+ - source type (external ≤ user_correction vs observation)
12
+ - contradiction flag (from ProvenanceRecord)
13
+
14
+ Output: a ConfidenceEnvelope dict appended to every query response,
15
+ enabling consuming agents to make trust-aware decisions.
16
+
17
+ Public API:
18
+ env = ConfidenceEnvelopeGenerator.build(node, provenance)
19
+ level = env["level"] # "high" | "medium" | "low" | "contradicted" | "stale"
20
+ """
21
+
22
+ from __future__ import annotations
23
+
24
+ from datetime import datetime, timezone
25
+ from typing import TYPE_CHECKING, Any, Dict, Optional
26
+
27
+ if TYPE_CHECKING:
28
+ from .node import MemoryNode
29
+ from .provenance import ProvenanceRecord
30
+
31
+
32
# ------------------------------------------------------------------ #
# Confidence levels (ordered by trust)                               #
# ------------------------------------------------------------------ #

LEVEL_HIGH = "high"
LEVEL_MEDIUM = "medium"
LEVEL_LOW = "low"
LEVEL_CONTRADICTED = "contradicted"
LEVEL_STALE = "stale"

# Thresholds
RELIABILITY_HIGH_THRESHOLD = 0.80
RELIABILITY_MEDIUM_THRESHOLD = 0.50
ACCESS_COUNT_MIN_EVIDENCE = 2       # Less than this → low confidence
ACCESS_COUNT_HIGH_EVIDENCE = 5      # At least this → supports high confidence
STALENESS_STALE_DAYS = 30           # Days without verification → stale


# ------------------------------------------------------------------ #
# Source-type trust weights                                          #
# ------------------------------------------------------------------ #

SOURCE_TRUST: Dict[str, float] = {
    "observation": 1.0,
    "inference": 0.8,
    "external_sync": 0.75,
    "dream": 0.6,
    "consolidation": 0.85,
    "prediction": 0.5,
    "user_correction": 1.0,
    "unknown": 0.5,
}


# ------------------------------------------------------------------ #
# Confidence Envelope Generator                                      #
# ------------------------------------------------------------------ #

class ConfidenceEnvelopeGenerator:
    """
    Builds a confidence_envelope dict for a MemoryNode.

    Only reads node/provenance fields — never mutates them.
    Stateless, therefore safe to call from any thread.
    """

    @staticmethod
    def _reliability(node: "MemoryNode") -> float:
        """
        Reliability in [0, 1]: mean of the Bayesian posterior when a
        `_bayes` state is attached, else the node's ltp_strength
        (0.5 when neither is present).
        """
        posterior = getattr(node, "_bayes", None)
        if posterior is None:
            return float(getattr(node, "ltp_strength", 0.5))
        return float(posterior.mean)

    @staticmethod
    def _staleness_days(node: "MemoryNode", provenance: Optional["ProvenanceRecord"]) -> float:
        """
        Days since the most recent successful verification; falls back to
        days since last access, then 0.0 when neither is available.
        """
        now = datetime.now(timezone.utc)

        if provenance:
            # Walk the lineage backwards: newest positive 'verified' event wins.
            for evt in reversed(provenance.lineage):
                if evt.event != "verified" or evt.outcome is not True:
                    continue
                try:
                    stamp = datetime.fromisoformat(evt.timestamp)
                    if stamp.tzinfo is None:
                        # Naive timestamps are assumed to be UTC.
                        stamp = stamp.replace(tzinfo=timezone.utc)
                    return (now - stamp).total_seconds() / 86400.0
                except (ValueError, TypeError):
                    # Unparsable timestamp — keep scanning older events.
                    continue

        last = getattr(node, "last_accessed", None)
        if last is None:
            return 0.0
        if getattr(last, "tzinfo", None) is None:
            last = last.replace(tzinfo=timezone.utc)
        return (now - last).total_seconds() / 86400.0

    @classmethod
    def build(
        cls,
        node: "MemoryNode",
        provenance: Optional["ProvenanceRecord"] = None,
    ) -> Dict[str, Any]:
        """
        Assemble the full confidence_envelope dict for *node*.

        The result is JSON-serializable and contains the discrete trust
        level plus every raw signal that produced it.
        """
        reliability = cls._reliability(node)
        evidence: int = getattr(node, "access_count", 1)
        age_days: float = cls._staleness_days(node, provenance)

        # Source trust: weighted by provenance origin type ("unknown" → 0.5).
        origin_kind = provenance.origin.type if provenance else "unknown"
        trust = SOURCE_TRUST.get(origin_kind, 0.5)

        contradicted = provenance.is_contradicted() if provenance else False

        # Timestamp of the newest positive verification, if any.
        verified_at: Optional[str] = None
        if provenance:
            verified_at = next(
                (
                    evt.timestamp
                    for evt in reversed(provenance.lineage)
                    if evt.event == "verified" and evt.outcome is True
                ),
                None,
            )

        # Discrete level: contradiction and staleness veto everything else;
        # "high" additionally requires strong evidence and a trusted source.
        if contradicted:
            level = LEVEL_CONTRADICTED
        elif age_days > STALENESS_STALE_DAYS:
            level = LEVEL_STALE
        elif (
            reliability >= RELIABILITY_HIGH_THRESHOLD
            and evidence >= ACCESS_COUNT_HIGH_EVIDENCE
            and trust >= 0.75
        ):
            level = LEVEL_HIGH
        elif reliability >= RELIABILITY_MEDIUM_THRESHOLD and evidence >= ACCESS_COUNT_MIN_EVIDENCE:
            level = LEVEL_MEDIUM
        else:
            level = LEVEL_LOW

        envelope: Dict[str, Any] = {
            "level": level,
            "reliability": round(reliability, 4),
            "access_count": evidence,
            "staleness_days": round(age_days, 1),
            "source_type": origin_kind,
            "source_trust": round(trust, 2),
            "is_contradicted": contradicted,
        }
        if verified_at:
            envelope["last_verified"] = verified_at
        return envelope
176
+
177
+
178
+ # ------------------------------------------------------------------ #
179
+ # Convenience function #
180
+ # ------------------------------------------------------------------ #
181
+
182
def build_confidence_envelope(
    node: "MemoryNode",
    provenance: Optional["ProvenanceRecord"] = None,
) -> Dict[str, Any]:
    """
    Module-level shortcut around ConfidenceEnvelopeGenerator.build().

    Args:
        node: MemoryNode whose trust signals are evaluated.
        provenance: Optional ProvenanceRecord backing the node.

    Returns:
        A JSON-serializable confidence_envelope dict: discrete level,
        reliability, staleness_days, source info, contradiction flag.
    """
    return ConfidenceEnvelopeGenerator.build(node, provenance)
src/mnemocore/core/config.py CHANGED
@@ -139,6 +139,37 @@ class EncodingConfig:
139
  token_method: str = "bundle"
140
 
141
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
142
  @dataclass(frozen=True)
143
  class DreamLoopConfig:
144
  """Configuration for the dream loop (subconscious background processing)."""
@@ -194,11 +225,19 @@ class SubconsciousAIConfig:
194
  max_memories_per_cycle: int = 10 # Process at most N memories per pulse
195
 
196
 
 
 
 
 
 
 
 
 
197
  @dataclass(frozen=True)
198
  class HAIMConfig:
199
  """Root configuration for the HAIM system."""
200
 
201
- version: str = "3.0"
202
  dimensionality: int = 16384
203
  encoding: EncodingConfig = field(default_factory=EncodingConfig)
204
  tiers_hot: TierConfig = field(
@@ -230,8 +269,13 @@ class HAIMConfig:
230
  paths: PathsConfig = field(default_factory=PathsConfig)
231
  consolidation: ConsolidationConfig = field(default_factory=ConsolidationConfig)
232
  attention_masking: AttentionMaskingConfig = field(default_factory=AttentionMaskingConfig)
 
 
 
 
233
  dream_loop: DreamLoopConfig = field(default_factory=DreamLoopConfig)
234
  subconscious_ai: SubconsciousAIConfig = field(default_factory=SubconsciousAIConfig)
 
235
 
236
 
237
  def _env_override(key: str, default):
@@ -347,15 +391,6 @@ def load_config(path: Optional[Path] = None) -> HAIMConfig:
347
  token_method=enc_raw.get("token_method", "bundle"),
348
  )
349
 
350
- # Build LTP config
351
- ltp_raw = raw.get("ltp") or {}
352
- ltp = LTPConfig(
353
- initial_importance=ltp_raw.get("initial_importance", 0.5),
354
- decay_lambda=ltp_raw.get("decay_lambda", 0.01),
355
- permanence_threshold=ltp_raw.get("permanence_threshold", 0.95),
356
- half_life_days=ltp_raw.get("half_life_days", 30.0),
357
- )
358
-
359
  # Build paths config
360
  paths_raw = raw.get("paths") or {}
361
  paths = PathsConfig(
@@ -499,6 +534,37 @@ def load_config(path: Optional[Path] = None) -> HAIMConfig:
499
  model=_env_override("DREAM_LOOP_MODEL", dream_raw.get("model", "gemma3:1b")),
500
  )
501
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
502
  # Build subconscious AI config (Phase 4.4 BETA)
503
  sub_raw = raw.get("subconscious_ai") or {}
504
  subconscious_ai = SubconsciousAIConfig(
@@ -524,8 +590,17 @@ def load_config(path: Optional[Path] = None) -> HAIMConfig:
524
  max_memories_per_cycle=_env_override("SUBCONSCIOUS_AI_MAX_MEMORIES_PER_CYCLE", sub_raw.get("max_memories_per_cycle", 10)),
525
  )
526
 
 
 
 
 
 
 
 
 
 
527
  return HAIMConfig(
528
- version=raw.get("version", "3.0"),
529
  dimensionality=dimensionality,
530
  encoding=encoding,
531
  tiers_hot=_build_tier("hot", hot_raw),
@@ -542,8 +617,13 @@ def load_config(path: Optional[Path] = None) -> HAIMConfig:
542
  paths=paths,
543
  consolidation=consolidation,
544
  attention_masking=attention_masking,
 
 
 
 
545
  dream_loop=dream_loop,
546
  subconscious_ai=subconscious_ai,
 
547
  )
548
 
549
 
 
139
  token_method: str = "bundle"
140
 
141
 
142
@dataclass(frozen=True)
class SynapseConfig:
    """Configuration for Phase 12.1: Aggressive Synapse Formation"""
    # Minimum similarity score before two memories are linked
    # (env override: SYNAPSE_SIMILARITY_THRESHOLD).
    similarity_threshold: float = 0.5
    # Create synapses automatically at store time
    # (env override: SYNAPSE_AUTO_BIND_ON_STORE).
    auto_bind_on_store: bool = True
    # Depth limit for multi-hop association traversal
    # (env override: SYNAPSE_MULTI_HOP_DEPTH).
    multi_hop_depth: int = 2
148
+
149
+
150
@dataclass(frozen=True)
class ContextConfig:
    """Configuration for Phase 12.2: Contextual Awareness"""
    # Master switch for context tracking (env override: CONTEXT_ENABLED).
    enabled: bool = True
    # Threshold above which a context shift is assumed
    # (env override: CONTEXT_SHIFT_THRESHOLD).
    shift_threshold: float = 0.3
    # Size of the rolling context window
    # (env override: CONTEXT_ROLLING_WINDOW_SIZE).
    rolling_window_size: int = 5
156
+
157
+
158
@dataclass(frozen=True)
class PreferenceConfig:
    """Configuration for Phase 12.3: Preference Learning"""
    # Master switch for preference learning (env override: PREFERENCE_ENABLED).
    enabled: bool = True
    # Update step size for learned preferences
    # (env override: PREFERENCE_LEARNING_RATE).
    learning_rate: float = 0.1
    # Maximum retained history entries
    # (env override: PREFERENCE_HISTORY_LIMIT).
    history_limit: int = 100
164
+
165
+
166
@dataclass(frozen=True)
class AnticipatoryConfig:
    """Configuration for Phase 13.2: Anticipatory Memory"""
    # Master switch for anticipatory retrieval (env override: ANTICIPATORY_ENABLED).
    enabled: bool = True
    # How many steps ahead predictions reach
    # (env override: ANTICIPATORY_PREDICTIVE_DEPTH).
    predictive_depth: int = 1
171
+
172
+
173
  @dataclass(frozen=True)
174
  class DreamLoopConfig:
175
  """Configuration for the dream loop (subconscious background processing)."""
 
225
  max_memories_per_cycle: int = 10 # Process at most N memories per pulse
226
 
227
 
228
@dataclass(frozen=True)
class PulseConfig:
    """Configuration for Phase 5 AGI Pulse Loop orchestrator."""
    # Master switch for the pulse loop (env override: PULSE_ENABLED).
    enabled: bool = True
    # Seconds between pulse ticks (env override: PULSE_INTERVAL_SECONDS).
    interval_seconds: int = 30
    # Upper bound on agents processed per tick
    # (env override: PULSE_MAX_AGENTS_PER_TICK).
    max_agents_per_tick: int = 50
    # Upper bound on episodes processed per tick
    # (env override: PULSE_MAX_EPISODES_PER_TICK).
    max_episodes_per_tick: int = 200
235
+
236
  @dataclass(frozen=True)
237
  class HAIMConfig:
238
  """Root configuration for the HAIM system."""
239
 
240
+ version: str = "4.5"
241
  dimensionality: int = 16384
242
  encoding: EncodingConfig = field(default_factory=EncodingConfig)
243
  tiers_hot: TierConfig = field(
 
269
  paths: PathsConfig = field(default_factory=PathsConfig)
270
  consolidation: ConsolidationConfig = field(default_factory=ConsolidationConfig)
271
  attention_masking: AttentionMaskingConfig = field(default_factory=AttentionMaskingConfig)
272
+ synapse: SynapseConfig = field(default_factory=SynapseConfig)
273
+ context: ContextConfig = field(default_factory=ContextConfig)
274
+ preference: PreferenceConfig = field(default_factory=PreferenceConfig)
275
+ anticipatory: AnticipatoryConfig = field(default_factory=AnticipatoryConfig)
276
  dream_loop: DreamLoopConfig = field(default_factory=DreamLoopConfig)
277
  subconscious_ai: SubconsciousAIConfig = field(default_factory=SubconsciousAIConfig)
278
+ pulse: PulseConfig = field(default_factory=PulseConfig)
279
 
280
 
281
  def _env_override(key: str, default):
 
391
  token_method=enc_raw.get("token_method", "bundle"),
392
  )
393
 
 
 
 
 
 
 
 
 
 
394
  # Build paths config
395
  paths_raw = raw.get("paths") or {}
396
  paths = PathsConfig(
 
534
  model=_env_override("DREAM_LOOP_MODEL", dream_raw.get("model", "gemma3:1b")),
535
  )
536
 
537
+ # Build synapse config (Phase 12.1)
538
+ syn_raw = raw.get("synapse") or {}
539
+ synapse = SynapseConfig(
540
+ similarity_threshold=_env_override("SYNAPSE_SIMILARITY_THRESHOLD", syn_raw.get("similarity_threshold", 0.5)),
541
+ auto_bind_on_store=_env_override("SYNAPSE_AUTO_BIND_ON_STORE", syn_raw.get("auto_bind_on_store", True)),
542
+ multi_hop_depth=_env_override("SYNAPSE_MULTI_HOP_DEPTH", syn_raw.get("multi_hop_depth", 2)),
543
+ )
544
+
545
+ # Build context config (Phase 12.2)
546
+ ctx_raw = raw.get("context") or {}
547
+ context = ContextConfig(
548
+ enabled=_env_override("CONTEXT_ENABLED", ctx_raw.get("enabled", True)),
549
+ shift_threshold=_env_override("CONTEXT_SHIFT_THRESHOLD", ctx_raw.get("shift_threshold", 0.3)),
550
+ rolling_window_size=_env_override("CONTEXT_ROLLING_WINDOW_SIZE", ctx_raw.get("rolling_window_size", 5)),
551
+ )
552
+
553
+ # Build preference config (Phase 12.3)
554
+ pref_raw = raw.get("preference") or {}
555
+ preference = PreferenceConfig(
556
+ enabled=_env_override("PREFERENCE_ENABLED", pref_raw.get("enabled", True)),
557
+ learning_rate=_env_override("PREFERENCE_LEARNING_RATE", pref_raw.get("learning_rate", 0.1)),
558
+ history_limit=_env_override("PREFERENCE_HISTORY_LIMIT", pref_raw.get("history_limit", 100)),
559
+ )
560
+
561
+ # Build anticipatory config (Phase 13.2)
562
+ ant_raw = raw.get("anticipatory") or {}
563
+ anticipatory = AnticipatoryConfig(
564
+ enabled=_env_override("ANTICIPATORY_ENABLED", ant_raw.get("enabled", True)),
565
+ predictive_depth=_env_override("ANTICIPATORY_PREDICTIVE_DEPTH", ant_raw.get("predictive_depth", 1)),
566
+ )
567
+
568
  # Build subconscious AI config (Phase 4.4 BETA)
569
  sub_raw = raw.get("subconscious_ai") or {}
570
  subconscious_ai = SubconsciousAIConfig(
 
590
  max_memories_per_cycle=_env_override("SUBCONSCIOUS_AI_MAX_MEMORIES_PER_CYCLE", sub_raw.get("max_memories_per_cycle", 10)),
591
  )
592
 
593
+ # Build pulse config (Phase 5.0)
594
+ pulse_raw = raw.get("pulse") or {}
595
+ pulse = PulseConfig(
596
+ enabled=_env_override("PULSE_ENABLED", pulse_raw.get("enabled", True)),
597
+ interval_seconds=_env_override("PULSE_INTERVAL_SECONDS", pulse_raw.get("interval_seconds", 30)),
598
+ max_agents_per_tick=_env_override("PULSE_MAX_AGENTS_PER_TICK", pulse_raw.get("max_agents_per_tick", 50)),
599
+ max_episodes_per_tick=_env_override("PULSE_MAX_EPISODES_PER_TICK", pulse_raw.get("max_episodes_per_tick", 200)),
600
+ )
601
+
602
  return HAIMConfig(
603
+ version=raw.get("version", "4.5"),
604
  dimensionality=dimensionality,
605
  encoding=encoding,
606
  tiers_hot=_build_tier("hot", hot_raw),
 
617
  paths=paths,
618
  consolidation=consolidation,
619
  attention_masking=attention_masking,
620
+ synapse=synapse,
621
+ context=context,
622
+ preference=preference,
623
+ anticipatory=anticipatory,
624
  dream_loop=dream_loop,
625
  subconscious_ai=subconscious_ai,
626
+ pulse=pulse,
627
  )
628
 
629
 
src/mnemocore/core/container.py CHANGED
@@ -12,6 +12,14 @@ from .config import HAIMConfig
12
  from .async_storage import AsyncRedisStorage
13
  from .qdrant_store import QdrantStore
14
 
 
 
 
 
 
 
 
 
15
 
16
  @dataclass
17
  class Container:
@@ -21,6 +29,14 @@ class Container:
21
  config: HAIMConfig
22
  redis_storage: Optional[AsyncRedisStorage] = None
23
  qdrant_store: Optional[QdrantStore] = None
 
 
 
 
 
 
 
 
24
 
25
 
26
  def build_container(config: HAIMConfig) -> Container:
@@ -57,6 +73,14 @@ def build_container(config: HAIMConfig) -> Container:
57
  hnsw_ef_construct=config.qdrant.hnsw_ef_construct,
58
  )
59
 
 
 
 
 
 
 
 
 
60
  return container
61
 
62
 
 
12
  from .async_storage import AsyncRedisStorage
13
  from .qdrant_store import QdrantStore
14
 
15
+ # Phase 5 AGI Services
16
+ from .working_memory import WorkingMemoryService
17
+ from .episodic_store import EpisodicStoreService
18
+ from .semantic_store import SemanticStoreService
19
+ from .procedural_store import ProceduralStoreService
20
+ from .meta_memory import MetaMemoryService
21
+ from .agent_profile import AgentProfileService
22
+
23
 
24
  @dataclass
25
  class Container:
 
29
  config: HAIMConfig
30
  redis_storage: Optional[AsyncRedisStorage] = None
31
  qdrant_store: Optional[QdrantStore] = None
32
+
33
+ # Phase 5 Services
34
+ working_memory: Optional[WorkingMemoryService] = None
35
+ episodic_store: Optional[EpisodicStoreService] = None
36
+ semantic_store: Optional[SemanticStoreService] = None
37
+ procedural_store: Optional[ProceduralStoreService] = None
38
+ meta_memory: Optional[MetaMemoryService] = None
39
+ agent_profiles: Optional[AgentProfileService] = None
40
 
41
 
42
  def build_container(config: HAIMConfig) -> Container:
 
73
  hnsw_ef_construct=config.qdrant.hnsw_ef_construct,
74
  )
75
 
76
+ # Initialize Phase 5 AGI Services
77
+ container.working_memory = WorkingMemoryService()
78
+ container.episodic_store = EpisodicStoreService()
79
+ container.semantic_store = SemanticStoreService(qdrant_store=container.qdrant_store)
80
+ container.procedural_store = ProceduralStoreService()
81
+ container.meta_memory = MetaMemoryService()
82
+ container.agent_profiles = AgentProfileService()
83
+
84
  return container
85
 
86
 
src/mnemocore/core/contradiction.py ADDED
@@ -0,0 +1,336 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Contradiction Detection Module (Phase 5.0)
3
+ ==========================================
4
+ Detects contradicting memories in MnemoCore using a two-stage pipeline:
5
+
6
+ Stage 1: TextEncoder similarity search (fast, vector-based)
7
+ - At /store time: compare new memory against top-5 existing memories
8
+ - If similarity > SIMILARITY_THRESHOLD (0.80) → proceed to Stage 2
9
+
10
+ Stage 2: LLM-based semantic comparison (accurate, but heavier)
11
+ - Uses SubconsciousAI connector to evaluate if two memories actually contradict
12
+ - Avoids false positives from paraphrases (similarity doesn't mean contradiction)
13
+
14
+ On confirmed contradiction:
15
+ - Both memories receive a 'contradiction_group_id' in their provenance lineage
16
+ - Both are flagged in their metadata
17
+ - The API returns an alert in the store response
18
+ - Entries are added to a ContradictionRegistry for the /contradictions endpoint
19
+
20
+ Background scan:
21
+ - ContradictionDetector.scan(nodes) can be called from ConsolidationWorker
22
+
23
+ Public API:
24
+ detector = ContradictionDetector(engine)
25
+ result = await detector.check_on_store(new_content, new_node, existing_nodes)
26
+ all = detector.registry.list_all()
27
+ """
28
+
29
+ from __future__ import annotations
30
+
31
+ import uuid
32
+ from dataclasses import dataclass, field
33
+ from datetime import datetime, timezone
34
+ from typing import TYPE_CHECKING, Any, Dict, List, Optional, Tuple
35
+
36
+ from loguru import logger
37
+
38
+ if TYPE_CHECKING:
39
+ from .node import MemoryNode
40
+
41
+
42
+ # ------------------------------------------------------------------ #
43
+ # Thresholds #
44
+ # ------------------------------------------------------------------ #
45
+
46
+ SIMILARITY_THRESHOLD: float = 0.80 # Above this → suspect contradiction
47
+ LLM_CONFIRM_MIN_SCORE: float = 0.70 # LLM contradiction confidence minimum
48
+
49
+
50
+ # ------------------------------------------------------------------ #
51
+ # ContradictionRecord #
52
+ # ------------------------------------------------------------------ #
53
+
54
@dataclass
class ContradictionRecord:
    """A detected contradiction between two memories."""
    # Random group id shared by both flagged memories.
    group_id: str = field(default_factory=lambda: f"cg_{uuid.uuid4().hex[:12]}")
    memory_a_id: str = ""
    memory_b_id: str = ""
    similarity_score: float = 0.0
    # True only when the LLM confirmed the contradiction with high confidence.
    llm_confirmed: bool = False
    detected_at: str = field(
        default_factory=lambda: datetime.now(timezone.utc).isoformat()
    )
    resolved: bool = False
    resolution_note: Optional[str] = None

    def to_dict(self) -> Dict[str, Any]:
        """Serialize to a plain JSON-ready dict (similarity rounded to 4 dp)."""
        payload: Dict[str, Any] = {
            "group_id": self.group_id,
            "memory_a_id": self.memory_a_id,
            "memory_b_id": self.memory_b_id,
            "similarity_score": round(self.similarity_score, 4),
            "llm_confirmed": self.llm_confirmed,
            "detected_at": self.detected_at,
            "resolved": self.resolved,
            "resolution_note": self.resolution_note,
        }
        return payload
79
+
80
+
81
+ # ------------------------------------------------------------------ #
82
+ # ContradictionRegistry #
83
+ # ------------------------------------------------------------------ #
84
+
85
class ContradictionRegistry:
    """In-memory store of detected contradictions (survives until restart)."""

    def __init__(self) -> None:
        # Keyed by contradiction group_id for O(1) resolution lookups.
        self._records: Dict[str, "ContradictionRecord"] = {}

    def register(self, record: "ContradictionRecord") -> None:
        """Add (or overwrite) a record under its group id."""
        self._records[record.group_id] = record

    def resolve(self, group_id: str, note: Optional[str] = None) -> bool:
        """Mark a contradiction group resolved; returns False for unknown ids."""
        rec = self._records.get(group_id)
        if rec is None:
            return False
        rec.resolved = True
        rec.resolution_note = note
        return True

    def list_all(self, unresolved_only: bool = True) -> List["ContradictionRecord"]:
        """All records, newest first; by default only unresolved ones."""
        records = [
            r for r in self._records.values()
            if not (unresolved_only and r.resolved)
        ]
        return sorted(records, key=lambda r: r.detected_at, reverse=True)

    def list_for_memory(self, memory_id: str) -> List["ContradictionRecord"]:
        """Every contradiction involving the given memory id (either side)."""
        return [
            r for r in self._records.values()
            if memory_id in (r.memory_a_id, r.memory_b_id)
        ]

    def __len__(self) -> int:
        # len() reports only the *unresolved* contradiction count.
        return sum(1 for r in self._records.values() if not r.resolved)
115
+
116
+
117
+ # ------------------------------------------------------------------ #
118
+ # ContradictionDetector #
119
+ # ------------------------------------------------------------------ #
120
+
121
class ContradictionDetector:
    """
    Two-stage contradiction detector.

    Stage 1: Vector similarity via the engine's binary HDV comparison.
    Stage 2: LLM semantic check via SubconsciousAI (optional).

    Confirmed contradictions are recorded in `self.registry` and both
    involved nodes are flagged via metadata + provenance.
    """

    def __init__(
        self,
        engine=None,  # HAIMEngine — optional; if None, similarity check uses fallback
        similarity_threshold: float = SIMILARITY_THRESHOLD,
        top_k: int = 5,
        use_llm: bool = True,
    ) -> None:
        # engine: supplies query()/get_memory() for candidate fetch and,
        #         when present, a `subconscious_ai` connector for Stage 2.
        # similarity_threshold: Stage-1 cutoff; pairs below it are ignored.
        # top_k: number of nearest memories fetched at store time.
        # use_llm: disable to fall back to similarity-only detection.
        self.engine = engine
        self.similarity_threshold = similarity_threshold
        self.top_k = top_k
        self.use_llm = use_llm
        self.registry = ContradictionRegistry()

    # ---- Similarity helpers -------------------------------------- #

    def _hamming_similarity(self, node_a: "MemoryNode", node_b: "MemoryNode") -> float:
        """
        Compute binary HDV similarity between two nodes.
        Similarity = 1 - normalized_hamming_distance.

        Returns 0.0 on any failure (missing hdv, empty data, ...).
        """
        try:
            import numpy as np
            a = node_a.hdv.data
            b = node_b.hdv.data
            xor = np.bitwise_xor(a, b)
            # Popcount of the XOR: convert the byte buffer to one big int
            # and count its set bits.
            ham = float(bin(int.from_bytes(xor.tobytes(), "little")).count("1"))
            dim = len(a) * 8  # packed uint8 bytes → bit count
            return 1.0 - ham / dim
        except Exception:
            # Broad catch is deliberate: similarity is best-effort and must
            # never break the store path (includes dim == 0 division).
            return 0.0

    # ---- LLM contradiction check --------------------------------- #

    async def _llm_contradicts(
        self, content_a: str, content_b: str
    ) -> Tuple[bool, float]:
        """
        Ask SubconsciousAI if two contents contradict each other.
        Returns (is_contradiction, confidence_score).
        Falls back to (False, 0.0) if LLM is unavailable or its reply
        cannot be parsed as JSON.
        """
        if not self.engine or not self.use_llm:
            return False, 0.0

        try:
            subcon = getattr(self.engine, "subconscious_ai", None)
            if subcon is None:
                return False, 0.0

            # Contents are truncated to 500 chars to bound token usage.
            prompt = (
                "Do the following two statements contradict each other? "
                "Answer with a JSON object: {\"contradiction\": true/false, \"confidence\": 0.0-1.0}.\n\n"
                f"Statement A: {content_a[:500]}\n"
                f"Statement B: {content_b[:500]}"
            )
            raw = await subcon.generate(prompt, max_tokens=64)
            import json as _json
            # NOTE(review): assumes the model answers with bare JSON — a
            # fenced/wrapped reply lands in the except branch below.
            parsed = _json.loads(raw.strip())
            return bool(parsed.get("contradiction", False)), float(parsed.get("confidence", 0.0))
        except Exception as exc:
            logger.debug(f"LLM contradiction check failed: {exc}")
            return False, 0.0

    # ---- Flag helpers ------------------------------------------- #

    def _flag_node(self, node: "MemoryNode", group_id: str) -> None:
        """Attach contradiction metadata to a node's provenance and metadata fields."""
        node.metadata["contradiction_group_id"] = group_id
        node.metadata["contradicted_at"] = datetime.now(timezone.utc).isoformat()

        # Provenance may be absent on older nodes; flag only when present.
        prov = getattr(node, "provenance", None)
        if prov is not None:
            prov.mark_contradicted(group_id)

    # ---- Main API ------------------------------------------------ #

    async def check_on_store(
        self,
        new_node: "MemoryNode",
        candidates: Optional[List["MemoryNode"]] = None,
    ) -> Optional[ContradictionRecord]:
        """
        Check a newly stored node against existing memories.

        Args:
            new_node: The node just stored.
            candidates: Optional pre-fetched list of nodes to compare against.
                        If None and engine is available, fetches via HDV search.

        Returns:
            ContradictionRecord if a contradiction was detected, else None.
        """
        # Fetch candidates if not provided
        if candidates is None and self.engine is not None:
            try:
                results = await self.engine.query(
                    new_node.content, top_k=self.top_k
                )
                nodes = []
                for mem_id, _score in results:
                    n = await self.engine.get_memory(mem_id)
                    # Exclude the new node itself — the query may return it.
                    if n and n.id != new_node.id:
                        nodes.append(n)
                candidates = nodes
            except Exception as e:
                # Detection is best-effort; never break the store path.
                logger.debug(f"ContradictionDetector: candidate fetch failed: {e}")
                candidates = []

        if not candidates:
            return None

        # Stage 1: similarity filter
        high_sim_candidates = []
        for cand in candidates:
            sim = self._hamming_similarity(new_node, cand)
            if sim >= self.similarity_threshold:
                high_sim_candidates.append((cand, sim))

        if not high_sim_candidates:
            return None

        # Stage 2: LLM confirmation for the highest-similarity candidate
        # (only the single best match is escalated to the LLM).
        high_sim_candidates.sort(key=lambda x: x[1], reverse=True)
        top_cand, top_sim = high_sim_candidates[0]

        is_contradiction = False
        llm_confirmed = False

        if self.use_llm:
            is_contradiction, conf = await self._llm_contradicts(
                new_node.content, top_cand.content
            )
            # Confirmed only when the LLM is sufficiently confident.
            llm_confirmed = is_contradiction and conf >= LLM_CONFIRM_MIN_SCORE
        else:
            # Without LLM, use high similarity as a soft contradiction signal
            is_contradiction = top_sim >= 0.90
            llm_confirmed = False

        if not is_contradiction:
            return None

        # Register the contradiction
        record = ContradictionRecord(
            memory_a_id=new_node.id,
            memory_b_id=top_cand.id,
            similarity_score=top_sim,
            llm_confirmed=llm_confirmed,
        )
        self.registry.register(record)
        self._flag_node(new_node, record.group_id)
        self._flag_node(top_cand, record.group_id)

        logger.warning(
            f"⚠️ Contradiction detected: {new_node.id[:8]} ↔ {top_cand.id[:8]} "
            f"(sim={top_sim:.3f}, llm_confirmed={llm_confirmed}, group={record.group_id})"
        )
        return record

    async def scan(self, nodes: "List[MemoryNode]") -> List[ContradictionRecord]:
        """
        Background scan: compare each node against its peers in the provided list.
        Called periodically from ConsolidationWorker.

        NOTE(review): O(n²) pairwise comparison with one LLM call per
        high-similarity pair — keep the input batch small.

        Returns all newly detected contradiction records.
        """
        found: List[ContradictionRecord] = []
        n = len(nodes)
        for i in range(n):
            for j in range(i + 1, n):
                sim = self._hamming_similarity(nodes[i], nodes[j])
                if sim < self.similarity_threshold:
                    continue
                is_contradiction, _ = await self._llm_contradicts(
                    nodes[i].content, nodes[j].content
                )
                if not is_contradiction:
                    continue
                record = ContradictionRecord(
                    memory_a_id=nodes[i].id,
                    memory_b_id=nodes[j].id,
                    similarity_score=sim,
                    llm_confirmed=True,
                )
                self.registry.register(record)
                self._flag_node(nodes[i], record.group_id)
                self._flag_node(nodes[j], record.group_id)
                found.append(record)

        if found:
            logger.info(f"ContradictionDetector background scan: {len(found)} contradictions found in {n} nodes")
        return found
320
+
321
+
322
+ # ------------------------------------------------------------------ #
323
+ # Module singleton #
324
+ # ------------------------------------------------------------------ #
325
+
326
# Lazily created process-wide detector instance.
_DETECTOR: "ContradictionDetector | None" = None


def get_contradiction_detector(engine=None) -> ContradictionDetector:
    """
    Return the shared ContradictionDetector singleton.

    The first call creates the instance; if it was created without an
    engine, a later call may attach one.
    """
    global _DETECTOR
    if _DETECTOR is None:
        _DETECTOR = ContradictionDetector(engine=engine)
        return _DETECTOR
    if engine is not None and _DETECTOR.engine is None:
        _DETECTOR.engine = engine
    return _DETECTOR
src/mnemocore/core/cross_domain.py ADDED
@@ -0,0 +1,211 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Cross-Domain Association Builder (Phase 5.0 — Agent 3)
3
+ =======================================================
4
+ Automatically links memories across three semantic domains:
5
+
6
+ strategic – goals, decisions, roadmaps, strategies
7
+ operational – code, bugs, documentation, tasks
8
+ personal – preferences, habits, relationships, context
9
+
10
+ Cross-domain synapses improve holistic reasoning: when a strategic
11
+ goal changes, the system can surface related operational tasks or
12
+ personal context without being explicitly queried.
13
+
14
+ Implementation:
15
+ - Each memory is tagged with a `domain` in its metadata (or inferred)
16
+ - CrossDomainSynapseBuilder monitors recently stored memories
17
+ - Co-occurrence within a time window → create a cross-domain synapse
18
+ - Synapse weight is damped (0.2×) relative to intra-domain (1.0×)
19
+
20
+ Integration with RippleContext:
21
+ - ripple_context.py uses domain_weight when propagating context
22
+ - Cross-domain propagation uses CROSS_DOMAIN_WEIGHT as the multiplier
23
+
24
+ Public API:
25
+ builder = CrossDomainSynapseBuilder(engine)
26
+ await builder.process_new_memory(node) # call after /store
27
+ pairs = await builder.scan_recent(hours=1) # background scan
28
+ """
29
+
30
+ from __future__ import annotations
31
+
32
+ from datetime import datetime, timezone, timedelta
33
+ from typing import TYPE_CHECKING, Dict, List, Optional, Set, Tuple
34
+ from loguru import logger
35
+
36
+ if TYPE_CHECKING:
37
+ from .node import MemoryNode
38
+
39
+
40
+ # ------------------------------------------------------------------ #
41
+ # Constants #
42
+ # ------------------------------------------------------------------ #
43
+
44
DOMAINS = {"strategic", "operational", "personal"}
DEFAULT_DOMAIN = "operational"

# Weight applied to cross-domain synapses (vs 1.0 for intra-domain)
CROSS_DOMAIN_WEIGHT: float = 0.2

# Time window for co-occurrence detection (hours)
COOCCURRENCE_WINDOW_HOURS: float = 2.0

# Keywords used to infer domain automatically if not tagged.
# Matching is by substring against the lowercased content.
DOMAIN_KEYWORDS: Dict[str, List[str]] = {
    "strategic": [
        "goal", "strategy", "roadmap", "vision", "mission", "objective",
        "decision", "priority", "kpi", "okr", "plan", "budget", "market",
    ],
    "personal": [
        # Fix: removed duplicated "prefer" — a duplicate keyword made a
        # single occurrence count twice and skewed domain scoring.
        "prefer", "habit", "feel", "emotion", "like", "dislike",
        "relationship", "trust", "colleague", "friend", "name", "remember me",
    ],
    "operational": [
        "code", "bug", "fix", "implement", "test", "deploy", "api",
        "function", "class", "module", "error", "exception", "task", "ticket",
    ],
}


# ------------------------------------------------------------------ #
# Domain inference                                                   #
# ------------------------------------------------------------------ #

def infer_domain(content: str, metadata: Optional[Dict] = None) -> str:
    """
    Infer the semantic domain of a memory from its content and metadata.

    Priority:
        1. metadata["domain"] if set and recognised
        2. keyword match in content (highest hit count wins; ties keep
           the first dict-order winner, strategic > personal > operational)
        3. DEFAULT_DOMAIN ("operational")

    Args:
        content: Raw memory text.
        metadata: Optional metadata dict, may carry an explicit "domain".

    Returns:
        One of DOMAINS.
    """
    if metadata and "domain" in metadata:
        # Fix: coerce to str before .lower() so a malformed (non-string)
        # metadata value degrades to DEFAULT_DOMAIN instead of raising.
        d = str(metadata["domain"]).lower()
        return d if d in DOMAINS else DEFAULT_DOMAIN

    content_lower = content.lower()
    best_domain = DEFAULT_DOMAIN
    best_count = 0

    for domain, keywords in DOMAIN_KEYWORDS.items():
        count = sum(1 for kw in keywords if kw in content_lower)
        if count > best_count:
            best_count = count
            best_domain = domain

    return best_domain
98
+
99
+
100
+ # ------------------------------------------------------------------ #
101
+ # CrossDomainSynapseBuilder #
102
+ # ------------------------------------------------------------------ #
103
+
104
class CrossDomainSynapseBuilder:
    """
    Detects cross-domain co-occurrences and requests synapse creation.

    Works by maintaining a rolling buffer of recently stored memories,
    then pairing memories from different domains that appeared within
    COOCCURRENCE_WINDOW_HOURS of each other.

    Fix: a registry of already-linked id pairs is kept so that the
    periodic scan_recent() no longer re-creates (and repeatedly
    strengthens via add_or_strengthen) synapses that
    process_new_memory() already built — honouring the documented
    "unpaired co-occurrences" contract.
    """

    def __init__(
        self,
        engine=None,  # HAIMEngine
        window_hours: float = COOCCURRENCE_WINDOW_HOURS,
        cross_domain_weight: float = CROSS_DOMAIN_WEIGHT,
    ) -> None:
        self.engine = engine
        self.window = timedelta(hours=window_hours)
        self.weight = cross_domain_weight
        # Buffer: list of (node_id, domain, stored_at)
        self._buffer: List[Tuple[str, str, datetime]] = []
        # Canonical (sorted) id pairs for which a synapse was already requested.
        self._linked_pairs: Set[Tuple[str, str]] = set()

    # ---- Domain helpers ------------------------------------------ #

    def tag_domain(self, node: "MemoryNode") -> str:
        """Infer and write domain tag to node.metadata. Returns domain string."""
        domain = infer_domain(node.content, getattr(node, "metadata", {}))
        if hasattr(node, "metadata"):
            node.metadata["domain"] = domain
        return domain

    @staticmethod
    def _pair_key(id_a: str, id_b: str) -> Tuple[str, str]:
        """Order-independent canonical key for a node id pair."""
        return (id_a, id_b) if id_a <= id_b else (id_b, id_a)

    # ---- Synapse creation --------------------------------------- #

    async def _create_synapse(self, id_a: str, id_b: str) -> None:
        """
        Request synapse creation between two nodes via the engine's synapse index.
        Weight is damped by CROSS_DOMAIN_WEIGHT.
        """
        if self.engine is None:
            logger.debug(f"CrossDomain: no engine, skipping synapse {id_a[:8]} ↔ {id_b[:8]}")
            return
        try:
            synapse_index = getattr(self.engine, "synapse_index", None)
            if synapse_index is not None:
                synapse_index.add_or_strengthen(id_a, id_b, delta=self.weight)
                logger.debug(
                    f"CrossDomain synapse created: {id_a[:8]} ↔ {id_b[:8]} weight={self.weight}"
                )
        except Exception as exc:
            # Best-effort: synapse creation must never break the store path.
            logger.debug(f"CrossDomain synapse creation failed: {exc}")

    # ---- Main API ----------------------------------------------- #

    async def process_new_memory(self, node: "MemoryNode") -> List[Tuple[str, str]]:
        """
        Called after a new memory is stored.
        Tags its domain and checks for cross-domain co-occurrences in the buffer.

        Returns list of (id_a, id_b) pairs for which synapses were created.
        """
        domain = self.tag_domain(node)
        now = datetime.now(timezone.utc)

        # Cut stale entries from buffer
        cutoff = now - self.window
        self._buffer = [(nid, d, ts) for nid, d, ts in self._buffer if ts >= cutoff]

        # Find cross-domain pairs with current node (skip already-linked pairs;
        # this also dedupes a node id that appears twice in the buffer).
        pairs: List[Tuple[str, str]] = []
        for existing_id, existing_domain, _ts in self._buffer:
            if existing_domain == domain:
                continue
            key = self._pair_key(node.id, existing_id)
            if key in self._linked_pairs:
                continue
            await self._create_synapse(node.id, existing_id)
            self._linked_pairs.add(key)
            pairs.append((node.id, existing_id))

        # Add current node to buffer
        self._buffer.append((node.id, domain, now))

        if pairs:
            logger.info(
                f"CrossDomain: {len(pairs)} cross-domain synapses created for node {node.id[:8]} (domain={domain})"
            )
        return pairs

    async def scan_recent(self, hours: float = 1.0) -> List[Tuple[str, str]]:
        """
        Scan the current buffer for cross-domain co-occurrences that have
        not yet been linked.

        Returns only the newly linked pairs (previously created pairs are
        skipped via the linked-pair registry).
        """
        now = datetime.now(timezone.utc)
        cutoff = now - timedelta(hours=hours)
        recent = [(nid, d, ts) for nid, d, ts in self._buffer if ts >= cutoff]

        pairs: List[Tuple[str, str]] = []
        for i in range(len(recent)):
            id_i, dom_i, _ = recent[i]
            for j in range(i + 1, len(recent)):
                id_j, dom_j, _ = recent[j]
                if dom_i == dom_j:
                    continue
                key = self._pair_key(id_i, id_j)
                if key in self._linked_pairs:
                    continue
                await self._create_synapse(id_i, id_j)
                self._linked_pairs.add(key)
                pairs.append((id_i, id_j))

        return pairs

    def clear_buffer(self) -> None:
        """Reset the co-occurrence buffer and the linked-pair registry."""
        self._buffer.clear()
        self._linked_pairs.clear()
src/mnemocore/core/emotional_tag.py ADDED
@@ -0,0 +1,124 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Emotional Tagging Module (Phase 5.0 — Agent 3)
3
+ ================================================
4
+ Adds valence/arousal emotional metadata to MemoryNode storage.
5
+
6
+ Based on affective computing research (Russell's circumplex model):
7
+ - emotional_valence: float in [-1.0, 1.0]
8
+ -1.0 = extremely negative (fear, grief)
9
+ 0.0 = neutral
10
+ +1.0 = extremely positive (joy, excitement)
11
+
12
+ - emotional_arousal: float in [0.0, 1.0]
13
+ 0.0 = calm / low energy
14
+ 1.0 = highly activated / intense
15
+
16
+ These signals are used by the SubconsciousAI dream cycle to prioritize
17
+ consolidation of high-valence, high-arousal memories (the most
18
+ biologically significant ones).
19
+
20
+ Public API:
21
+ tag = EmotionalTag(valence=0.8, arousal=0.9)
22
+ meta = tag.to_metadata_dict()
23
+ tag_back = EmotionalTag.from_metadata(node.metadata)
24
+ score = tag.salience() # combined importance weight
25
+ """
26
+
27
+ from __future__ import annotations
28
+
29
+ from dataclasses import dataclass
30
+ from typing import Any, Dict, Optional, TYPE_CHECKING
31
+
32
+ if TYPE_CHECKING:
33
+ from .node import MemoryNode
34
+
35
+
36
+ # ------------------------------------------------------------------ #
37
+ # EmotionalTag #
38
+ # ------------------------------------------------------------------ #
39
+
40
@dataclass
class EmotionalTag:
    """
    Two-dimensional emotional metadata for a memory.

    valence ∈ [-1.0, 1.0]  (-1 = very negative, +1 = very positive)
    arousal ∈ [ 0.0, 1.0]  ( 0 = calm, 1 = highly activated)

    Values outside these ranges are clamped on construction.
    """

    valence: float = 0.0
    arousal: float = 0.0

    def __post_init__(self) -> None:
        # Clamp both axes into their legal ranges and normalise to float.
        self.valence = float(min(1.0, max(-1.0, self.valence)))
        self.arousal = float(min(1.0, max(0.0, self.arousal)))

    # ---- Salience ------------------------------------------------ #

    def salience(self) -> float:
        """
        Combined salience score for dream cycle prioritization.

        High |valence| together with high arousal marks the most
        memorable memories. Result is in [0.0, 1.0].
        """
        return self.arousal * abs(self.valence)

    def is_emotionally_significant(self, threshold: float = 0.3) -> bool:
        """True if the salience is at or above *threshold*."""
        score = self.salience()
        return score >= threshold

    # ---- Serialization ------------------------------------------- #

    def to_metadata_dict(self) -> Dict[str, Any]:
        """Render the tag as metadata keys suitable for node.metadata."""
        salience_rounded = round(self.salience(), 4)
        return dict(
            emotional_valence=self.valence,
            emotional_arousal=self.arousal,
            emotional_salience=salience_rounded,
        )

    @classmethod
    def from_metadata(cls, metadata: Dict[str, Any]) -> "EmotionalTag":
        """Extract an EmotionalTag from a MemoryNode's metadata dict."""
        raw_valence = metadata.get("emotional_valence", 0.0)
        raw_arousal = metadata.get("emotional_arousal", 0.0)
        return cls(valence=float(raw_valence), arousal=float(raw_arousal))

    @classmethod
    def from_node(cls, node: "MemoryNode") -> "EmotionalTag":
        """Extract emotional tag directly from a MemoryNode."""
        meta = getattr(node, "metadata", {})
        return cls.from_metadata(meta)

    # ---- Helpers -------------------------------------------------- #

    @classmethod
    def neutral(cls) -> "EmotionalTag":
        """Factory for a neutral, calm tag."""
        return cls(valence=0.0, arousal=0.0)

    @classmethod
    def high_positive(cls) -> "EmotionalTag":
        """Factory for highly positive, highly aroused tags (e.g. breakthrough)."""
        return cls(valence=1.0, arousal=1.0)

    @classmethod
    def high_negative(cls) -> "EmotionalTag":
        """Factory for highly negative, highly aroused tags (e.g. critical failure)."""
        return cls(valence=-1.0, arousal=1.0)

    def __repr__(self) -> str:
        return f"EmotionalTag(valence={self.valence:+.2f}, arousal={self.arousal:.2f}, salience={self.salience():.2f})"
+
112
+
113
+ # ------------------------------------------------------------------ #
114
+ # Node helpers #
115
+ # ------------------------------------------------------------------ #
116
+
117
def attach_emotional_tag(node: "MemoryNode", tag: EmotionalTag) -> None:
    """Write the tag's emotional metadata into node.metadata in place."""
    for meta_key, meta_value in tag.to_metadata_dict().items():
        node.metadata[meta_key] = meta_value
120
+
121
+
122
def get_emotional_tag(node: "MemoryNode") -> EmotionalTag:
    """Read the emotional tag from a node's metadata (returns neutral if absent)."""
    # Inlined EmotionalTag.from_node: tolerate nodes without a metadata attr.
    return EmotionalTag.from_metadata(getattr(node, "metadata", {}))
src/mnemocore/core/engine.py CHANGED
@@ -39,6 +39,11 @@ from .gap_filler import GapFiller, GapFillerConfig
39
  from .synapse_index import SynapseIndex
40
  from .subconscious_ai import SubconsciousAIWorker
41
 
 
 
 
 
 
42
  # Phase 4.5: Recursive Synthesis Engine
43
  from .recursive_synthesizer import RecursiveSynthesizer, SynthesizerConfig
44
 
@@ -71,6 +76,9 @@ class HAIMEngine:
71
  persist_path: Optional[str] = None,
72
  config: Optional[HAIMConfig] = None,
73
  tier_manager: Optional[TierManager] = None,
 
 
 
74
  ):
75
  """
76
  Initialize HAIMEngine with optional dependency injection.
@@ -80,6 +88,9 @@ class HAIMEngine:
80
  persist_path: Path to memory persistence file.
81
  config: Configuration object. If None, uses global get_config().
82
  tier_manager: TierManager instance. If None, creates a new one.
 
 
 
83
  """
84
  self.config = config or get_config()
85
  self.dimension = self.config.dimensionality
@@ -89,6 +100,11 @@ class HAIMEngine:
89
 
90
  # Core Components
91
  self.tier_manager = tier_manager or TierManager(config=self.config)
 
 
 
 
 
92
  self.binary_encoder = TextEncoder(self.dimension)
93
 
94
  # ── Phase 3.x: synapse raw dicts (kept for backward compat) ──
@@ -132,6 +148,23 @@ class HAIMEngine:
132
 
133
  # ── Phase 4.5: recursive synthesizer ───────────────────────────
134
  self._recursive_synthesizer: Optional[RecursiveSynthesizer] = None
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
135
 
136
  # Conceptual Layer (VSA Soul)
137
  data_dir = self.config.paths.data_dir
@@ -337,6 +370,24 @@ class HAIMEngine:
337
  """
338
  _is_gap_fill = metadata.get("source") == "llm_gap_fill"
339
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
340
  self.subconscious_queue.append(node.id)
341
 
342
  if not _is_gap_fill:
@@ -346,6 +397,9 @@ class HAIMEngine:
346
  # Main store() method - Orchestration only
347
  # ==========================================================================
348
 
 
 
 
349
  @timer(STORE_DURATION_SECONDS, labels={"tier": "hot"})
350
  @traced("store_memory")
351
  async def store(
@@ -359,20 +413,38 @@ class HAIMEngine:
359
  Store new memory with holographic encoding.
360
 
361
  This method orchestrates the memory storage pipeline:
362
- 1. Encode input content
363
- 2. Evaluate tier placement via EIG
364
- 3. Persist to storage
365
- 4. Trigger post-store processing
 
366
 
367
  Args:
368
- content: The text content to store.
369
  metadata: Optional metadata dictionary.
370
  goal_id: Optional goal identifier for context binding.
371
  project_id: Optional project identifier for isolation masking (Phase 4.1).
372
 
373
  Returns:
374
  The unique identifier of the stored memory node.
 
 
 
 
375
  """
 
 
 
 
 
 
 
 
 
 
 
 
 
376
  # 1. Encode input and bind goal context
377
  encoded_vec, updated_metadata = await self._encode_input(content, metadata, goal_id)
378
 
@@ -387,6 +459,35 @@ class HAIMEngine:
387
  # 3. Create and persist memory node
388
  node = await self._persist_memory(content, encoded_vec, updated_metadata)
389
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
390
  # 4. Trigger post-store processing
391
  await self._trigger_post_store(node, updated_metadata)
392
 
@@ -412,24 +513,24 @@ class HAIMEngine:
412
  if node_id in self.subconscious_queue:
413
  self.subconscious_queue.remove(node_id)
414
 
415
- # 3. Phase 4.0: clean up via SynapseIndex (O(k))
 
416
  async with self.synapse_lock:
417
  removed_count = self._synapse_index.remove_node(node_id)
418
 
419
- # Rebuild legacy dicts
420
- self.synapses = dict(self._synapse_index.items())
421
- self.synapse_adjacency = {}
422
- for syn in self._synapse_index.values():
423
- self.synapse_adjacency.setdefault(syn.neuron_a_id, [])
424
- self.synapse_adjacency.setdefault(syn.neuron_b_id, [])
425
- self.synapse_adjacency[syn.neuron_a_id].append(syn)
426
- self.synapse_adjacency[syn.neuron_b_id].append(syn)
427
-
428
  if removed_count:
429
  await self._save_synapses()
430
 
431
  return deleted
432
 
 
 
 
 
 
 
 
 
433
  async def close(self):
434
  """Perform graceful shutdown of engine components."""
435
  logger.info("Shutting down HAIMEngine...")
@@ -461,6 +562,8 @@ class HAIMEngine:
461
  chrono_weight: bool = True,
462
  chrono_lambda: float = 0.0001,
463
  include_neighbors: bool = False,
 
 
464
  ) -> List[Tuple[str, float]]:
465
  """
466
  Query memories using Hamming distance.
@@ -480,10 +583,18 @@ class HAIMEngine:
480
  Formula: Final_Score = Semantic_Similarity * (1 / (1 + lambda * Time_Delta))
481
  - chrono_lambda: Decay rate in seconds^-1 (default: 0.0001 ~ 2.7h half-life).
482
  - include_neighbors: Also fetch temporal neighbors (previous/next) for top results.
 
 
 
483
  """
484
  # Encode Query
485
  query_vec = await self._run_in_thread(self.binary_encoder.encode, query_text)
486
 
 
 
 
 
 
487
  # Phase 4.1: Apply project isolation mask to query
488
  if project_id:
489
  query_vec = self.isolation_masker.apply_mask(query_vec, project_id)
@@ -494,6 +605,8 @@ class HAIMEngine:
494
  query_vec,
495
  top_k=top_k * 2,
496
  time_range=time_range,
 
 
497
  )
498
 
499
  scores: Dict[str, float] = {}
@@ -515,13 +628,38 @@ class HAIMEngine:
515
  if chrono_weight and score > 0:
516
  mem = mem_map.get(nid)
517
  if mem:
518
- time_delta = now_ts - mem.created_at.timestamp() # seconds since creation
519
  # Formula: Final = Semantic * (1 / (1 + lambda * time_delta))
520
  decay_factor = 1.0 / (1.0 + chrono_lambda * time_delta)
521
  score = score * decay_factor
522
 
 
 
 
 
 
 
 
 
 
 
523
  scores[nid] = score
524
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
525
  # 2. Associative Spreading (via SynapseIndex for O(1) adjacency lookup)
526
  if associative_jump and self._synapse_index:
527
  top_seeds = sorted(scores.items(), key=lambda x: x[1], reverse=True)[:3]
@@ -540,6 +678,15 @@ class HAIMEngine:
540
  if neighbor not in augmented_scores:
541
  mem = await self.tier_manager.get_memory(neighbor)
542
  if mem:
 
 
 
 
 
 
 
 
 
543
  augmented_scores[neighbor] = query_vec.similarity(mem.hdv)
544
 
545
  if neighbor in augmented_scores:
@@ -595,6 +742,15 @@ class HAIMEngine:
595
  if mem.previous_id:
596
  prev_mem = await self.tier_manager.get_memory(mem.previous_id)
597
  if prev_mem and prev_mem.id not in scores:
 
 
 
 
 
 
 
 
 
598
  neighbor_ids.add(prev_mem.id)
599
 
600
  # Try to find the memory that follows this one (has this as previous_id).
@@ -614,8 +770,35 @@ class HAIMEngine:
614
  # Re-sort after adding neighbors, but preserve query() top_k contract.
615
  top_results = sorted(top_results, key=lambda x: x[1], reverse=True)[:top_k]
616
 
 
 
 
 
 
 
 
617
  return top_results
618
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
619
  async def _background_dream(self, depth: int = 2):
620
  """
621
  Passive Subconscious – strengthen synapses in idle cycles.
@@ -668,12 +851,32 @@ class HAIMEngine:
668
 
669
  return sorted(active_nodes, key=score, reverse=True)[:max_collapse]
670
 
671
- async def bind_memories(self, id_a: str, id_b: str, success: bool = True):
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
672
  """
673
  Bind two memories by ID.
674
 
675
- Phase 4.0: delegates to SynapseIndex for O(1) insert/fire.
676
- Also syncs legacy dicts for backward-compat.
 
677
  """
678
  mem_a = await self.tier_manager.get_memory(id_a)
679
  mem_b = await self.tier_manager.get_memory(id_b)
@@ -682,17 +885,7 @@ class HAIMEngine:
682
  return
683
 
684
  async with self.synapse_lock:
685
- syn = self._synapse_index.add_or_fire(id_a, id_b, success=success)
686
-
687
- # Keep legacy dict in sync for any external code still using it
688
- synapse_key = tuple(sorted([id_a, id_b]))
689
- self.synapses[synapse_key] = syn
690
- self.synapse_adjacency.setdefault(synapse_key[0], [])
691
- self.synapse_adjacency.setdefault(synapse_key[1], [])
692
- if syn not in self.synapse_adjacency[synapse_key[0]]:
693
- self.synapse_adjacency[synapse_key[0]].append(syn)
694
- if syn not in self.synapse_adjacency[synapse_key[1]]:
695
- self.synapse_adjacency[synapse_key[1]].append(syn)
696
 
697
  await self._save_synapses()
698
 
@@ -712,26 +905,17 @@ class HAIMEngine:
712
  Also syncs any legacy dict entries into the index before compacting.
713
  """
714
  async with self.synapse_lock:
715
- # Sync legacy dict SynapseIndex via the public register() API
716
- # (handles tests / external code that injects into self.synapses directly)
717
- for key, syn in list(self.synapses.items()):
718
  if self._synapse_index.get(syn.neuron_a_id, syn.neuron_b_id) is None:
719
  self._synapse_index.register(syn)
720
 
721
  removed = self._synapse_index.compact(threshold)
722
 
723
- if removed:
724
- # Rebuild legacy dicts from the index
725
- self.synapses = dict(self._synapse_index.items())
726
- self.synapse_adjacency = {}
727
- for syn in self._synapse_index.values():
728
- self.synapse_adjacency.setdefault(syn.neuron_a_id, [])
729
- self.synapse_adjacency.setdefault(syn.neuron_b_id, [])
730
- self.synapse_adjacency[syn.neuron_a_id].append(syn)
731
- self.synapse_adjacency[syn.neuron_b_id].append(syn)
732
-
733
- logger.info(f"cleanup_decay: pruned {removed} synapses below {threshold}")
734
- await self._save_synapses()
735
 
736
  async def get_stats(self) -> Dict[str, Any]:
737
  """Aggregate statistics from engine components."""
@@ -936,18 +1120,9 @@ class HAIMEngine:
936
  def _load():
937
  self._synapse_index.load_from_file(self.synapse_path)
938
 
 
939
  await self._run_in_thread(_load)
940
 
941
- # Rebuild legacy dicts from SynapseIndex for backward compat
942
- async with self.synapse_lock:
943
- self.synapses = dict(self._synapse_index.items())
944
- self.synapse_adjacency = {}
945
- for syn in self._synapse_index.values():
946
- self.synapse_adjacency.setdefault(syn.neuron_a_id, [])
947
- self.synapse_adjacency.setdefault(syn.neuron_b_id, [])
948
- self.synapse_adjacency[syn.neuron_a_id].append(syn)
949
- self.synapse_adjacency[syn.neuron_b_id].append(syn)
950
-
951
  async def _save_synapses(self):
952
  """
953
  Save synapses to disk in JSONL format.
 
39
  from .synapse_index import SynapseIndex
40
  from .subconscious_ai import SubconsciousAIWorker
41
 
42
+ # Phase 5 AGI Stores
43
+ from .working_memory import WorkingMemoryService
44
+ from .episodic_store import EpisodicStoreService
45
+ from .semantic_store import SemanticStoreService
46
+
47
  # Phase 4.5: Recursive Synthesis Engine
48
  from .recursive_synthesizer import RecursiveSynthesizer, SynthesizerConfig
49
 
 
76
  persist_path: Optional[str] = None,
77
  config: Optional[HAIMConfig] = None,
78
  tier_manager: Optional[TierManager] = None,
79
+ working_memory: Optional[WorkingMemoryService] = None,
80
+ episodic_store: Optional[EpisodicStoreService] = None,
81
+ semantic_store: Optional[SemanticStoreService] = None,
82
  ):
83
  """
84
  Initialize HAIMEngine with optional dependency injection.
 
88
  persist_path: Path to memory persistence file.
89
  config: Configuration object. If None, uses global get_config().
90
  tier_manager: TierManager instance. If None, creates a new one.
91
+ working_memory: Optional Phase 5 WM service.
92
+ episodic_store: Optional Phase 5 EM service.
93
+ semantic_store: Optional Phase 5 Semantic service.
94
  """
95
  self.config = config or get_config()
96
  self.dimension = self.config.dimensionality
 
100
 
101
  # Core Components
102
  self.tier_manager = tier_manager or TierManager(config=self.config)
103
+
104
+ # Phase 5 Components
105
+ self.working_memory = working_memory
106
+ self.episodic_store = episodic_store
107
+ self.semantic_store = semantic_store
108
  self.binary_encoder = TextEncoder(self.dimension)
109
 
110
  # ── Phase 3.x: synapse raw dicts (kept for backward compat) ──
 
148
 
149
  # ── Phase 4.5: recursive synthesizer ───────────────────────────
150
  self._recursive_synthesizer: Optional[RecursiveSynthesizer] = None
151
+
152
+ # ── Phase 12.2: Contextual Topic Tracker ───────────────────────
153
+ from .topic_tracker import TopicTracker
154
+ self.topic_tracker = TopicTracker(self.config.context, self.dimension)
155
+
156
+ # ── Phase 12.3: Preference Learning ────────────────────────────
157
+ from .preference_store import PreferenceStore
158
+ self.preference_store = PreferenceStore(self.config.preference, self.dimension)
159
+
160
+ # ── Phase 13.2: Anticipatory Memory ────────────────────────────
161
+ from .anticipatory import AnticipatoryEngine
162
+ self.anticipatory_engine = AnticipatoryEngine(
163
+ self.config.anticipatory,
164
+ self._synapse_index,
165
+ self.tier_manager,
166
+ self.topic_tracker
167
+ )
168
 
169
  # Conceptual Layer (VSA Soul)
170
  data_dir = self.config.paths.data_dir
 
370
  """
371
  _is_gap_fill = metadata.get("source") == "llm_gap_fill"
372
 
373
+ # Phase 12.1: Aggressive Synapse Formation (Auto-bind).
374
+ # Fix 4: collect all bindings first, persist synapses only once at the end.
375
+ if hasattr(self.config, 'synapse') and self.config.synapse.auto_bind_on_store:
376
+ similar_nodes = await self.query(
377
+ node.content,
378
+ top_k=3,
379
+ associative_jump=False,
380
+ track_gaps=False,
381
+ )
382
+ bind_pairs = [
383
+ (node.id, neighbor_id)
384
+ for neighbor_id, similarity in similar_nodes
385
+ if neighbor_id != node.id
386
+ and similarity >= self.config.synapse.similarity_threshold
387
+ ]
388
+ if bind_pairs:
389
+ await self._auto_bind_batch(bind_pairs)
390
+
391
  self.subconscious_queue.append(node.id)
392
 
393
  if not _is_gap_fill:
 
397
  # Main store() method - Orchestration only
398
  # ==========================================================================
399
 
400
+ # Maximum allowed content length (Fix 5: input validation)
401
+ _MAX_CONTENT_LENGTH: int = 100_000
402
+
403
  @timer(STORE_DURATION_SECONDS, labels={"tier": "hot"})
404
  @traced("store_memory")
405
  async def store(
 
413
  Store new memory with holographic encoding.
414
 
415
  This method orchestrates the memory storage pipeline:
416
+ 1. Validate input
417
+ 2. Encode input content
418
+ 3. Evaluate tier placement via EIG
419
+ 4. Persist to storage
420
+ 5. Trigger post-store processing
421
 
422
  Args:
423
+ content: The text content to store. Must be non-empty and ≤100 000 chars.
424
  metadata: Optional metadata dictionary.
425
  goal_id: Optional goal identifier for context binding.
426
  project_id: Optional project identifier for isolation masking (Phase 4.1).
427
 
428
  Returns:
429
  The unique identifier of the stored memory node.
430
+
431
+ Raises:
432
+ ValueError: If content is empty or exceeds the maximum allowed length.
433
+ RuntimeError: If the engine has not been initialized via initialize().
434
  """
435
+ # Fix 5: Input validation
436
+ if not content or not content.strip():
437
+ raise ValueError("Memory content cannot be empty or whitespace-only.")
438
+ if len(content) > self._MAX_CONTENT_LENGTH:
439
+ raise ValueError(
440
+ f"Memory content is too long ({len(content):,} chars). "
441
+ f"Maximum: {self._MAX_CONTENT_LENGTH:,}."
442
+ )
443
+ if not self._initialized:
444
+ raise RuntimeError(
445
+ "HAIMEngine.initialize() must be awaited before calling store()."
446
+ )
447
+
448
  # 1. Encode input and bind goal context
449
  encoded_vec, updated_metadata = await self._encode_input(content, metadata, goal_id)
450
 
 
459
  # 3. Create and persist memory node
460
  node = await self._persist_memory(content, encoded_vec, updated_metadata)
461
 
462
+ # Phase 5.1: If agent_id in metadata, push to Working Memory and log Episode event
463
+ agent_id = updated_metadata.get("agent_id")
464
+ if agent_id:
465
+ if self.working_memory:
466
+ from .memory_model import WorkingMemoryItem
467
+ self.working_memory.push_item(
468
+ agent_id,
469
+ WorkingMemoryItem(
470
+ id=f"wm_{node.id[:8]}",
471
+ agent_id=agent_id,
472
+ created_at=datetime.utcnow(),
473
+ ttl_seconds=3600,
474
+ content=content,
475
+ kind="observation",
476
+ importance=node.epistemic_value or 0.5,
477
+ tags=updated_metadata.get("tags", []),
478
+ hdv=encoded_vec
479
+ )
480
+ )
481
+
482
+ episode_id = updated_metadata.get("episode_id")
483
+ if episode_id and self.episodic_store:
484
+ self.episodic_store.append_event(
485
+ episode_id=episode_id,
486
+ kind="observation",
487
+ content=content,
488
+ metadata=updated_metadata
489
+ )
490
+
491
  # 4. Trigger post-store processing
492
  await self._trigger_post_store(node, updated_metadata)
493
 
 
513
  if node_id in self.subconscious_queue:
514
  self.subconscious_queue.remove(node_id)
515
 
516
+ # 3. Phase 4.0: clean up via SynapseIndex (O(k)).
517
+ # Fix 2: legacy dict rebuild removed — _synapse_index is authoritative.
518
  async with self.synapse_lock:
519
  removed_count = self._synapse_index.remove_node(node_id)
520
 
 
 
 
 
 
 
 
 
 
521
  if removed_count:
522
  await self._save_synapses()
523
 
524
  return deleted
525
 
526
+ async def log_decision(self, context_text: str, outcome: float) -> None:
527
+ """
528
+ Phase 12.3: Logs a user decision or feedback context to update preference vector.
529
+ Outcome should be positive (e.g. 1.0) or negative (e.g. -1.0).
530
+ """
531
+ vec = await self._run_in_thread(self.binary_encoder.encode, context_text)
532
+ self.preference_store.log_decision(vec, outcome)
533
+
534
  async def close(self):
535
  """Perform graceful shutdown of engine components."""
536
  logger.info("Shutting down HAIMEngine...")
 
562
  chrono_weight: bool = True,
563
  chrono_lambda: float = 0.0001,
564
  include_neighbors: bool = False,
565
+ metadata_filter: Optional[Dict[str, Any]] = None,
566
+ include_cold: bool = False,
567
  ) -> List[Tuple[str, float]]:
568
  """
569
  Query memories using Hamming distance.
 
583
  Formula: Final_Score = Semantic_Similarity * (1 / (1 + lambda * Time_Delta))
584
  - chrono_lambda: Decay rate in seconds^-1 (default: 0.0001 ~ 2.7h half-life).
585
  - include_neighbors: Also fetch temporal neighbors (previous/next) for top results.
586
+ - include_cold: Include COLD tier in the search (bounded linear scan, default False).
587
+
588
+ Fix 3: Triggers anticipatory preloading (Phase 13.2) as fire-and-forget after returning.
589
  """
590
  # Encode Query
591
  query_vec = await self._run_in_thread(self.binary_encoder.encode, query_text)
592
 
593
+ # Phase 12.2: Context Tracking
594
+ is_shift, sim = self.topic_tracker.add_query(query_vec)
595
+ if is_shift:
596
+ logger.info(f"Context shifted during query. (sim {sim:.3f})")
597
+
598
  # Phase 4.1: Apply project isolation mask to query
599
  if project_id:
600
  query_vec = self.isolation_masker.apply_mask(query_vec, project_id)
 
605
  query_vec,
606
  top_k=top_k * 2,
607
  time_range=time_range,
608
+ metadata_filter=metadata_filter,
609
+ include_cold=include_cold,
610
  )
611
 
612
  scores: Dict[str, float] = {}
 
628
  if chrono_weight and score > 0:
629
  mem = mem_map.get(nid)
630
  if mem:
631
+ time_delta = max(0.0, now_ts - mem.created_at.timestamp()) # seconds since creation
632
  # Formula: Final = Semantic * (1 / (1 + lambda * time_delta))
633
  decay_factor = 1.0 / (1.0 + chrono_lambda * time_delta)
634
  score = score * decay_factor
635
 
636
+ # Phase 12.3: Preference Learning Bias
637
+ if self.preference_store.config.enabled and self.preference_store.preference_vector is not None:
638
+ mem = mem_map.get(nid)
639
+ if not mem:
640
+ mem = await self.tier_manager.get_memory(nid)
641
+ if mem and mem.id not in mem_map:
642
+ mem_map[mem.id] = mem
643
+ if mem:
644
+ score = self.preference_store.bias_score(mem.hdv, score)
645
+
646
  scores[nid] = score
647
 
648
+ # Phase 5.1: Boost context matching Working Memory
649
+ agent_id = metadata_filter.get("agent_id") if metadata_filter else None
650
+ if agent_id and self.working_memory:
651
+ wm_state = self.working_memory.get_state(agent_id)
652
+ if wm_state:
653
+ wm_texts = [item.content for item in wm_state.items]
654
+ if wm_texts:
655
+ # Very lightweight lexical boost for items currently in working memory
656
+ q_lower = query_text.lower()
657
+ for nid in scores:
658
+ mem = mem_map.get(nid) # Assuming already cached from chrono weighting
659
+ if mem and mem.content:
660
+ if any(w_text.lower() in mem.content.lower() for w_text in wm_texts):
661
+ scores[nid] *= 1.15 # 15% boost for WM overlap
662
+
663
  # 2. Associative Spreading (via SynapseIndex for O(1) adjacency lookup)
664
  if associative_jump and self._synapse_index:
665
  top_seeds = sorted(scores.items(), key=lambda x: x[1], reverse=True)[:3]
 
678
  if neighbor not in augmented_scores:
679
  mem = await self.tier_manager.get_memory(neighbor)
680
  if mem:
681
+ if metadata_filter:
682
+ match = True
683
+ node_meta = mem.metadata or {}
684
+ for k, v in metadata_filter.items():
685
+ if node_meta.get(k) != v:
686
+ match = False
687
+ break
688
+ if not match:
689
+ continue
690
  augmented_scores[neighbor] = query_vec.similarity(mem.hdv)
691
 
692
  if neighbor in augmented_scores:
 
742
  if mem.previous_id:
743
  prev_mem = await self.tier_manager.get_memory(mem.previous_id)
744
  if prev_mem and prev_mem.id not in scores:
745
+ if metadata_filter:
746
+ match = True
747
+ p_meta = prev_mem.metadata or {}
748
+ for k, v in metadata_filter.items():
749
+ if p_meta.get(k) != v:
750
+ match = False
751
+ break
752
+ if not match:
753
+ continue
754
  neighbor_ids.add(prev_mem.id)
755
 
756
  # Try to find the memory that follows this one (has this as previous_id).
 
770
  # Re-sort after adding neighbors, but preserve query() top_k contract.
771
  top_results = sorted(top_results, key=lambda x: x[1], reverse=True)[:top_k]
772
 
773
+ # Phase 13.2 (Fix 3): Anticipatory preloading — fire-and-forget so it
774
+ # never blocks the caller. Only activated when the engine is fully warm.
775
+ if top_results and self._initialized and self.config.anticipatory.enabled:
776
+ asyncio.ensure_future(
777
+ self.anticipatory_engine.predict_and_preload(top_results[0][0])
778
+ )
779
+
780
  return top_results
781
 
782
+ async def get_context_nodes(self, top_k: int = 3) -> List[Tuple[str, float]]:
783
+ """
784
+ Phase 12.2: Contextual Awareness
785
+ Retrieves the top_k most relevant nodes relating to the current topic context vector.
786
+ Should be explicitly used by prompt builders before LLM logic injection.
787
+ """
788
+ if not self.topic_tracker.config.enabled:
789
+ return []
790
+
791
+ ctx = self.topic_tracker.get_context()
792
+ if ctx is None:
793
+ return []
794
+
795
+ results = await self.tier_manager.search(
796
+ ctx,
797
+ top_k=top_k,
798
+ time_range=None,
799
+ metadata_filter=None,
800
+ )
801
+ return results
802
  async def _background_dream(self, depth: int = 2):
803
  """
804
  Passive Subconscious – strengthen synapses in idle cycles.
 
851
 
852
  return sorted(active_nodes, key=score, reverse=True)[:max_collapse]
853
 
854
+ async def _auto_bind_batch(
855
+ self,
856
+ pairs: List[Tuple[str, str]],
857
+ success: bool = True,
858
+ weight: float = 1.0,
859
+ ) -> None:
860
+ """
861
+ Fix 4: Bind multiple (id_a, id_b) pairs in one pass, saving synapses once.
862
+
863
+ Used by auto-bind in _trigger_post_store() to avoid N disk writes per store.
864
+ """
865
+ async with self.synapse_lock:
866
+ for id_a, id_b in pairs:
867
+ mem_a = await self.tier_manager.get_memory(id_a)
868
+ mem_b = await self.tier_manager.get_memory(id_b)
869
+ if mem_a and mem_b:
870
+ self._synapse_index.add_or_fire(id_a, id_b, success=success, weight=weight)
871
+ await self._save_synapses()
872
+
873
+ async def bind_memories(self, id_a: str, id_b: str, success: bool = True, weight: float = 1.0):
874
  """
875
  Bind two memories by ID.
876
 
877
+ Fix 2: delegates exclusively to SynapseIndex legacy dict sync removed.
878
+ The legacy self.synapses / self.synapse_adjacency attributes remain for
879
+ backward compatibility but are only populated at startup from disk.
880
  """
881
  mem_a = await self.tier_manager.get_memory(id_a)
882
  mem_b = await self.tier_manager.get_memory(id_b)
 
885
  return
886
 
887
  async with self.synapse_lock:
888
+ self._synapse_index.add_or_fire(id_a, id_b, success=success, weight=weight)
 
 
 
 
 
 
 
 
 
 
889
 
890
  await self._save_synapses()
891
 
 
905
  Also syncs any legacy dict entries into the index before compacting.
906
  """
907
  async with self.synapse_lock:
908
+ # Retain legacy→index sync so tests that write to self.synapses directly
909
+ # still get their entries registered (Fix 2: sync only in this direction).
910
+ for syn in list(self.synapses.values()):
911
  if self._synapse_index.get(syn.neuron_a_id, syn.neuron_b_id) is None:
912
  self._synapse_index.register(syn)
913
 
914
  removed = self._synapse_index.compact(threshold)
915
 
916
+ if removed:
917
+ logger.info(f"cleanup_decay: pruned {removed} synapses below {threshold}")
918
+ await self._save_synapses()
 
 
 
 
 
 
 
 
 
919
 
920
  async def get_stats(self) -> Dict[str, Any]:
921
  """Aggregate statistics from engine components."""
 
1120
  def _load():
1121
  self._synapse_index.load_from_file(self.synapse_path)
1122
 
1123
+ # Fix 2: _synapse_index is authoritative — legacy dicts no longer rebuilt.
1124
  await self._run_in_thread(_load)
1125
 
 
 
 
 
 
 
 
 
 
 
1126
  async def _save_synapses(self):
1127
  """
1128
  Save synapses to disk in JSONL format.
src/mnemocore/core/episodic_store.py ADDED
@@ -0,0 +1,144 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Episodic Store Service
3
+ ======================
4
+ Manages sequences of events (Episodes), chaining them chronologically.
5
+ Provides the foundation for episodic recall and narrative tracking over time.
6
+ """
7
+
8
+ from typing import Dict, List, Optional, Any
9
+ from datetime import datetime
10
+ import threading
11
+ import uuid
12
+ import logging
13
+
14
+ from .memory_model import Episode, EpisodeEvent
15
+ from .tier_manager import TierManager
16
+
17
+ logger = logging.getLogger(__name__)
18
+
19
+
20
+ class EpisodicStoreService:
21
+ def __init__(self, tier_manager: Optional[TierManager] = None):
22
+ self._tier_manager = tier_manager
23
+ # In-memory index of active episodes; eventually backed by SQLite/Qdrant
24
+ self._active_episodes: Dict[str, Episode] = {}
25
+ # Simple backward index map from agent to sorted list of historical episodes
26
+ self._agent_history: Dict[str, List[Episode]] = {}
27
+ self._lock = threading.RLock()
28
+
29
+ def start_episode(
30
+ self, agent_id: str, goal: Optional[str] = None, context: Optional[str] = None
31
+ ) -> str:
32
+ with self._lock:
33
+ ep_id = f"ep_{uuid.uuid4().hex[:12]}"
34
+
35
+ # Find previous absolute episode for this agent to populate links_prev
36
+ prev_links = []
37
+ if agent_id in self._agent_history and self._agent_history[agent_id]:
38
+ last_ep = self._agent_history[agent_id][-1]
39
+ prev_links.append(last_ep.id)
40
+
41
+ new_ep = Episode(
42
+ id=ep_id,
43
+ agent_id=agent_id,
44
+ started_at=datetime.utcnow(),
45
+ ended_at=None,
46
+ goal=goal,
47
+ context=context,
48
+ events=[],
49
+ outcome="in_progress",
50
+ reward=None,
51
+ links_prev=prev_links,
52
+ links_next=[],
53
+ ltp_strength=0.0,
54
+ reliability=1.0,
55
+ )
56
+
57
+ # Link the previous episode forward
58
+ if prev_links:
59
+ last_ep_id = prev_links[0]
60
+ last_ep = self._get_historical_ep(agent_id, last_ep_id)
61
+ if last_ep and new_ep.id not in last_ep.links_next:
62
+ last_ep.links_next.append(new_ep.id)
63
+
64
+ self._active_episodes[ep_id] = new_ep
65
+ return ep_id
66
+
67
+ def append_event(
68
+ self,
69
+ episode_id: str,
70
+ kind: str,
71
+ content: str,
72
+ metadata: Optional[dict[str, Any]] = None,
73
+ ) -> None:
74
+ with self._lock:
75
+ ep = self._active_episodes.get(episode_id)
76
+ if not ep:
77
+ logger.warning(f"Attempted to append event to inactive or not found episode: {episode_id}")
78
+ return
79
+
80
+ event = EpisodeEvent(
81
+ timestamp=datetime.utcnow(),
82
+ kind=kind, # type: ignore
83
+ content=content,
84
+ metadata=metadata or {},
85
+ )
86
+ ep.events.append(event)
87
+
88
+ def end_episode(
89
+ self, episode_id: str, outcome: str, reward: Optional[float] = None
90
+ ) -> None:
91
+ with self._lock:
92
+ ep = self._active_episodes.pop(episode_id, None)
93
+ if not ep:
94
+ logger.warning(f"Attempted to end inactive or not found episode: {episode_id}")
95
+ return
96
+
97
+ ep.ended_at = datetime.utcnow()
98
+ ep.outcome = outcome # type: ignore
99
+ ep.reward = reward
100
+
101
+ agent_history = self._agent_history.setdefault(ep.agent_id, [])
102
+ agent_history.append(ep)
103
+
104
+ # Sort by start time just to ensure chronological order is preserved
105
+ agent_history.sort(key=lambda x: x.started_at)
106
+
107
+ logger.debug(f"Ended episode {episode_id} with outcome {outcome}")
108
+
109
+ def get_episode(self, episode_id: str) -> Optional[Episode]:
110
+ with self._lock:
111
+ # Check active first
112
+ if episode_id in self._active_episodes:
113
+ return self._active_episodes[episode_id]
114
+ # Then check history
115
+ for history in self._agent_history.values():
116
+ for ep in history:
117
+ if ep.id == episode_id:
118
+ return ep
119
+ return None
120
+
121
+ def get_recent(
122
+ self, agent_id: str, limit: int = 5, context: Optional[str] = None
123
+ ) -> List[Episode]:
124
+ with self._lock:
125
+ history = self._agent_history.get(agent_id, [])
126
+
127
+ # Active episodes count too
128
+ active = [ep for ep in self._active_episodes.values() if ep.agent_id == agent_id]
129
+
130
+ combined = history + active
131
+ combined.sort(key=lambda x: x.started_at, reverse=True)
132
+
133
+ if context:
134
+ combined = [ep for ep in combined if ep.context == context]
135
+
136
+ return combined[:limit]
137
+
138
+ def _get_historical_ep(self, agent_id: str, episode_id: str) -> Optional[Episode]:
139
+ history = self._agent_history.get(agent_id, [])
140
+ for ep in history:
141
+ if ep.id == episode_id:
142
+ return ep
143
+ return None
144
+
src/mnemocore/core/forgetting_curve.py ADDED
@@ -0,0 +1,233 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Forgetting Curve Manager (Phase 5.0)
3
+ =====================================
4
+ Implements Ebbinghaus-based spaced repetition scheduling for MnemoCore.
5
+
6
+ The ForgettingCurveManager layers on top of AdaptiveDecayEngine to:
7
+ 1. Schedule "review" events at optimal intervals (spaced repetition)
8
+ 2. Decide whether low-retention memories should be consolidated vs. deleted
9
+ 3. Work collaboratively with the ConsolidationWorker
10
+
11
+ Key idea: at each review interval, the system re-evaluates a memory's EIG.
12
+ - High EIG + low retention → CONSOLIDATE (absorb into a stronger anchor)
13
+ - Low EIG + low retention → ARCHIVE / EVICT
14
+
15
+ The review scheduling uses the SuperMemo-inspired interval:
16
+ next_review_days = S_i * ln(1 / TARGET_RETENTION)
17
+
18
+ where TARGET_RETENTION = 0.70 (retain 70% at next review point).
19
+
20
+ Public API:
21
+ manager = ForgettingCurveManager(engine)
22
+ await manager.run_once(nodes) # scan HOT/WARM nodes, schedule reviews
23
+ schedule = manager.get_schedule() # sorted list of upcoming reviews
24
+ """
25
+
26
+ from __future__ import annotations
27
+
28
+ import asyncio
29
+ import math
30
+ from dataclasses import dataclass, field
31
+ from datetime import datetime, timezone, timedelta
32
+ from typing import TYPE_CHECKING, Dict, List, Optional
33
+
34
+ from loguru import logger
35
+
36
+ from .temporal_decay import AdaptiveDecayEngine, get_adaptive_decay_engine
37
+
38
+ if TYPE_CHECKING:
39
+ from .node import MemoryNode
40
+
41
+
42
+ # ------------------------------------------------------------------ #
43
+ # Constants #
44
+ # ------------------------------------------------------------------ #
45
+
46
+ TARGET_RETENTION: float = 0.70 # Retention level at which we schedule the next review
47
+ MIN_EIG_TO_CONSOLIDATE: float = 0.3 # Minimum epistemic value to consolidate instead of evict
48
+
49
+
50
+ # ------------------------------------------------------------------ #
51
+ # Review Schedule Entry #
52
+ # ------------------------------------------------------------------ #
53
+
54
+ @dataclass
55
+ class ReviewEntry:
56
+ """A scheduled review for a single memory."""
57
+ memory_id: str
58
+ due_at: datetime # When to review
59
+ current_retention: float # Retention at scheduling time
60
+ stability: float # S_i at scheduling time
61
+ action: str = "review" # "review" | "consolidate" | "evict"
62
+
63
+ def to_dict(self) -> Dict:
64
+ return {
65
+ "memory_id": self.memory_id,
66
+ "due_at": self.due_at.isoformat(),
67
+ "current_retention": round(self.current_retention, 4),
68
+ "stability": round(self.stability, 4),
69
+ "action": self.action,
70
+ }
71
+
72
+
73
+ # ------------------------------------------------------------------ #
74
+ # Forgetting Curve Manager #
75
+ # ------------------------------------------------------------------ #
76
+
77
+ class ForgettingCurveManager:
78
+ """
79
+ Schedules spaced-repetition review events for MemoryNodes.
80
+
81
+ Attach to a running HAIMEngine to enable automatic review scheduling.
82
+ Works in concert with AdaptiveDecayEngine and ConsolidationWorker.
83
+ """
84
+
85
+ def __init__(
86
+ self,
87
+ engine=None, # HAIMEngine – typed as Any to avoid circular import
88
+ decay_engine: Optional[AdaptiveDecayEngine] = None,
89
+ target_retention: float = TARGET_RETENTION,
90
+ min_eig_to_consolidate: float = MIN_EIG_TO_CONSOLIDATE,
91
+ ) -> None:
92
+ self.engine = engine
93
+ self.decay = decay_engine or get_adaptive_decay_engine()
94
+ self.target_retention = target_retention
95
+ self.min_eig_to_consolidate = min_eig_to_consolidate
96
+ self._schedule: List[ReviewEntry] = []
97
+
98
+ # ---- Interval calculation ------------------------------------ #
99
+
100
+ def next_review_days(self, node: "MemoryNode") -> float:
101
+ """
102
+ Days until the next review should be scheduled.
103
+
104
+ Derived from: TARGET_RETENTION = e^(-next_days / S_i)
105
+ → next_days = -S_i * ln(TARGET_RETENTION)
106
+
107
+ Example: S_i=5, target=0.70 → next_days = 5 × 0.357 ≈ 1.78 days
108
+ """
109
+ s_i = self.decay.stability(node)
110
+ # Protect against math domain errors
111
+ target = max(1e-6, min(self.target_retention, 0.999))
112
+ return -s_i * math.log(target)
113
+
114
+ def _determine_action(self, node: "MemoryNode", retention: float) -> str:
115
+ """
116
+ Decide what to do with a low-retention memory:
117
+ - consolidate: has historical importance (epistemic_value > threshold)
118
+ - evict: low value, low retention
119
+ - review: needs attention but not critical yet
120
+ """
121
+ if self.decay.should_evict(node):
122
+ eig = getattr(node, "epistemic_value", 0.0)
123
+ if eig >= self.min_eig_to_consolidate:
124
+ return "consolidate"
125
+ return "evict"
126
+ return "review"
127
+
128
+ # ---- Scan and schedule --------------------------------------- #
129
+
130
+ def schedule_reviews(self, nodes: "List[MemoryNode]") -> List[ReviewEntry]:
131
+ """
132
+ Scan the provided nodes and build a schedule of upcoming reviews.
133
+ Nodes with retention ≤ REVIEW_THRESHOLD are immediately flagged.
134
+
135
+ Returns the new ReviewEntry objects added to the schedule.
136
+ """
137
+ now = datetime.now(timezone.utc)
138
+ new_entries: List[ReviewEntry] = []
139
+
140
+ for node in nodes:
141
+ retention = self.decay.retention(node)
142
+ s_i = self.decay.stability(node)
143
+
144
+ # Always update review_candidate flag on the node itself
145
+ self.decay.update_review_candidate(node)
146
+
147
+ # Schedule next review based on spaced repetition interval
148
+ days_until = self.next_review_days(node)
149
+ due_at = now + timedelta(days=days_until)
150
+ action = self._determine_action(node, retention)
151
+
152
+ entry = ReviewEntry(
153
+ memory_id=node.id,
154
+ due_at=due_at,
155
+ current_retention=retention,
156
+ stability=s_i,
157
+ action=action,
158
+ )
159
+ new_entries.append(entry)
160
+
161
+ # Merge into the schedule (replace existing entries for same memory_id)
162
+ existing_ids = {e.memory_id for e in self._schedule}
163
+ self._schedule = [
164
+ e for e in self._schedule if e.memory_id not in {n.id for n in nodes}
165
+ ]
166
+ self._schedule.extend(new_entries)
167
+ self._schedule.sort(key=lambda e: e.due_at)
168
+
169
+ logger.info(
170
+ f"ForgettingCurveManager: scheduled {len(new_entries)} reviews for {len(nodes)} nodes. "
171
+ f"Total scheduled: {len(self._schedule)}"
172
+ )
173
+ return new_entries
174
+
175
+ def get_schedule(self) -> List[ReviewEntry]:
176
+ """Return the current review schedule sorted by due_at."""
177
+ return sorted(self._schedule, key=lambda e: e.due_at)
178
+
179
+ def get_due_reviews(self) -> List[ReviewEntry]:
180
+ """Return entries that are due now (due_at <= now)."""
181
+ now = datetime.now(timezone.utc)
182
+ return [e for e in self._schedule if e.due_at <= now]
183
+
184
+ def get_actions_by_type(self, action: str) -> List[ReviewEntry]:
185
+ """Filter schedule by action type: 'review', 'consolidate', or 'evict'."""
186
+ return [e for e in self._schedule if e.action == action]
187
+
188
+ def remove_entry(self, memory_id: str) -> None:
189
+ """Remove a memory from the review schedule (e.g., it was evicted)."""
190
+ self._schedule = [e for e in self._schedule if e.memory_id != memory_id]
191
+
192
+ # ---- Engine integration ------------------------------------- #
193
+
194
+ async def run_once(self) -> Dict:
195
+ """
196
+ Run a full scan over HOT + WARM nodes and update the review schedule.
197
+
198
+ Returns a stats dict with counts per action.
199
+ """
200
+ if self.engine is None:
201
+ logger.warning("ForgettingCurveManager: no engine attached, cannot scan tiers.")
202
+ return {}
203
+
204
+ nodes: List["MemoryNode"] = []
205
+ try:
206
+ hot = await self.engine.tier_manager.get_hot_snapshot()
207
+ nodes.extend(hot)
208
+ except Exception as e:
209
+ logger.warning(f"ForgettingCurveManager: could not fetch HOT nodes: {e}")
210
+
211
+ try:
212
+ warm = await self.engine.tier_manager.list_warm(max_results=1000)
213
+ nodes.extend(warm)
214
+ except (AttributeError, Exception) as e:
215
+ logger.debug(f"ForgettingCurveManager: WARM fetch skipped: {e}")
216
+
217
+ entries = self.schedule_reviews(nodes)
218
+
219
+ # Count actions
220
+ from collections import Counter
221
+ action_counts = dict(Counter(e.action for e in entries))
222
+
223
+ logger.info(f"ForgettingCurveManager scan: {action_counts}")
224
+ return {
225
+ "nodes_scanned": len(nodes),
226
+ "entries_scheduled": len(entries),
227
+ "action_counts": action_counts,
228
+ "timestamp": datetime.now(timezone.utc).isoformat(),
229
+ }
230
+
231
+
232
+ # Convenience import alias
233
+ from typing import Dict # noqa: E402 (already imported above, just ensuring type hint works)
src/mnemocore/core/hnsw_index.py CHANGED
@@ -50,18 +50,32 @@ FLAT_THRESHOLD: int = 256 # use flat index below this hop count
50
  # HNSW Index Manager #
51
  # ------------------------------------------------------------------ #
52
 
 
 
 
 
 
53
  class HNSWIndexManager:
54
  """
55
  Manages a FAISS HNSW binary ANN index for the HOT tier.
 
56
 
57
  Automatically switches between:
58
  - IndexBinaryFlat (N < FLAT_THRESHOLD — exact, faster for small N)
59
  - IndexBinaryHNSW (N ≥ FLAT_THRESHOLD — approx, faster for large N)
60
-
61
- The index is rebuilt from scratch when switching modes (rare operation).
62
- All operations are synchronous (called from within asyncio.Lock context).
63
  """
64
 
 
 
 
 
 
 
 
 
 
 
 
65
  def __init__(
66
  self,
67
  dimension: int = 16384,
@@ -69,52 +83,70 @@ class HNSWIndexManager:
69
  ef_construction: int = DEFAULT_EF_CONSTRUCTION,
70
  ef_search: int = DEFAULT_EF_SEARCH,
71
  ):
 
 
 
72
  self.dimension = dimension
73
  self.m = m
74
  self.ef_construction = ef_construction
75
  self.ef_search = ef_search
76
 
77
- # ID maps
78
- self._id_map: Dict[int, str] = {} # faiss_int_id → node_id
79
- self._node_map: Dict[str, int] = {} # node_id → faiss_int_id
80
- self._next_id: int = 1
81
- self._use_hnsw: bool = False
82
 
83
- # FAISS index (initialised below)
 
 
 
84
  self._index = None
 
 
 
 
 
 
 
 
85
 
86
  if FAISS_AVAILABLE:
87
- self._build_flat_index()
88
- else:
89
- logger.warning("HNSWIndexManager running WITHOUT faiss — linear fallback only.")
 
 
 
90
 
91
  # ---- Index construction -------------------------------------- #
92
 
93
  def _build_flat_index(self) -> None:
94
  """Create a fresh IndexBinaryFlat (exact Hamming ANN)."""
95
- base = faiss.IndexBinaryFlat(self.dimension)
96
- self._index = faiss.IndexBinaryIDMap(base)
97
  self._use_hnsw = False
98
  logger.debug(f"Built FAISS flat binary index (dim={self.dimension})")
99
 
100
- def _build_hnsw_index(self, existing_nodes: Optional[List[Tuple[int, np.ndarray]]] = None) -> None:
101
  """
102
  Build an HNSW binary index and optionally re-populate with existing vectors.
103
-
104
- Note: FAISS IndexBinaryHNSW does NOT support IDMap natively, so we use a
105
- custom double-mapping approach: HNSW indices map 1-to-1 to our _id_map.
106
- We rebuild as IndexBinaryHNSW and re-add all existing vectors.
107
  """
108
  hnsw = faiss.IndexBinaryHNSW(self.dimension, self.m)
109
  hnsw.hnsw.efConstruction = self.ef_construction
110
  hnsw.hnsw.efSearch = self.ef_search
111
 
112
- if existing_nodes:
113
- # Batch add in order of faiss_int_id so positions are deterministic
114
- existing_nodes.sort(key=lambda x: x[0])
115
- vecs = np.stack([v for _, v in existing_nodes])
116
- hnsw.add(vecs)
117
- logger.debug(f"HNSW index rebuilt with {len(existing_nodes)} existing vectors")
 
 
 
 
 
 
 
 
 
 
118
 
119
  self._index = hnsw
120
  self._use_hnsw = True
@@ -125,43 +157,18 @@ class HNSWIndexManager:
125
 
126
  def _maybe_upgrade_to_hnsw(self) -> None:
127
  """Upgrade to HNSW index if HOT tier has grown large enough."""
128
- if not FAISS_AVAILABLE:
129
- return
130
- if self._use_hnsw:
131
  return
132
- if len(self._id_map) < FLAT_THRESHOLD:
 
133
  return
134
 
135
  logger.info(
136
- f"HOT tier size ({len(self._id_map)}) ≥ threshold ({FLAT_THRESHOLD}) "
137
  "— upgrading to HNSW index."
138
  )
139
 
140
- # NOTE: For HNSW without IDMap we maintain position-based mapping.
141
- # We rebuild from the current flat index contents.
142
- # Collect all existing (local_pos → node_vector) pairs.
143
- #
144
- # For simplicity in this transition we do a full rebuild from scratch:
145
- # the upgrade happens at most once per process lifetime (HOT usually stays
146
- # under threshold or once it crosses, it stays crossed).
147
- existing: List[Tuple[int, np.ndarray]] = []
148
- for fid, node_id in self._id_map.items():
149
- # We can't reconstruct vectors from IndexBinaryIDMap cheaply,
150
- # so we store them in a shadow cache while using the flat index.
151
- if node_id in self._vector_cache:
152
- existing.append((fid, self._vector_cache[node_id]))
153
-
154
- self._build_hnsw_index(existing)
155
-
156
- # ---- Vector shadow cache (needed for HNSW rebuild) ----------- #
157
- # HNSW indices don't support IDMap; we cache raw vectors separately
158
- # so we can rebuild on threshold-crossing.
159
-
160
- @property
161
- def _vector_cache(self) -> Dict[str, np.ndarray]:
162
- if not hasattr(self, "_vcache"):
163
- object.__setattr__(self, "_vcache", {})
164
- return self._vcache # type: ignore[attr-defined]
165
 
166
  # ---- Public API --------------------------------------------- #
167
 
@@ -176,77 +183,66 @@ class HNSWIndexManager:
176
  if not FAISS_AVAILABLE or self._index is None:
177
  return
178
 
179
- fid = self._next_id
180
- self._next_id += 1
181
- self._id_map[fid] = node_id
182
- self._node_map[node_id] = fid
183
- self._vector_cache[node_id] = hdv_data.copy()
184
-
185
- vec = np.expand_dims(hdv_data, axis=0)
186
 
187
- try:
188
- if self._use_hnsw:
189
- # HNSW.add() — position is implicit (sequential)
190
  self._index.add(vec)
191
- else:
192
- ids = np.array([fid], dtype="int64")
193
- self._index.add_with_ids(vec, ids)
194
- except Exception as exc:
195
- logger.error(f"HNSW/FAISS add failed for {node_id}: {exc}")
196
- return
197
 
198
- # Check if we should upgrade to HNSW
199
- self._maybe_upgrade_to_hnsw()
200
 
201
  def remove(self, node_id: str) -> None:
202
  """
203
  Remove a node from the index.
204
-
205
- For HNSW (no IDMap), we mark the node as deleted in our bookkeeping
206
- and rebuild the index lazily when the deletion rate exceeds 20%.
207
  """
208
  if not FAISS_AVAILABLE or self._index is None:
209
  return
210
 
211
- fid = self._node_map.pop(node_id, None)
212
- if fid is None:
213
- return
214
-
215
- self._id_map.pop(fid, None)
216
- self._vector_cache.pop(node_id, None)
217
-
218
- if not self._use_hnsw:
219
  try:
220
- ids = np.array([fid], dtype="int64")
221
- self._index.remove_ids(ids)
222
- except Exception as exc:
223
- logger.error(f"FAISS flat remove failed for {node_id}: {exc}")
224
- else:
225
- # HNSW doesn't support removal; track stale fraction and rebuild when needed
226
- if not hasattr(self, "_stale_count"):
227
- object.__setattr__(self, "_stale_count", 0)
228
- self._stale_count += 1 # type: ignore[attr-defined]
229
-
230
- total = max(len(self._id_map) + self._stale_count, 1)
231
- stale_fraction = self._stale_count / total
232
- if stale_fraction > 0.20 and len(self._id_map) > 0:
233
- logger.info(f"HNSW stale fraction {stale_fraction:.1%} — rebuilding index.")
234
- existing = [
235
- (fid2, self._vector_cache[nid])
236
- for fid2, nid in self._id_map.items()
237
- if nid in self._vector_cache
238
- ]
239
- self._build_hnsw_index(existing)
240
- self._stale_count = 0
 
 
 
 
 
 
 
 
 
 
241
 
242
  def search(self, query_data: np.ndarray, top_k: int = 10) -> List[Tuple[str, float]]:
243
  """
244
  Search for top-k nearest neighbours.
245
 
246
- Args:
247
- query_data: Packed uint8 query array (D/8 bytes).
248
- top_k: Number of results to return.
249
-
250
  Returns:
251
  List of (node_id, similarity_score) sorted by descending similarity.
252
  similarity = 1 - normalised_hamming_distance ∈ [0, 1].
@@ -254,8 +250,25 @@ class HNSWIndexManager:
254
  if not FAISS_AVAILABLE or self._index is None or not self._id_map:
255
  return []
256
 
257
- k = min(top_k, len(self._id_map))
258
- q = np.expand_dims(query_data, axis=0)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
259
 
260
  try:
261
  distances, ids = self._index.search(q, k)
@@ -265,43 +278,59 @@ class HNSWIndexManager:
265
 
266
  results: List[Tuple[str, float]] = []
267
  for dist, idx in zip(distances[0], ids[0]):
268
- if idx == -1:
269
  continue
270
-
271
- if self._use_hnsw:
272
- # HNSW returns 0-based position indices; map back through insertion order
273
- node_id = self._position_to_node_id(int(idx))
274
- else:
275
- node_id = self._id_map.get(int(idx))
276
-
277
- if node_id:
278
- sim = 1.0 - float(dist) / self.dimension
279
  results.append((node_id, sim))
 
 
280
 
281
  return results
282
 
283
- def _position_to_node_id(self, position: int) -> Optional[str]:
284
- """
285
- Map HNSW sequential position back to node_id.
286
- Positions correspond to insertion order; we track this via _position_map.
287
- """
288
- if not hasattr(self, "_position_map"):
289
- object.__setattr__(self, "_position_map", {})
290
- pm: Dict[int, str] = self._position_map # type: ignore[attr-defined]
291
-
292
- # Rebuild position map if needed (after index rebuild)
293
- if len(pm) < len(self._id_map):
294
- pm.clear()
295
- for pos, (fid, nid) in enumerate(
296
- sorted(self._id_map.items(), key=lambda x: x[0])
297
- ):
298
- pm[pos] = nid
299
-
300
- return pm.get(position)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
301
 
302
  @property
303
  def size(self) -> int:
304
- return len(self._id_map)
305
 
306
  @property
307
  def index_type(self) -> str:
@@ -318,4 +347,5 @@ class HNSWIndexManager:
318
  "ef_construction": self.ef_construction if self._use_hnsw else None,
319
  "ef_search": self.ef_search if self._use_hnsw else None,
320
  "faiss_available": FAISS_AVAILABLE,
 
321
  }
 
50
  # HNSW Index Manager #
51
  # ------------------------------------------------------------------ #
52
 
53
+ import json
54
+ from pathlib import Path
55
+ from threading import Lock
56
+ from .config import get_config
57
+
58
  class HNSWIndexManager:
59
  """
60
  Manages a FAISS HNSW binary ANN index for the HOT tier.
61
+ Thread-safe singleton with disk persistence.
62
 
63
  Automatically switches between:
64
  - IndexBinaryFlat (N < FLAT_THRESHOLD — exact, faster for small N)
65
  - IndexBinaryHNSW (N ≥ FLAT_THRESHOLD — approx, faster for large N)
 
 
 
66
  """
67
 
68
+ _instance: "HNSWIndexManager | None" = None
69
+ _singleton_lock: Lock = Lock()
70
+
71
    def __new__(cls, *args, **kwargs) -> "HNSWIndexManager":
        # Process-wide singleton: the first construction wins, every later
        # call returns the same object. Creation is guarded by a class-level
        # lock so two threads cannot race to create separate instances.
        with cls._singleton_lock:
            if cls._instance is None:
                obj = super().__new__(cls)
                # Flag read by __init__ so re-construction becomes a no-op.
                obj._initialized = False
                cls._instance = obj
            return cls._instance
78
+
79
  def __init__(
80
  self,
81
  dimension: int = 16384,
 
83
  ef_construction: int = DEFAULT_EF_CONSTRUCTION,
84
  ef_search: int = DEFAULT_EF_SEARCH,
85
  ):
86
+ if getattr(self, "_initialized", False):
87
+ return
88
+
89
  self.dimension = dimension
90
  self.m = m
91
  self.ef_construction = ef_construction
92
  self.ef_search = ef_search
93
 
94
+ self._write_lock = Lock()
 
 
 
 
95
 
96
+ self._id_map: List[Optional[str]] = []
97
+ self._vector_store: List[np.ndarray] = []
98
+ self._use_hnsw = False
99
+ self._stale_count = 0
100
  self._index = None
101
+
102
+ config = get_config()
103
+ data_dir = Path(config.paths.data_dir if hasattr(config, 'paths') else "./data")
104
+ data_dir.mkdir(parents=True, exist_ok=True)
105
+
106
+ self.INDEX_PATH = data_dir / "mnemocore_hnsw.faiss"
107
+ self.IDMAP_PATH = data_dir / "mnemocore_hnsw_idmap.json"
108
+ self.VECTOR_PATH = data_dir / "mnemocore_hnsw_vectors.npy"
109
 
110
  if FAISS_AVAILABLE:
111
+ if self.INDEX_PATH.exists() and self.IDMAP_PATH.exists() and self.VECTOR_PATH.exists():
112
+ self._load()
113
+ else:
114
+ self._build_flat_index()
115
+
116
+ self._initialized = True
117
 
118
  # ---- Index construction -------------------------------------- #
119
 
120
    def _build_flat_index(self) -> None:
        """
        Create a fresh IndexBinaryFlat (exact Hamming ANN).

        Note: this only replaces ``self._index``; ``_id_map`` and
        ``_vector_store`` are left untouched — callers that rebuild after
        deletions (see ``remove``) re-add the surviving vectors and compact
        the maps themselves.
        """
        self._index = faiss.IndexBinaryFlat(self.dimension)
        self._use_hnsw = False
        logger.debug(f"Built FAISS flat binary index (dim={self.dimension})")
125
 
126
    def _build_hnsw_index(self) -> None:
        """
        Build an HNSW binary index and optionally re-populate with existing vectors.

        Entries whose id slot is None (soft-deleted by ``remove``) are dropped
        during re-population, so ``_id_map``/``_vector_store`` come out
        compacted and ``_stale_count`` resets to 0.
        """
        hnsw = faiss.IndexBinaryHNSW(self.dimension, self.m)
        hnsw.hnsw.efConstruction = self.ef_construction
        hnsw.hnsw.efSearch = self.ef_search

        if self._vector_store:
            # Compact the index to remove None entries, preserving insertion
            # order so FAISS row i still corresponds to _id_map[i].
            compact_ids = []
            compact_vecs = []
            for i, node_id in enumerate(self._id_map):
                if node_id is not None:
                    compact_ids.append(node_id)
                    compact_vecs.append(self._vector_store[i])

            if compact_vecs:
                vecs = np.stack(compact_vecs)
                hnsw.add(vecs)

            self._id_map = compact_ids
            self._vector_store = compact_vecs
            self._stale_count = 0

        self._index = hnsw
        self._use_hnsw = True
 
157
 
158
    def _maybe_upgrade_to_hnsw(self) -> None:
        """Upgrade to HNSW index if HOT tier has grown large enough."""
        if not FAISS_AVAILABLE or self._use_hnsw:
            return
        # Count only live entries — soft-deleted (None) slots inflate
        # len(_id_map) but should not trigger an upgrade.
        active_count = len(self._id_map) - self._stale_count
        if active_count < FLAT_THRESHOLD:
            return

        logger.info(
            f"HOT tier size ({active_count}) ≥ threshold ({FLAT_THRESHOLD}) "
            "— upgrading to HNSW index."
        )

        self._build_hnsw_index()
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
172
 
173
  # ---- Public API --------------------------------------------- #
174
 
 
183
  if not FAISS_AVAILABLE or self._index is None:
184
  return
185
 
186
+ vec = np.ascontiguousarray(np.expand_dims(hdv_data, axis=0))
 
 
 
 
 
 
187
 
188
+ with self._write_lock:
189
+ try:
 
190
  self._index.add(vec)
191
+ self._id_map.append(node_id)
192
+ self._vector_store.append(hdv_data.copy())
193
+ except Exception as exc:
194
+ logger.error(f"HNSW/FAISS add failed for {node_id}: {repr(exc)}")
195
+ return
 
196
 
197
+ self._maybe_upgrade_to_hnsw()
198
+ self._save()
199
 
200
    def remove(self, node_id: str) -> None:
        """
        Remove a node from the index.
        Marks node as deleted and rebuilds index lazily when the deletion rate exceeds 20%.

        FAISS binary indexes here are append-only, so removal is a soft
        delete: the id slot becomes None and the row stays in the FAISS index
        until the next rebuild. Unknown node_ids are silently ignored
        (the ValueError from list.index is deliberately swallowed).
        """
        if not FAISS_AVAILABLE or self._index is None:
            return

        with self._write_lock:
            try:
                fid = self._id_map.index(node_id)
                self._id_map[fid] = None
                self._stale_count += 1

                total = max(len(self._id_map), 1)
                stale_fraction = self._stale_count / total

                if stale_fraction > 0.20 and len(self._id_map) > 0:
                    logger.info(f"HNSW stale fraction {stale_fraction:.1%} — rebuilding index.")
                    if self._use_hnsw:
                        # HNSW rebuild compacts _id_map/_vector_store itself.
                        self._build_hnsw_index()
                    else:
                        # Flat rebuild gives an empty index; compact and
                        # re-add the surviving vectors here.
                        self._build_flat_index()
                        if self._vector_store:
                            compact_ids = []
                            compact_vecs = []
                            for i, nid in enumerate(self._id_map):
                                if nid is not None:
                                    compact_ids.append(nid)
                                    compact_vecs.append(self._vector_store[i])
                            if compact_vecs:
                                vecs = np.ascontiguousarray(np.stack(compact_vecs))
                                self._index.add(vecs)
                            self._id_map = compact_ids
                            self._vector_store = compact_vecs
                            self._stale_count = 0

                # Persist the (possibly rebuilt) state after every removal.
                self._save()
            except ValueError:
                pass
240
+
241
 
242
  def search(self, query_data: np.ndarray, top_k: int = 10) -> List[Tuple[str, float]]:
243
  """
244
  Search for top-k nearest neighbours.
245
 
 
 
 
 
246
  Returns:
247
  List of (node_id, similarity_score) sorted by descending similarity.
248
  similarity = 1 - normalised_hamming_distance ∈ [0, 1].
 
250
  if not FAISS_AVAILABLE or self._index is None or not self._id_map:
251
  return []
252
 
253
+ # Fetch more to account for deleted (None) entries
254
+ k = min(top_k + self._stale_count, len(self._id_map))
255
+ if k <= 0:
256
+ return []
257
+
258
+ index_dimension = int(getattr(self._index, "d", self.dimension) or self.dimension)
259
+ query_bytes = np.ascontiguousarray(query_data, dtype=np.uint8).reshape(-1)
260
+ expected_bytes = index_dimension // 8
261
+ if expected_bytes > 0 and query_bytes.size != expected_bytes:
262
+ logger.warning(
263
+ f"HNSW query dimension mismatch: index={index_dimension} bits ({expected_bytes} bytes), "
264
+ f"query={query_bytes.size} bytes. Adjusting query to index dimension."
265
+ )
266
+ if query_bytes.size > expected_bytes:
267
+ query_bytes = query_bytes[:expected_bytes]
268
+ else:
269
+ query_bytes = np.pad(query_bytes, (0, expected_bytes - query_bytes.size), mode="constant")
270
+
271
+ q = np.expand_dims(query_bytes, axis=0)
272
 
273
  try:
274
  distances, ids = self._index.search(q, k)
 
278
 
279
  results: List[Tuple[str, float]] = []
280
  for dist, idx in zip(distances[0], ids[0]):
281
+ if idx < 0 or idx >= len(self._id_map):
282
  continue
283
+
284
+ node_id = self._id_map[idx]
285
+ if node_id is not None:
286
+ sim = 1.0 - float(dist) / max(index_dimension, 1)
287
+ sim = float(np.clip(sim, 0.0, 1.0))
 
 
 
 
288
  results.append((node_id, sim))
289
+ if len(results) >= top_k:
290
+ break
291
 
292
  return results
293
 
294
    def _save(self):
        """
        Persist the FAISS index, id map, and raw vectors to disk (best-effort).

        Failures are logged and swallowed so a persistence problem never
        breaks the in-memory index.
        """
        try:
            faiss.write_index_binary(self._index, str(self.INDEX_PATH))
            with open(self.IDMAP_PATH, "w") as f:
                json.dump({
                    "id_map": self._id_map,
                    "use_hnsw": self._use_hnsw,
                    "stale_count": self._stale_count
                }, f)
            # NOTE(review): when _vector_store is empty the previous .npy file
            # is left untouched on disk — confirm this cannot desync with the
            # freshly written id map.
            if self._vector_store:
                np.save(str(self.VECTOR_PATH), np.stack(self._vector_store))
        except Exception as e:
            logger.error(f"Failed to save HNSW index state: {e}")
307
+
308
    def _load(self):
        """
        Restore the index, id map, and vectors persisted by ``_save``.

        If the stored index dimension differs from the configured one, the
        stored dimension wins (logged as a warning). On any failure the
        manager falls back to a fresh empty flat index.
        """
        try:
            self._index = faiss.read_index_binary(str(self.INDEX_PATH))
            index_dimension = int(getattr(self._index, "d", self.dimension) or self.dimension)
            if index_dimension != self.dimension:
                logger.warning(
                    f"HNSW index dimension mismatch on load: config={self.dimension}, index={index_dimension}. "
                    "Using index dimension."
                )
                self.dimension = index_dimension
            with open(self.IDMAP_PATH, "r") as f:
                state = json.load(f)
                self._id_map = state.get("id_map", [])
                self._use_hnsw = state.get("use_hnsw", False)
                self._stale_count = state.get("stale_count", 0)

            vecs = np.load(str(self.VECTOR_PATH))
            self._vector_store = list(vecs)
            logger.info("Loaded HNSW persistent state from disk")
        except Exception as e:
            logger.error(f"Failed to load HNSW index state: {e}")
            self._build_flat_index()
330
 
331
  @property
332
  def size(self) -> int:
333
+ return len([x for x in self._id_map if x is not None])
334
 
335
  @property
336
  def index_type(self) -> str:
 
347
  "ef_construction": self.ef_construction if self._use_hnsw else None,
348
  "ef_search": self.ef_search if self._use_hnsw else None,
349
  "faiss_available": FAISS_AVAILABLE,
350
+ "stale_count": self._stale_count
351
  }
src/mnemocore/core/memory_model.py ADDED
@@ -0,0 +1,132 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Memory Models
3
+ =============
4
+ Data classes mapping the Cognitive Architecture Phase 5 entities:
5
+ Working Memory (WM), Episodic Memory (EM), Semantic Memory (SM),
6
+ Procedural Memory (PM), and Meta-Memory (MM).
7
+ """
8
+
9
+ from dataclasses import dataclass, field
10
+ from datetime import datetime
11
+ from typing import Any, Literal, Optional, List
12
+
13
+ from .binary_hdv import BinaryHDV
14
+
15
+
16
+ # --- Working Memory (WM) ---
17
+
18
@dataclass
class WorkingMemoryItem:
    """A single short-lived item held in an agent's working memory."""

    id: str                       # unique item identifier
    agent_id: str                 # owning agent
    created_at: datetime          # creation timestamp
    ttl_seconds: int              # time-to-live; expiry presumably enforced by the WM manager — confirm
    content: str                  # raw textual content
    kind: Literal["thought", "observation", "goal", "plan_step", "action", "meta"]
    importance: float             # relative priority weight
    tags: List[str]               # free-form classification tags
    hdv: Optional[BinaryHDV] = None  # optional hyperdimensional encoding of the content
29
+
30
+
31
@dataclass
class WorkingMemoryState:
    """Snapshot of one agent's working memory (bounded item list)."""

    agent_id: str    # owning agent
    max_items: int   # capacity bound; eviction policy presumably applied elsewhere — confirm
    items: List[WorkingMemoryItem] = field(default_factory=list)
36
+
37
+
38
+ # --- Episodic Memory (EM) ---
39
+
40
@dataclass
class EpisodeEvent:
    """One timestamped event inside an Episode."""

    timestamp: datetime
    kind: Literal["observation", "action", "thought", "reward", "error", "system"]
    content: str
    metadata: dict[str, Any]         # free-form per-event payload
    hdv: Optional[BinaryHDV] = None  # optional hyperdimensional encoding
47
+
48
+
49
@dataclass
class Episode:
    """
    A bounded sequence of events experienced by one agent.

    An episode is "active" while ``ended_at`` is None (see ``is_active``).
    """

    id: str
    agent_id: str
    started_at: datetime
    ended_at: Optional[datetime]  # None while the episode is still running
    goal: Optional[str]
    context: Optional[str]
    events: List[EpisodeEvent]
    outcome: Literal["success", "failure", "partial", "unknown", "in_progress"]
    reward: Optional[float]
    links_prev: List[str]         # presumably ids of temporally adjacent episodes — confirm
    links_next: List[str]
    ltp_strength: float           # long-term-potentiation strength
    reliability: float

    @property
    def is_active(self) -> bool:
        """True while the episode has not been closed (no end timestamp)."""
        return self.ended_at is None
68
+
69
+
70
+ # --- Semantic Memory (SM) ---
71
+
72
@dataclass
class SemanticConcept:
    """A consolidated concept distilled from one or more episodes."""

    id: str
    label: str                     # short human-readable name
    description: str
    tags: List[str]
    prototype_hdv: BinaryHDV       # prototype vector representing the concept
    support_episode_ids: List[str] # episodes this concept was derived from
    reliability: float
    last_updated_at: datetime
    metadata: dict[str, Any]
83
+
84
+
85
+ # --- Procedural Memory (PM) ---
86
+
87
@dataclass
class ProcedureStep:
    """One ordered step of a Procedure."""

    order: int                                # 0-based or 1-based position — confirm with producers
    instruction: str                          # natural-language instruction
    code_snippet: Optional[str] = None        # optional executable snippet
    tool_call: Optional[dict[str, Any]] = None  # optional structured tool invocation
93
+
94
+
95
@dataclass
class Procedure:
    """A reusable skill/workflow with trigger matching and success tracking."""

    id: str
    name: str
    description: str
    created_by_agent: Optional[str]  # None means a system-global procedure
    created_at: datetime
    updated_at: datetime
    steps: List[ProcedureStep]
    trigger_pattern: str             # substring matched against queries (see ProceduralStoreService)
    success_count: int
    failure_count: int
    reliability: float
    tags: List[str]
110
+
111
+ # --- Meta-Memory (MM) ---
112
+
113
@dataclass
class SelfMetric:
    """A single self-observation metric reading."""

    name: str
    value: float
    window: str  # e.g. "5m", "1h", "24h"
    updated_at: datetime
119
+
120
+
121
@dataclass
class SelfImprovementProposal:
    """A proposed change to the memory substrate, tracked through review."""

    id: str
    created_at: datetime
    author: Literal["system", "agent", "human"]
    title: str
    description: str
    rationale: str        # why the change is believed beneficial
    expected_effect: str  # predicted observable outcome
    status: Literal["pending", "accepted", "rejected", "implemented"]
    metadata: dict[str, Any]
132
+
src/mnemocore/core/meta_memory.py ADDED
@@ -0,0 +1,70 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Meta Memory Service
3
+ ===================
4
+ Maintains a self-model of the memory substrate, gathering metrics and surfacing self-improvement proposals.
5
+ Plays a crucial role in enabling an AGI system to observe and upgrade its own thinking architectures over time.
6
+ """
7
+
8
import logging
import threading
from datetime import datetime, timezone
from typing import Dict, List, Optional

from .memory_model import SelfMetric, SelfImprovementProposal
14
+
15
+ logger = logging.getLogger(__name__)
16
+
17
+
18
class MetaMemoryService:
    """
    Maintains a self-model of the memory substrate: an append-only metric
    history plus a queue of self-improvement proposals.

    All public methods are thread-safe (guarded by a single RLock).
    """

    # History bounds: once the metric list exceeds _METRICS_CAP entries it is
    # trimmed to the most recent _METRICS_KEEP so memory stays bounded.
    _METRICS_CAP = 10000
    _METRICS_KEEP = 5000

    def __init__(self):
        self._metrics: List[SelfMetric] = []
        self._proposals: Dict[str, SelfImprovementProposal] = {}
        self._lock = threading.RLock()

    def record_metric(self, name: str, value: float, window: str) -> None:
        """
        Log a new performance or algorithmic metric reading.

        Args:
            name: Metric identifier.
            value: Observed value.
            window: Aggregation window label (e.g. "5m", "1h", "24h").
        """
        with self._lock:
            # We strictly bind this to metrics history for Subconscious AI trend analysis.
            # Fix: use timezone-aware UTC — datetime.utcnow() is naive and
            # deprecated, and sibling modules (e.g. prediction_store) already
            # store aware timestamps.
            metric = SelfMetric(
                name=name, value=value, window=window,
                updated_at=datetime.now(timezone.utc),
            )
            self._metrics.append(metric)

            # Cap local metrics storage bounds
            if len(self._metrics) > self._METRICS_CAP:
                self._metrics = self._metrics[-self._METRICS_KEEP:]

            logger.debug(f"Recorded meta-metric: {name}={value} ({window})")

    def list_metrics(self, limit: int = 100, window: Optional[str] = None) -> List[SelfMetric]:
        """Fetch up to `limit` most recent metrics, optionally filtered by window."""
        with self._lock:
            filtered = [m for m in self._metrics if (not window) or m.window == window]
            filtered.sort(key=lambda x: x.updated_at, reverse=True)
            return filtered[:limit]

    def create_proposal(self, proposal: SelfImprovementProposal) -> str:
        """Inject a formally modeled improvement prompt into the queue; returns its id."""
        with self._lock:
            self._proposals[proposal.id] = proposal
            logger.info(f"New self-improvement proposal created by {proposal.author}: {proposal.title}")
            return proposal.id

    def update_proposal_status(self, proposal_id: str, status: str) -> None:
        """
        Mark a proposal as accepted, rejected, or implemented by the oversight entity.

        Unknown proposal ids are logged and ignored (no exception raised).
        """
        with self._lock:
            proposal = self._proposals.get(proposal_id)
            if not proposal:
                logger.warning(f"Could not update unknown proposal ID: {proposal_id}")
                return

            proposal.status = status  # type: ignore
            logger.info(f"Proposal {proposal_id} status escalated to: {status}")

    def list_proposals(self, status: Optional[str] = None) -> List[SelfImprovementProposal]:
        """Retrieve proposals matching a given state (all when status is None)."""
        with self._lock:
            if status:
                return [p for p in self._proposals.values() if p.status == status]
            return list(self._proposals.values())
+
src/mnemocore/core/node.py CHANGED
@@ -1,11 +1,16 @@
 
 
1
  from dataclasses import dataclass, field
2
  from datetime import datetime, timezone
3
- from typing import Dict, Any, Optional
4
  import math
5
 
6
  from .binary_hdv import BinaryHDV
7
  from .config import get_config
8
 
 
 
 
9
 
10
  @dataclass
11
  class MemoryNode:
@@ -35,6 +40,15 @@ class MemoryNode:
35
  # Phase 4.3: Episodic Chaining - links to temporally adjacent memories
36
  previous_id: Optional[str] = None # UUID of the memory created immediately before this one
37
 
 
 
 
 
 
 
 
 
 
38
  def access(self, update_weights: bool = True):
39
  """Retrieve memory (reconsolidation)"""
40
  now = datetime.now(timezone.utc)
@@ -46,6 +60,11 @@ class MemoryNode:
46
  # We recalculate based on new access count
47
  self.calculate_ltp()
48
 
 
 
 
 
 
49
  # Legacy updates
50
  self.epistemic_value *= 1.01
51
  self.epistemic_value = min(self.epistemic_value, 1.0)
 
1
+ from __future__ import annotations
2
+
3
  from dataclasses import dataclass, field
4
  from datetime import datetime, timezone
5
+ from typing import TYPE_CHECKING, Dict, Any, Optional
6
  import math
7
 
8
  from .binary_hdv import BinaryHDV
9
  from .config import get_config
10
 
11
+ if TYPE_CHECKING:
12
+ from .provenance import ProvenanceRecord
13
+
14
 
15
  @dataclass
16
  class MemoryNode:
 
40
  # Phase 4.3: Episodic Chaining - links to temporally adjacent memories
41
  previous_id: Optional[str] = None # UUID of the memory created immediately before this one
42
 
43
+ # Phase 5.0 — Agent 1: Trust & Provenance
44
+ provenance: Optional["ProvenanceRecord"] = field(default=None, repr=False)
45
+
46
+ # Phase 5.0 — Agent 2: Adaptive Temporal Decay
47
+ # Per-memory stability: S_i = S_base * (1 + k * access_count)
48
+ # Starts at 1.0; increases logarithmically on access.
49
+ stability: float = 1.0
50
+ review_candidate: bool = False # Set by ForgettingCurveManager when near decay threshold
51
+
52
  def access(self, update_weights: bool = True):
53
  """Retrieve memory (reconsolidation)"""
54
  now = datetime.now(timezone.utc)
 
60
  # We recalculate based on new access count
61
  self.calculate_ltp()
62
 
63
+ # Phase 5.0: update per-memory stability on each successful access
64
+ # S_i grows logarithmically so older frequently-accessed memories are more stable
65
+ import math as _math
66
+ self.stability = max(1.0, 1.0 + _math.log1p(self.access_count) * 0.5)
67
+
68
  # Legacy updates
69
  self.epistemic_value *= 1.01
70
  self.epistemic_value = min(self.epistemic_value, 1.0)
src/mnemocore/core/prediction_store.py ADDED
@@ -0,0 +1,294 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Prediction Memory Store (Phase 5.0 — Agent 4)
3
+ ==============================================
4
+ Stores explicitly made predictions about future events and tracks their outcomes.
5
+
6
+ A prediction has a lifecycle:
7
+ pending → verified (correct) OR falsified (wrong) OR expired (deadline passed)
8
+
9
+ Key behaviors:
10
+ - Verified predictions STRENGTHEN related strategic memories via synaptic binding
11
+ - Falsified predictions REDUCE confidence on related memories + generate a
12
+ "lesson learned" via SubconsciousAI
13
+ - Expired predictions are flagged for manual review
14
+
15
+ Backed by a lightweight in-memory + provenance-attached store.
16
+ For persistence, predictions are serialized to node.metadata["prediction"] and
17
+ stored as regular MemoryNodes in the HOT tier with a special tag.
18
+
19
+ Public API:
20
+ store = PredictionStore()
21
+ pred_id = store.create(content="...", confidence=0.7, deadline_days=90)
22
+ store.verify(pred_id, success=True, notes="EU AI Act enforced")
23
+ due = store.get_due() # predictions past their deadline
24
+ """
25
+
26
+ from __future__ import annotations
27
+
28
+ import uuid
29
+ from dataclasses import dataclass, field
30
+ from datetime import datetime, timezone, timedelta
31
+ from typing import Any, Dict, List, Optional
32
+
33
+ from loguru import logger
34
+
35
+
36
+ # ------------------------------------------------------------------ #
37
+ # Prediction status constants #
38
+ # ------------------------------------------------------------------ #
39
+
40
STATUS_PENDING = "pending"
STATUS_VERIFIED = "verified"
STATUS_FALSIFIED = "falsified"
STATUS_EXPIRED = "expired"


# ------------------------------------------------------------------ #
#  PredictionRecord                                                  #
# ------------------------------------------------------------------ #

@dataclass
class PredictionRecord:
    """A single forward-looking prediction stored in MnemoCore."""

    id: str = field(default_factory=lambda: f"pred_{uuid.uuid4().hex[:16]}")
    content: str = ""
    predicted_at: str = field(
        default_factory=lambda: datetime.now(timezone.utc).isoformat()
    )
    verification_deadline: Optional[str] = None  # ISO datetime string
    confidence_at_creation: float = 0.5
    status: str = STATUS_PENDING
    outcome: Optional[bool] = None  # True=verified, False=falsified
    verification_notes: Optional[str] = None
    verified_at: Optional[str] = None
    related_memory_ids: List[str] = field(default_factory=list)
    tags: List[str] = field(default_factory=list)

    def is_expired(self) -> bool:
        """True if the deadline has passed and status is still pending."""
        if self.verification_deadline is None or self.status != STATUS_PENDING:
            return False
        due = datetime.fromisoformat(self.verification_deadline)
        if due.tzinfo is None:
            # Naive deadlines are interpreted as UTC.
            due = due.replace(tzinfo=timezone.utc)
        return due < datetime.now(timezone.utc)

    def to_dict(self) -> Dict[str, Any]:
        """Serialize to a plain dict (confidence rounded to 4 decimals)."""
        payload: Dict[str, Any] = {
            "id": self.id,
            "content": self.content,
            "predicted_at": self.predicted_at,
            "verification_deadline": self.verification_deadline,
            "confidence_at_creation": round(self.confidence_at_creation, 4),
            "status": self.status,
            "outcome": self.outcome,
            "verification_notes": self.verification_notes,
            "verified_at": self.verified_at,
            "related_memory_ids": self.related_memory_ids,
            "tags": self.tags,
        }
        return payload

    @classmethod
    def from_dict(cls, d: Dict[str, Any]) -> "PredictionRecord":
        """Rebuild a record from its dict form; absent keys keep field defaults."""
        rec = cls()
        for key in (
            "id",
            "content",
            "predicted_at",
            "verification_deadline",
            "confidence_at_creation",
            "status",
            "outcome",
            "verification_notes",
            "verified_at",
            "related_memory_ids",
            "tags",
        ):
            if key in d:
                setattr(rec, key, d[key])
        return rec
107
+
108
+
109
+ # ------------------------------------------------------------------ #
110
+ # PredictionStore #
111
+ # ------------------------------------------------------------------ #
112
+
113
class PredictionStore:
    """
    In-memory store for PredictionRecords with lifecycle management.

    For production use, wire to an engine so verified/falsified predictions
    can update related MemoryNode synapses and generate LLM insights.
    """

    def __init__(self, engine=None) -> None:
        # engine: optional MnemoCore engine; when present, verify() propagates
        # outcomes into related memories via the private helpers below.
        self.engine = engine
        self._records: Dict[str, PredictionRecord] = {}

    # ---- CRUD ---------------------------------------------------- #

    def create(
        self,
        content: str,
        confidence: float = 0.5,
        deadline_days: Optional[float] = None,
        deadline: Optional[datetime] = None,
        related_memory_ids: Optional[List[str]] = None,
        tags: Optional[List[str]] = None,
    ) -> str:
        """
        Store a new prediction.

        Args:
            content: The prediction statement.
            confidence: Confidence at creation time [0, 1] (clamped below).
            deadline_days: Days from now until deadline (alternative to deadline).
            deadline: Explicit deadline datetime (overrides deadline_days).
            related_memory_ids: IDs of memories this prediction relates to.
            tags: Optional classification tags.

        Returns:
            The prediction ID.
        """
        deadline_iso: Optional[str] = None
        if deadline is not None:
            # Naive datetimes are interpreted as UTC.
            if deadline.tzinfo is None:
                deadline = deadline.replace(tzinfo=timezone.utc)
            deadline_iso = deadline.isoformat()
        elif deadline_days is not None:
            deadline_iso = (
                datetime.now(timezone.utc) + timedelta(days=deadline_days)
            ).isoformat()

        rec = PredictionRecord(
            content=content,
            # Clamp confidence into [0, 1] before storing.
            confidence_at_creation=max(0.0, min(1.0, confidence)),
            verification_deadline=deadline_iso,
            related_memory_ids=related_memory_ids or [],
            tags=tags or [],
        )
        self._records[rec.id] = rec
        logger.info(
            f"Prediction created: {rec.id} | confidence={confidence:.2f} | "
            f"deadline={deadline_iso or 'none'}"
        )
        return rec.id

    def get(self, pred_id: str) -> Optional[PredictionRecord]:
        """Return the record for pred_id, or None if unknown."""
        return self._records.get(pred_id)

    def list_all(self, status: Optional[str] = None) -> List[PredictionRecord]:
        """Return all predictions, optionally filtered by status."""
        recs = list(self._records.values())
        if status:
            recs = [r for r in recs if r.status == status]
        # predicted_at is an ISO-8601 string, so lexicographic sort matches
        # chronological order for same-offset timestamps.
        return sorted(recs, key=lambda r: r.predicted_at, reverse=True)

    def get_due(self) -> List[PredictionRecord]:
        """Return pending predictions that have passed their deadline."""
        return [r for r in self._records.values() if r.is_expired()]

    # ---- Lifecycle ----------------------------------------------- #

    async def verify(
        self,
        pred_id: str,
        success: bool,
        notes: Optional[str] = None,
    ) -> Optional[PredictionRecord]:
        """
        Verify or falsify a prediction.

        Side effects:
            - Verified: strengthens related memories via synaptic binding
            - Falsified: reduces confidence on related memories + lesson learned

        Returns the updated record, or None for an unknown id.
        """
        rec = self._records.get(pred_id)
        if rec is None:
            logger.warning(f"PredictionStore.verify: unknown id {pred_id!r}")
            return None

        rec.status = STATUS_VERIFIED if success else STATUS_FALSIFIED
        rec.outcome = success
        rec.verification_notes = notes
        rec.verified_at = datetime.now(timezone.utc).isoformat()

        logger.info(
            f"Prediction {pred_id} → {rec.status} | notes={notes or '—'}"
        )

        # Engine side-effects only when wired to an engine.
        if self.engine is not None:
            if success:
                await self._strengthen_related(rec)
            else:
                await self._weaken_related(rec)
                await self._generate_lesson(rec)

        return rec

    async def expire_due(self) -> List[PredictionRecord]:
        """Mark overdue pending predictions as expired. Returns expired list."""
        due = self.get_due()
        for rec in due:
            rec.status = STATUS_EXPIRED
            logger.info(f"Prediction {rec.id} expired (deadline passed).")
        return due

    # ---- Engine integration -------------------------------------- #

    async def _strengthen_related(self, rec: PredictionRecord) -> None:
        """Verified prediction → strengthen synapses on related memories."""
        for mem_id in rec.related_memory_ids:
            try:
                node = await self.engine.get_memory(mem_id)
                if node:
                    # synapse_index is optional on the engine; skip if absent.
                    si = getattr(self.engine, "synapse_index", None)
                    if si:
                        si.add_or_strengthen(rec.id, mem_id, delta=0.15)
                        logger.debug(f"Prediction {rec.id}: strengthened memory {mem_id[:8]}")
            except Exception as exc:
                # Best-effort: a single failed memory must not abort the rest.
                logger.debug(f"Prediction strengthen failed for {mem_id}: {exc}")

    async def _weaken_related(self, rec: PredictionRecord) -> None:
        """Falsified prediction → reduce confidence on related memories."""
        for mem_id in rec.related_memory_ids:
            try:
                node = await self.engine.get_memory(mem_id)
                if node:
                    # Local import avoids a module-level import cycle.
                    from .bayesian_ltp import get_bayesian_updater
                    updater = get_bayesian_updater()
                    updater.observe_node_retrieval(node, helpful=False, eig_signal=0.5)
                    logger.debug(f"Prediction {rec.id}: weakened memory {mem_id[:8]}")
            except Exception as exc:
                logger.debug(f"Prediction weaken failed for {mem_id}: {exc}")

    async def _generate_lesson(self, rec: PredictionRecord) -> None:
        """Ask SubconsciousAI to synthesize a 'lesson learned' for a falsified prediction."""
        try:
            # subconscious_ai is optional on the engine; silently skip if absent.
            subcon = getattr(self.engine, "subconscious_ai", None)
            if subcon is None:
                return
            prompt = (
                f"The following prediction was FALSIFIED: '{rec.content}'. "
                f"Confidence at creation: {rec.confidence_at_creation:.2f}. "
                f"Notes: {rec.verification_notes or 'none'}. "
                "In 1-2 sentences, what is the key lesson learned from this failure?"
            )
            lesson = await subcon.generate(prompt, max_tokens=128)
            # Store the lesson as a new memory
            await self.engine.store(
                lesson.strip(),
                metadata={
                    "type": "lesson_learned",
                    "source_prediction_id": rec.id,
                    "domain": "strategic",
                }
            )
            logger.info(f"Lesson learned generated for falsified prediction {rec.id}")
        except Exception as exc:
            logger.debug(f"Lesson generation failed: {exc}")

    # ---- Serialization ------------------------------------------- #

    def to_list(self) -> List[Dict[str, Any]]:
        """Serialize every record via PredictionRecord.to_dict()."""
        return [r.to_dict() for r in self._records.values()]

    def __len__(self) -> int:
        return len(self._records)
src/mnemocore/core/preference_store.py ADDED
@@ -0,0 +1,53 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import numpy as np
2
+ from loguru import logger
3
+ from typing import List, Optional
4
+
5
+ from .binary_hdv import BinaryHDV, majority_bundle
6
+ from .config import PreferenceConfig
7
+
8
class PreferenceStore:
    """
    Phase 12.3: Preference Learning.

    Learns an implicit user-preference vector from logged decisions or
    feedback events. The vector marks the "preferred" region of HDV space
    and can be used to bias retrieval scores toward it.
    """

    def __init__(self, config: PreferenceConfig, dimension: int):
        self.config = config
        self.dimension = dimension
        # Learned "ideal" region of HDV space; None until the first decision.
        self.preference_vector: Optional[BinaryHDV] = None
        self.decision_history: List[BinaryHDV] = []

    def log_decision(self, context_hdv: BinaryHDV, outcome: float) -> None:
        """
        Record a decision or feedback event.

        A non-negative `outcome` pulls the preference vector toward
        `context_hdv`; a negative one pushes it away by bundling the
        inverted context instead. History is capped at
        `config.history_limit`, dropping the oldest entries.
        """
        if not self.config.enabled:
            return

        if outcome >= 0:
            shifted = context_hdv
        else:
            shifted = context_hdv.invert()
        self.decision_history.append(shifted)

        # Trim oldest entries beyond the configured history window.
        while len(self.decision_history) > self.config.history_limit:
            del self.decision_history[0]

        # Recompute the preference vector as the majority bundle of history.
        self.preference_vector = majority_bundle(self.decision_history)
        logger.debug(f"Logged decision (outcome={outcome:.2f}). Preference vector updated.")

    def bias_score(self, target_hdv: BinaryHDV, base_score: float) -> float:
        """
        Bias a retrieval score toward learned preferences.

        new_score = base_score + learning_rate * similarity(preference, target),
        so learning_rate is the maximum boost a perfectly matching item gets.
        Returns base_score unchanged when disabled or before any decision.
        """
        if not self.config.enabled:
            return base_score
        if self.preference_vector is None:
            return base_score

        affinity = self.preference_vector.similarity(target_hdv)
        return base_score + (self.config.learning_rate * affinity)
src/mnemocore/core/procedural_store.py ADDED
@@ -0,0 +1,77 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Procedural Store Service
3
+ ========================
4
+ Manages actionable skills, procedural routines, and agentic workflows.
5
+ Validates triggering patterns and tracks execution success rates dynamically.
6
+ """
7
+
8
+ from typing import Dict, List, Optional
9
+ import threading
10
+ import logging
11
+ from datetime import datetime
12
+
13
+ from .memory_model import Procedure
14
+
15
+ logger = logging.getLogger(__name__)
16
+
17
+
18
class ProceduralStoreService:
    """
    Thread-safe, in-memory registry of actionable skills (`Procedure`s).

    Supports trigger-based lookup and per-procedure success tracking. This
    prototype keeps everything in a plain dict; a production deployment would
    serialize to SQLite, JSON, or Qdrant.
    """

    def __init__(self):
        # Sole source of truth: procedure-ID -> Procedure.
        self._procedures: Dict[str, Procedure] = {}
        # Re-entrant lock so public methods stay safe if they ever nest.
        self._lock = threading.RLock()

    def store_procedure(self, proc: Procedure) -> None:
        """Save a new or refined procedure into memory."""
        with self._lock:
            # NOTE(review): naive UTC timestamp; datetime.utcnow() is
            # deprecated in 3.12+ — confirm downstream expects naive datetimes.
            proc.updated_at = datetime.utcnow()
            self._procedures[proc.id] = proc
            logger.info(f"Stored procedure {proc.id} ('{proc.name}')")

    def get_procedure(self, proc_id: str) -> Optional[Procedure]:
        """Retrieve a procedure by exact ID, or None if unknown."""
        with self._lock:
            return self._procedures.get(proc_id)

    def find_applicable_procedures(
        self, query: str, agent_id: Optional[str] = None, top_k: int = 5
    ) -> List[Procedure]:
        """
        Return up to `top_k` procedures whose trigger pattern or any tag occurs
        in `query` (case-insensitive substring match), best first.

        When `agent_id` is given, procedures owned by a *different* agent are
        skipped; procedures with no owner are treated as system globals.
        Results are ordered by reliability, then success count, descending.
        """
        needle = query.lower()
        with self._lock:
            matches: List[Procedure] = []
            for candidate in self._procedures.values():
                owner = candidate.created_by_agent
                if owner is not None and agent_id and owner != agent_id:
                    continue

                triggered = candidate.trigger_pattern.lower() in needle
                if not triggered:
                    triggered = any(tag.lower() in needle for tag in candidate.tags)
                if triggered:
                    matches.append(candidate)

            matches.sort(key=lambda p: (p.reliability, p.success_count), reverse=True)
            return matches[:top_k]

    def record_procedure_outcome(self, proc_id: str, success: bool) -> None:
        """
        Update success/failure counters and nudge reliability.

        Reliability rises by 0.05 per success and drops by 0.1 per failure
        (clamped to [0, 1]) — failures are deliberately weighted more heavily.
        Unknown IDs are ignored silently.
        """
        with self._lock:
            proc = self._procedures.get(proc_id)
            if proc is None:
                return

            proc.updated_at = datetime.utcnow()
            if success:
                proc.success_count += 1
                proc.reliability = min(1.0, proc.reliability + 0.05)
            else:
                proc.failure_count += 1
                proc.reliability = max(0.0, proc.reliability - 0.1)

            logger.debug(f"Procedure {proc_id} outcome recorded: success={success}, new rel={proc.reliability:.2f}")
77
+
src/mnemocore/core/provenance.py ADDED
@@ -0,0 +1,297 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Provenance Tracking Module (Phase 5.0)
3
+ =======================================
4
+ W3C PROV-inspired source tracking for MnemoCore memories.
5
+
6
+ Tracks the full lifecycle of every MemoryNode:
7
+ - origin: where/how the memory was created
8
+ - lineage: ordered list of transformation events
9
+ - version: incremented on each significant mutation
10
+
11
+ This is the foundation for:
12
+ - Trust & audit trails (AI Governance)
13
+ - Contradiction resolution
14
+ - Memory-as-a-Service lineage API
15
+ - Source reliability scoring
16
+
17
+ Public API:
18
+ record = ProvenanceRecord.new(origin_type="observation", agent_id="agent-001")
19
+ record.add_event("consolidated", source_memories=["mem_a", "mem_b"])
20
+ serialized = record.to_dict()
21
+ restored = ProvenanceRecord.from_dict(serialized)
22
+ """
23
+
24
+ from __future__ import annotations
25
+
26
+ from dataclasses import dataclass, field
27
+ from datetime import datetime, timezone
28
+ from typing import Any, Dict, List, Optional
29
+
30
+
31
+ # ------------------------------------------------------------------ #
32
+ # Origin types #
33
+ # ------------------------------------------------------------------ #
34
+
35
# Recognized values for ProvenanceOrigin.type; ProvenanceRecord.new() coerces
# anything outside this set to "observation".
ORIGIN_TYPES = {
    "observation",      # Direct input from agent or user
    "inference",        # Derived/reasoned by LLM or engine
    "dream",            # Produced by SubconsciousAI dream cycle
    "consolidation",    # Result of SemanticConsolidation merge
    "external_sync",    # Fetched from external source (RSS, API, etc.)
    "user_correction",  # Explicit user override
    "prediction",       # Stored as a future prediction
}
44
+
45
+
46
+ # ------------------------------------------------------------------ #
47
+ # Lineage event #
48
+ # ------------------------------------------------------------------ #
49
+
50
@dataclass
class LineageEvent:
    """
    One step in a memory's transformation history.

    Typical event names: created, accessed, consolidated, verified,
    contradicted, updated, archived, expired.
    """

    event: str
    timestamp: str  # ISO 8601
    actor: Optional[str] = None  # agent_id, "system", "user", etc.
    source_memories: List[str] = field(default_factory=list)  # inputs of a consolidation
    outcome: Optional[bool] = None  # verification result, when applicable
    notes: Optional[str] = None
    extra: Dict[str, Any] = field(default_factory=dict)

    def to_dict(self) -> Dict[str, Any]:
        """Serialize, omitting optional fields that are unset or empty."""
        out: Dict[str, Any] = {"event": self.event, "timestamp": self.timestamp}
        # (field name, value, include?) — order matches the serialized layout.
        optional_fields = (
            ("actor", self.actor, self.actor is not None),
            ("source_memories", self.source_memories, bool(self.source_memories)),
            ("outcome", self.outcome, self.outcome is not None),
            ("notes", self.notes, bool(self.notes)),
            ("extra", self.extra, bool(self.extra)),
        )
        for key, value, include in optional_fields:
            if include:
                out[key] = value
        return out

    @classmethod
    def from_dict(cls, d: Dict[str, Any]) -> "LineageEvent":
        """Inverse of to_dict(); missing optional keys fall back to defaults."""
        kwargs = {
            "event": d["event"],
            "timestamp": d["timestamp"],
            "actor": d.get("actor"),
            "source_memories": d.get("source_memories", []),
            "outcome": d.get("outcome"),
            "notes": d.get("notes"),
            "extra": d.get("extra", {}),
        }
        return cls(**kwargs)
101
+
102
+
103
+ # ------------------------------------------------------------------ #
104
+ # Origin #
105
+ # ------------------------------------------------------------------ #
106
+
107
@dataclass
class ProvenanceOrigin:
    """Where/how a memory was first created."""

    type: str  # Expected to be one of ORIGIN_TYPES
    agent_id: Optional[str] = None
    session_id: Optional[str] = None
    source_url: Optional[str] = None  # Populated for external_sync origins
    timestamp: str = field(
        default_factory=lambda: datetime.now(timezone.utc).isoformat()
    )

    def to_dict(self) -> Dict[str, Any]:
        """Serialize; falsy optional fields are omitted."""
        payload: Dict[str, Any] = {"type": self.type, "timestamp": self.timestamp}
        for key in ("agent_id", "session_id", "source_url"):
            value = getattr(self, key)
            if value:
                payload[key] = value
        return payload

    @classmethod
    def from_dict(cls, d: Dict[str, Any]) -> "ProvenanceOrigin":
        """Inverse of to_dict(); missing fields fall back to safe defaults."""
        return cls(
            type=d.get("type", "observation"),
            agent_id=d.get("agent_id"),
            session_id=d.get("session_id"),
            source_url=d.get("source_url"),
            timestamp=d.get("timestamp", datetime.now(timezone.utc).isoformat()),
        )
141
+
142
+
143
+ # ------------------------------------------------------------------ #
144
+ # ProvenanceRecord — the full provenance object on a MemoryNode #
145
+ # ------------------------------------------------------------------ #
146
+
147
@dataclass
class ProvenanceRecord:
    """
    Full provenance object attached to a MemoryNode.

    Serialized into node.metadata["provenance"] so existing storage layers
    need no schema change. `version` starts at 1 and is bumped by every
    lineage event (including the initial "created" event).
    """

    origin: ProvenanceOrigin
    lineage: List[LineageEvent] = field(default_factory=list)
    version: int = 1
    confidence_source: str = "bayesian_ltp"  # How the confidence score is derived

    # ---- Factory methods ------------------------------------------ #

    @classmethod
    def new(
        cls,
        origin_type: str = "observation",
        agent_id: Optional[str] = None,
        session_id: Optional[str] = None,
        source_url: Optional[str] = None,
        actor: Optional[str] = None,
    ) -> "ProvenanceRecord":
        """Create a fresh ProvenanceRecord and log the 'created' event."""
        # Unknown origin types are coerced to the safe default.
        effective_type = origin_type if origin_type in ORIGIN_TYPES else "observation"
        origin = ProvenanceOrigin(
            type=effective_type,
            agent_id=agent_id,
            session_id=session_id,
            source_url=source_url,
            timestamp=datetime.now(timezone.utc).isoformat(),
        )
        # add_event returns self, so this chains into the fresh record.
        return cls(origin=origin).add_event(
            event="created",
            actor=actor or agent_id or "system",
        )

    # ---- Mutation ------------------------------------------------- #

    def add_event(
        self,
        event: str,
        actor: Optional[str] = None,
        source_memories: Optional[List[str]] = None,
        outcome: Optional[bool] = None,
        notes: Optional[str] = None,
        **extra: Any,
    ) -> "ProvenanceRecord":
        """Append a new lineage event, bump `version`, and return self."""
        self.lineage.append(
            LineageEvent(
                event=event,
                timestamp=datetime.now(timezone.utc).isoformat(),
                actor=actor,
                source_memories=source_memories or [],
                outcome=outcome,
                notes=notes,
                extra=extra,
            )
        )
        self.version += 1
        return self

    def mark_consolidated(
        self,
        source_memory_ids: List[str],
        actor: str = "consolidation_worker",
    ) -> "ProvenanceRecord":
        """Shorthand for a 'consolidated' lineage event."""
        return self.add_event(
            "consolidated",
            actor=actor,
            source_memories=source_memory_ids,
        )

    def mark_verified(
        self,
        success: bool,
        actor: str = "system",
        notes: Optional[str] = None,
    ) -> "ProvenanceRecord":
        """Shorthand for a 'verified' lineage event carrying the outcome."""
        return self.add_event("verified", actor=actor, outcome=success, notes=notes)

    def mark_contradicted(
        self,
        contradiction_group_id: str,
        actor: str = "contradiction_detector",
    ) -> "ProvenanceRecord":
        """Shorthand for a 'contradicted' event (group id lands in `extra`)."""
        return self.add_event(
            "contradicted",
            actor=actor,
            contradiction_group_id=contradiction_group_id,
        )

    # ---- Serialization -------------------------------------------- #

    def to_dict(self) -> Dict[str, Any]:
        """Serialize the full record for storage in node metadata."""
        return {
            "origin": self.origin.to_dict(),
            "lineage": [evt.to_dict() for evt in self.lineage],
            "version": self.version,
            "confidence_source": self.confidence_source,
        }

    @classmethod
    def from_dict(cls, d: Dict[str, Any]) -> "ProvenanceRecord":
        """Rebuild a record from to_dict() output; tolerates missing keys."""
        return cls(
            origin=ProvenanceOrigin.from_dict(d.get("origin", {"type": "observation"})),
            lineage=[LineageEvent.from_dict(item) for item in d.get("lineage", [])],
            version=d.get("version", 1),
            confidence_source=d.get("confidence_source", "bayesian_ltp"),
        )

    # ---- Helpers -------------------------------------------------- #

    @property
    def created_at(self) -> str:
        """ISO timestamp of the 'created' event (origin timestamp as fallback)."""
        created = next(
            (evt.timestamp for evt in self.lineage if evt.event == "created"),
            None,
        )
        return created if created is not None else self.origin.timestamp

    @property
    def last_event(self) -> Optional[LineageEvent]:
        """Most recent lineage event, or None when the lineage is empty."""
        if not self.lineage:
            return None
        return self.lineage[-1]

    def is_contradicted(self) -> bool:
        """True if any lineage event flags a contradiction."""
        return any(evt.event == "contradicted" for evt in self.lineage)

    def is_verified(self) -> bool:
        """True if at least one verification event succeeded."""
        return any(
            evt.event == "verified" and evt.outcome is True for evt in self.lineage
        )

    def __repr__(self) -> str:
        return (
            f"ProvenanceRecord(origin_type={self.origin.type!r}, "
            f"version={self.version}, events={len(self.lineage)})"
        )
src/mnemocore/core/pulse.py ADDED
@@ -0,0 +1,110 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Pulse Heartbeat Loop
3
+ ====================
4
+ The central background orchestrator that binds together the AGI cognitive cycles.
5
+ Triggers working memory maintenance, episodic sequence linking, gap tracking, and subconscious inferences.
6
+ """
7
+
8
+ from typing import Optional
9
+ from enum import Enum
10
+ import threading
11
+ import asyncio
12
+ import logging
13
+ import traceback
14
+ from datetime import datetime
15
+
16
+ logger = logging.getLogger(__name__)
17
+
18
+
19
# Names of the cognitive-cycle phases executed by each PulseLoop tick
# (declared via the functional Enum API; members/values are the contract).
PulseTick = Enum(
    "PulseTick",
    {
        "WM_MAINTENANCE": "wm_maintenance",
        "EPISODIC_CHAINING": "episodic_chaining",
        "SEMANTIC_REFRESH": "semantic_refresh",
        "GAP_DETECTION": "gap_detection",
        "INSIGHT_GENERATION": "insight_generation",
        "PROCEDURE_REFINEMENT": "procedure_refinement",
        "META_SELF_REFLECTION": "meta_self_reflection",
    },
)
+
28
+
29
class PulseLoop:
    """
    Background heartbeat that drives the cognitive maintenance cycles.

    Each tick walks the PulseTick phases in a fixed order. Only working-memory
    maintenance does real work so far; the remaining phases are logging stubs.
    """

    def __init__(self, container, config):
        """
        Args:
            container: The fully built DI Container containing all memory sub-services.
            config: Specifically the `config.pulse` section settings.
        """
        self.container = container
        self.config = config
        self._running = False
        # NOTE(review): nothing in this class assigns _task; a caller is
        # expected to set it when scheduling start(), otherwise stop() only
        # flips the _running flag.
        self._task: Optional[asyncio.Task] = None

    async def start(self) -> None:
        """
        Run the pulse orchestrator until stop() is called.

        Honors `config.enabled` and ticks every `config.interval_seconds`
        (default 30s), subtracting the time the tick itself took. Errors in a
        tick are logged and do not kill the loop; cancellation exits cleanly.
        """
        if not getattr(self.config, "enabled", False):
            logger.info("Pulse loop is disabled via configuration.")
            return

        self._running = True
        interval = getattr(self.config, "interval_seconds", 30)
        logger.info(f"Starting AGI Pulse Loop (interval={interval}s).")

        # FIX: measure elapsed time with the event loop's monotonic clock.
        # The previous datetime.utcnow() delta is wall-clock based — NTP/clock
        # jumps could skew the computed sleep — and utcnow() is deprecated
        # since Python 3.12.
        clock = asyncio.get_running_loop().time
        while self._running:
            start_time = clock()
            try:
                await self.tick()
            except asyncio.CancelledError:
                break
            except Exception as e:
                logger.error(f"Error during Pulse tick: {e}", exc_info=True)

            elapsed = clock() - start_time
            # Never sleep less than 0.1s so a slow tick can't starve the loop.
            sleep_time = max(0.1, interval - elapsed)
            await asyncio.sleep(sleep_time)

    def stop(self) -> None:
        """Gracefully interrupt and unbind the Pulse loop."""
        self._running = False
        if self._task and not self._task.done():
            self._task.cancel()
        logger.info("AGI Pulse Loop stopped.")

    async def tick(self) -> None:
        """Execute a full iteration across the cognitive architecture planes."""
        await self._wm_maintenance()
        await self._episodic_chaining()
        await self._semantic_refresh()
        await self._gap_detection()
        await self._insight_generation()
        await self._procedure_refinement()
        await self._meta_self_reflection()

    async def _wm_maintenance(self) -> None:
        """Prune overloaded short-term buffers and cull expired items."""
        if hasattr(self.container, "working_memory") and self.container.working_memory:
            self.container.working_memory.prune_all()
        logger.debug(f"Pulse: [{PulseTick.WM_MAINTENANCE.value}] Executed.")

    async def _episodic_chaining(self) -> None:
        """Retroactively verify event streams and apply temporal links between episodic contexts."""
        logger.debug(f"Pulse: [{PulseTick.EPISODIC_CHAINING.value}] Stubbed.")

    async def _semantic_refresh(self) -> None:
        """Prompt Qdrant abstractions or run `semantic_consolidation` loops over episodic data."""
        logger.debug(f"Pulse: [{PulseTick.SEMANTIC_REFRESH.value}] Stubbed.")

    async def _gap_detection(self) -> None:
        """Unearth missing knowledge vectors (GapDetector integration)."""
        logger.debug(f"Pulse: [{PulseTick.GAP_DETECTION.value}] Stubbed.")

    async def _insight_generation(self) -> None:
        """Forward memory patterns to LLM for spontaneous inference generation."""
        logger.debug(f"Pulse: [{PulseTick.INSIGHT_GENERATION.value}] Stubbed.")

    async def _procedure_refinement(self) -> None:
        """Modify procedure reliabilities directly depending on episode occurrences."""
        logger.debug(f"Pulse: [{PulseTick.PROCEDURE_REFINEMENT.value}] Stubbed.")

    async def _meta_self_reflection(self) -> None:
        """Collate macro anomalies and submit SelfImprovementProposals."""
        logger.debug(f"Pulse: [{PulseTick.META_SELF_REFLECTION.value}] Stubbed.")
110
+
src/mnemocore/core/qdrant_store.py CHANGED
@@ -6,7 +6,7 @@ Provides async access to Qdrant for vector storage and similarity search.
6
  Phase 4.3: Temporal Recall - supports time-based filtering and indexing.
7
  """
8
 
9
- from typing import List, Any, Optional, Tuple
10
  from datetime import datetime
11
  import asyncio
12
 
@@ -100,7 +100,7 @@ class QdrantStore:
100
  collection_name=self.collection_hot,
101
  vectors_config=models.VectorParams(
102
  size=self.dim,
103
- distance=models.Distance.COSINE,
104
  on_disk=False
105
  ),
106
  quantization_config=quantization_config,
@@ -118,7 +118,7 @@ class QdrantStore:
118
  collection_name=self.collection_warm,
119
  vectors_config=models.VectorParams(
120
  size=self.dim,
121
- distance=models.Distance.MANHATTAN,
122
  on_disk=True
123
  ),
124
  quantization_config=quantization_config,
@@ -169,6 +169,7 @@ class QdrantStore:
169
  limit: int = 5,
170
  score_threshold: float = 0.0,
171
  time_range: Optional[Tuple[datetime, datetime]] = None,
 
172
  ) -> List[models.ScoredPoint]:
173
  """
174
  Async semantic search.
@@ -189,30 +190,51 @@ class QdrantStore:
189
  as search failures should not crash the calling code.
190
  """
191
  try:
192
- # Build time filter if provided (Phase 4.3)
193
- query_filter = None
194
  if time_range:
195
  start_ts = int(time_range[0].timestamp())
196
  end_ts = int(time_range[1].timestamp())
197
- query_filter = models.Filter(
198
- must=[
199
- models.FieldCondition(
200
- key="unix_timestamp",
201
- range=models.Range(
202
- gte=start_ts,
203
- lte=end_ts,
204
- ),
205
  ),
206
- ]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
207
  )
208
 
209
  return await qdrant_breaker.call(
210
- self.client.search,
211
  collection_name=collection,
212
- query_vector=query_vector,
213
  limit=limit,
214
  score_threshold=score_threshold,
215
  query_filter=query_filter,
 
216
  )
217
  except CircuitOpenError:
218
  logger.warning(f"Qdrant search blocked for {collection}: circuit breaker open")
 
6
  Phase 4.3: Temporal Recall - supports time-based filtering and indexing.
7
  """
8
 
9
+ from typing import List, Any, Optional, Tuple, Dict
10
  from datetime import datetime
11
  import asyncio
12
 
 
100
  collection_name=self.collection_hot,
101
  vectors_config=models.VectorParams(
102
  size=self.dim,
103
+ distance=models.Distance.DOT,
104
  on_disk=False
105
  ),
106
  quantization_config=quantization_config,
 
118
  collection_name=self.collection_warm,
119
  vectors_config=models.VectorParams(
120
  size=self.dim,
121
+ distance=models.Distance.DOT,
122
  on_disk=True
123
  ),
124
  quantization_config=quantization_config,
 
169
  limit: int = 5,
170
  score_threshold: float = 0.0,
171
  time_range: Optional[Tuple[datetime, datetime]] = None,
172
+ metadata_filter: Optional[Dict[str, Any]] = None,
173
  ) -> List[models.ScoredPoint]:
174
  """
175
  Async semantic search.
 
190
  as search failures should not crash the calling code.
191
  """
192
  try:
193
+ must_conditions = []
 
194
  if time_range:
195
  start_ts = int(time_range[0].timestamp())
196
  end_ts = int(time_range[1].timestamp())
197
+ must_conditions.append(
198
+ models.FieldCondition(
199
+ key="unix_timestamp",
200
+ range=models.Range(
201
+ gte=start_ts,
202
+ lte=end_ts,
 
 
203
  ),
204
+ )
205
+ )
206
+
207
+ if metadata_filter:
208
+ for k, v in metadata_filter.items():
209
+ must_conditions.append(
210
+ models.FieldCondition(
211
+ key=k,
212
+ match=models.MatchValue(value=v)
213
+ )
214
+ )
215
+
216
+ if must_conditions:
217
+ query_filter = models.Filter(must=must_conditions)
218
+
219
+ # Support for Binary Quantization rescoring (BUG-04)
220
+ search_params = None
221
+ if self.binary_quantization:
222
+ search_params = models.SearchParams(
223
+ quantization=models.QuantizationSearchParams(
224
+ ignore=False,
225
+ rescore=True,
226
+ oversampling=2.0
227
+ )
228
  )
229
 
230
  return await qdrant_breaker.call(
231
+ self.client.query_points,
232
  collection_name=collection,
233
+ query=query_vector,
234
  limit=limit,
235
  score_threshold=score_threshold,
236
  query_filter=query_filter,
237
+ search_params=search_params,
238
  )
239
  except CircuitOpenError:
240
  logger.warning(f"Qdrant search blocked for {collection}: circuit breaker open")
src/mnemocore/core/semantic_consolidation.py CHANGED
@@ -37,6 +37,7 @@ from loguru import logger
37
  from .binary_hdv import BinaryHDV, majority_bundle
38
  from .config import get_config
39
  from .node import MemoryNode
 
40
 
41
 
42
  # ------------------------------------------------------------------ #
@@ -266,6 +267,18 @@ class SemanticConsolidationWorker:
266
  medoid_node.metadata["proto_updated_at"] = datetime.now(timezone.utc).isoformat()
267
  proto_count += 1
268
 
 
 
 
 
 
 
 
 
 
 
 
 
269
  elapsed = time.monotonic() - t0
270
  self.last_run = datetime.now(timezone.utc)
271
  self.stats = {
 
37
  from .binary_hdv import BinaryHDV, majority_bundle
38
  from .config import get_config
39
  from .node import MemoryNode
40
+ from .provenance import ProvenanceRecord
41
 
42
 
43
  # ------------------------------------------------------------------ #
 
267
  medoid_node.metadata["proto_updated_at"] = datetime.now(timezone.utc).isoformat()
268
  proto_count += 1
269
 
270
+ # Phase 5.0: record consolidation in provenance lineage
271
+ source_ids = [n.id for n in member_nodes if n.id != medoid_node.id]
272
+ if medoid_node.provenance is None:
273
+ medoid_node.provenance = ProvenanceRecord.new(
274
+ origin_type="consolidation",
275
+ actor="consolidation_worker",
276
+ )
277
+ medoid_node.provenance.mark_consolidated(
278
+ source_memory_ids=source_ids,
279
+ actor="consolidation_worker",
280
+ )
281
+
282
  elapsed = time.monotonic() - t0
283
  self.last_run = datetime.now(timezone.utc)
284
  self.stats = {