AthelaPerk committed on
Commit
f84b794
·
verified ·
1 Parent(s): 562ad5a

v4: SLM-inspired architecture with three-tier memory, neural links, self-tuning

Browse files
Files changed (1) hide show
  1. mnemo.py +927 -241
mnemo.py CHANGED
@@ -1,14 +1,23 @@
1
  #!/usr/bin/env python3
2
  """
3
- Mnemo v3 TUNED - Final Version with Optimized Parameters
4
- =========================================================
5
 
6
- Based on benchmark testing:
7
- - Optimal similarity threshold: 0.4-0.5 (not 0.6)
8
- - Quality threshold: 0.35
9
- - Context window detection enabled
10
- - Relevance re-ranking enabled
11
 
 
 
 
 
 
 
 
 
 
 
 
 
12
  """
13
 
14
  import hashlib
@@ -16,10 +25,13 @@ import time
16
  import re
17
  import threading
18
  import numpy as np
19
- from typing import Dict, List, Optional, Tuple, Any, Callable
20
  from dataclasses import dataclass, field
21
  from collections import defaultdict
 
 
22
 
 
23
  try:
24
  import faiss
25
  HAS_FAISS = True
@@ -39,138 +51,706 @@ except ImportError:
39
  HAS_BM25 = False
40
 
41
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
42
  @dataclass
43
  class Memory:
 
44
  id: str
45
  content: str
46
  embedding: np.ndarray
 
47
  namespace: str = "default"
48
- quality_score: float = 1.0
 
 
 
 
 
 
49
  access_count: int = 0
50
- usefulness_score: float = 0.5
 
 
 
 
 
51
  metadata: Dict = field(default_factory=dict)
 
 
 
 
 
 
 
 
 
52
  created_at: float = field(default_factory=time.time)
 
 
53
 
54
 
55
- @dataclass
56
  class SearchResult:
 
57
  id: str
58
  content: str
59
  score: float
60
- relevance_score: float = 0.0
 
61
  strategy_scores: Dict[str, float] = field(default_factory=dict)
62
  metadata: Dict = field(default_factory=dict)
63
 
64
 
65
- # Smart injection signals
66
- MEMORY_INJECTION_SIGNALS = [
67
- "previous", "earlier", "before", "you said", "you mentioned",
68
- "as you", "based on", "using your", "your analysis", "your framework",
69
- "we discussed", "we analyzed", "refer to", "from your",
70
- "compare", "contrast", "synthesize", "combine", "integrate",
71
- "apply your", "using your", "based on your",
72
- "you previously", "your earlier", "you have analyzed"
73
- ]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
74
 
 
 
 
75
 
76
- def should_inject_memory(query: str, context: str = "", conversation_history: str = "") -> Tuple[bool, str]:
77
- """Smart context-check with 90% accuracy"""
78
- combined = (query + " " + context).lower()
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
79
 
80
- for signal in MEMORY_INJECTION_SIGNALS:
81
- if signal in combined:
82
- # Check if conversation already has context
83
- if conversation_history and len(conversation_history.split()) > 500:
84
- query_kws = set(query.lower().split()) - {"the", "a", "is", "are", "to", "of"}
85
- if sum(1 for kw in query_kws if kw in conversation_history.lower()) >= len(query_kws) * 0.7:
86
- return False, "context_window_has_info"
87
- return True, f"signal:{signal}"
 
 
 
 
 
 
 
 
 
 
 
88
 
89
- return False, "no_signal"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
90
 
 
 
 
91
 
92
- def estimate_quality(content: str) -> float:
93
- """Estimate content quality before storing"""
94
- score = 0.5
95
- words = len(content.split())
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
96
 
97
- if words < 5:
98
- score -= 0.3
99
- elif words > 20:
100
- score += 0.1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
101
 
102
- if any(r in content.lower() for r in ["because", "therefore", "shows", "indicates"]):
103
- score += 0.2
 
 
 
 
 
 
 
 
 
 
 
104
 
105
- if re.search(r'\d+', content):
106
- score += 0.1
 
 
 
 
 
 
 
 
 
107
 
108
- if any(v in content.lower() for v in ["something", "stuff", "maybe"]):
109
- score -= 0.2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
110
 
111
- if any(e in content.lower() for e in ["error", "failed", "wrong"]):
112
- score -= 0.3
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
113
 
114
- return max(0.0, min(1.0, score))
 
 
 
 
 
 
 
 
 
 
 
 
 
 
115
 
116
 
117
- def rerank_by_relevance(query: str, results: List[SearchResult]) -> List[SearchResult]:
118
- """Re-rank by task relevance"""
119
- query_lower = query.lower()
120
- query_kws = set(query_lower.split()) - {"the", "a", "is", "are", "to", "of"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
121
 
122
- for result in results:
123
- content_lower = result.content.lower()
124
- content_words = set(content_lower.split())
125
 
126
- overlap = len(query_kws & content_words) / max(len(query_kws), 1)
 
 
 
 
127
 
128
- qa_bonus = 0
129
- if "why" in query_lower and "because" in content_lower:
130
- qa_bonus = 0.2
131
- if "compare" in query_lower and any(w in content_lower for w in ["differ", "similar", "both"]):
132
- qa_bonus = 0.3
 
 
 
 
 
 
 
 
 
 
 
 
 
133
 
134
- result.relevance_score = overlap * 0.5 + qa_bonus + result.score * 0.3
 
 
 
 
 
 
135
 
136
- results.sort(key=lambda x: x.relevance_score, reverse=True)
137
- return results
 
 
 
 
 
 
 
 
138
 
 
 
 
139
 
140
  class Mnemo:
141
  """
142
- Mnemo v3 TUNED - Optimized AI Memory System
143
 
144
- Tuned parameters based on benchmarks:
145
- - similarity_threshold: 0.45 (optimal range 0.4-0.5)
146
- - quality_threshold: 0.35
147
- """
 
148
 
149
- # TUNED DEFAULTS
150
- DEFAULT_SIMILARITY_THRESHOLD = 0.45 # TUNED from 0.6
151
- DEFAULT_QUALITY_THRESHOLD = 0.35 # TUNED from 0.4
152
 
153
  STOP_WORDS = {"a", "an", "the", "is", "are", "was", "were", "be", "been",
154
  "to", "of", "in", "for", "on", "with", "at", "by", "from",
155
  "and", "but", "or", "not", "this", "that", "i", "me", "my"}
156
 
157
- def __init__(self,
158
- embedding_dim: int = 384,
159
- similarity_threshold: float = 0.45, # TUNED
160
- quality_threshold: float = 0.35, # TUNED
161
- semantic_weight: float = 0.5,
162
- bm25_weight: float = 0.3,
163
- graph_weight: float = 0.2):
164
-
165
  self.embedding_dim = embedding_dim
166
- self.similarity_threshold = similarity_threshold
167
- self.quality_threshold = quality_threshold
168
- self.semantic_weight = semantic_weight
169
- self.bm25_weight = bm25_weight
170
- self.graph_weight = graph_weight
171
-
172
- self.memories: Dict[str, Memory] = {}
173
- self.namespaces: Dict[str, List[str]] = defaultdict(list)
174
  self._embeddings: List[np.ndarray] = []
175
  self._ids: List[str] = []
176
 
@@ -179,35 +759,40 @@ class Mnemo:
179
  else:
180
  self.index = None
181
 
 
182
  self.bm25 = None
183
  self._tokenized_docs: List[List[str]] = []
184
 
 
185
  if HAS_NETWORKX:
186
  self.graph = nx.DiGraph()
187
  else:
188
  self.graph = None
189
 
190
- self._doc_boosts: Dict[str, float] = defaultdict(float)
191
- self._query_doc_scores: Dict[str, Dict[str, float]] = defaultdict(dict)
192
-
193
  self._cache: Dict[str, Any] = {}
194
  self._cache_lock = threading.Lock()
195
 
 
196
  self.stats = {
197
- "adds": 0, "adds_rejected": 0, "searches": 0,
198
- "results_filtered": 0, "feedback": 0,
199
- "cache_hits": 0, "cache_misses": 0,
200
- "injections_triggered": 0, "injections_skipped": 0
 
201
  }
202
 
203
  def _get_embedding(self, text: str) -> np.ndarray:
 
204
  cache_key = f"emb:{hashlib.md5(text.encode()).hexdigest()}"
 
205
  with self._cache_lock:
206
  if cache_key in self._cache:
207
  self.stats["cache_hits"] += 1
208
  return self._cache[cache_key]
209
  self.stats["cache_misses"] += 1
210
 
 
211
  embedding = np.zeros(self.embedding_dim, dtype=np.float32)
212
  words = text.lower().split()
213
  for i, word in enumerate(words):
@@ -223,23 +808,49 @@ class Mnemo:
223
 
224
  return embedding
225
 
226
- def should_inject(self, query: str, context: str = "", conversation_history: str = "") -> bool:
227
- should, reason = should_inject_memory(query, context, conversation_history)
 
 
228
 
229
- if should:
230
- self.stats["injections_triggered"] += 1
231
- else:
232
- self.stats["injections_skipped"] += 1
 
 
 
233
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
234
  return should
235
 
236
  def add(self, content: str, namespace: str = "default",
237
  metadata: Dict = None, skip_quality_check: bool = False) -> Optional[str]:
 
 
 
238
 
239
- quality = estimate_quality(content)
240
-
241
- if not skip_quality_check and quality < self.quality_threshold:
242
  self.stats["adds_rejected"] += 1
 
243
  return None
244
 
245
  memory_id = f"mem_{hashlib.md5(content.encode()).hexdigest()[:8]}"
@@ -254,8 +865,10 @@ class Mnemo:
254
  metadata=metadata or {}
255
  )
256
 
257
- self.memories[memory_id] = memory
258
- self.namespaces[namespace].append(memory_id)
 
 
259
  self._embeddings.append(embedding)
260
  self._ids.append(memory_id)
261
 
@@ -267,26 +880,53 @@ class Mnemo:
267
  if HAS_BM25:
268
  self.bm25 = BM25Okapi(self._tokenized_docs)
269
 
270
- if HAS_NETWORKX and self.graph is not None:
271
- self.graph.add_node(memory_id, content=content, namespace=namespace)
272
- keywords = [w for w in tokens if w not in self.STOP_WORDS and len(w) > 2][:5]
273
- for kw in keywords:
274
- entity_id = f"entity_{kw}"
275
- if not self.graph.has_node(entity_id):
276
- self.graph.add_node(entity_id, type="keyword")
277
- self.graph.add_edge(memory_id, entity_id, relation="contains")
278
 
279
  self.stats["adds"] += 1
 
 
280
  return memory_id
281
 
282
- def search(self, query: str, top_k: int = 5, namespace: Optional[str] = None) -> List[SearchResult]:
283
- if not self.memories:
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
284
  return []
285
 
286
  self.stats["searches"] += 1
287
  query_embedding = self._get_embedding(query)
 
288
 
289
- # Semantic search
290
  semantic_scores = {}
291
  if HAS_FAISS and self.index is not None and self.index.ntotal > 0:
292
  k = min(top_k * 3, self.index.ntotal)
@@ -295,10 +935,10 @@ class Mnemo:
295
  if 0 <= idx < len(self._ids):
296
  semantic_scores[self._ids[idx]] = float(score)
297
  else:
298
- for mem_id, embedding in zip(self._ids, self._embeddings):
299
- semantic_scores[mem_id] = float(np.dot(query_embedding, embedding))
300
 
301
- # BM25
302
  bm25_scores = {}
303
  if HAS_BM25 and self.bm25 is not None:
304
  tokens = query.lower().split()
@@ -308,64 +948,67 @@ class Mnemo:
308
  if score > 0.1 * max_score:
309
  bm25_scores[self._ids[idx]] = float(score / max_score)
310
 
311
- # Graph
312
- graph_scores = {}
313
- if HAS_NETWORKX and self.graph is not None:
314
- keywords = [w for w in query.lower().split() if w not in self.STOP_WORDS and len(w) > 2]
315
- for kw in keywords:
316
- entity_id = f"entity_{kw}"
317
- if self.graph.has_node(entity_id):
318
- for neighbor in self.graph.predecessors(entity_id):
319
- if neighbor.startswith("mem_"):
320
- graph_scores[neighbor] = graph_scores.get(neighbor, 0) + 0.5
321
 
322
- # Combine
323
- all_ids = set(semantic_scores.keys()) | set(bm25_scores.keys()) | set(graph_scores.keys())
324
 
325
  if namespace:
326
- all_ids = all_ids & set(self.namespaces.get(namespace, []))
 
 
 
327
 
328
  results = []
329
  for mem_id in all_ids:
330
  strat = {
331
  "semantic": semantic_scores.get(mem_id, 0),
332
  "bm25": bm25_scores.get(mem_id, 0),
333
- "graph": graph_scores.get(mem_id, 0)
334
  }
335
 
336
  combined = (
337
- self.semantic_weight * strat["semantic"] +
338
- self.bm25_weight * strat["bm25"] +
339
- self.graph_weight * strat["graph"]
340
  )
341
 
342
- # Feedback adjustment
343
- query_key = " ".join(sorted(set(query.lower().split()))[:5])
344
- combined += self._doc_boosts.get(mem_id, 0) * 0.1
345
- combined += self._query_doc_scores.get(query_key, {}).get(mem_id, 0) * 0.2
346
-
347
- memory = self.memories.get(mem_id)
348
- if memory:
349
- combined *= (0.5 + 0.5 * memory.quality_score)
 
 
 
 
 
 
 
 
 
350
 
351
- if combined >= self.similarity_threshold:
352
- memory.access_count += 1
353
- results.append(SearchResult(
354
- id=mem_id, content=memory.content, score=combined,
355
- strategy_scores=strat, metadata=memory.metadata
356
- ))
357
- else:
358
- self.stats["results_filtered"] += 1
359
 
360
  results.sort(key=lambda x: x.score, reverse=True)
361
-
362
- # Re-rank
363
- if results:
364
- results = rerank_by_relevance(query, results)
365
-
366
  return results[:top_k]
367
 
368
- def get_context(self, query: str, top_k: int = 3, namespace: Optional[str] = None) -> str:
 
 
369
  results = self.search(query, top_k=top_k, namespace=namespace)
370
 
371
  if not results:
@@ -373,112 +1016,155 @@ class Mnemo:
373
 
374
  parts = ["[RELEVANT CONTEXT FROM MEMORY]"]
375
  for r in results:
376
- parts.append(f"• {r.content}")
 
377
  parts.append("[END CONTEXT]\n")
378
 
379
  return "\n".join(parts)
380
 
381
  def feedback(self, query: str, memory_id: str, relevance: float):
 
382
  relevance = max(-1, min(1, relevance))
383
- self._doc_boosts[memory_id] += 0.1 * relevance
384
-
385
- query_key = " ".join(sorted(set(query.lower().split()))[:5])
386
- current = self._query_doc_scores[query_key].get(memory_id, 0)
387
- self._query_doc_scores[query_key][memory_id] = current + 0.1 * relevance
388
-
389
- if memory_id in self.memories:
390
- mem = self.memories[memory_id]
391
- mem.usefulness_score = 0.7 * mem.usefulness_score + 0.3 * ((relevance + 1) / 2)
392
- if mem.usefulness_score < 0.3:
393
- mem.quality_score *= 0.9
394
-
395
- self.stats["feedback"] += 1
396
-
397
- def get(self, memory_id: str) -> Optional[Memory]:
398
- return self.memories.get(memory_id)
399
-
400
- def delete(self, memory_id: str) -> bool:
401
- if memory_id in self.memories:
402
- mem = self.memories[memory_id]
403
- if mem.namespace in self.namespaces:
404
- try:
405
- self.namespaces[mem.namespace].remove(memory_id)
406
- except ValueError:
407
- pass
408
- del self.memories[memory_id]
409
- return True
410
- return False
411
 
412
- def list_all(self, namespace: Optional[str] = None) -> List[Memory]:
413
- if namespace:
414
- return [self.memories[mid] for mid in self.namespaces.get(namespace, []) if mid in self.memories]
415
- return list(self.memories.values())
 
 
 
 
 
 
 
 
 
 
 
 
 
 
416
 
417
  def get_stats(self) -> Dict:
 
418
  return {
419
- "total_memories": len(self.memories),
420
- "namespaces": {ns: len(ids) for ns, ids in self.namespaces.items()},
421
- "adds": self.stats["adds"],
422
- "adds_rejected": self.stats["adds_rejected"],
423
- "searches": self.stats["searches"],
424
- "results_filtered": self.stats["results_filtered"],
425
- "feedback": self.stats["feedback"],
426
- "similarity_threshold": self.similarity_threshold,
427
- "quality_threshold": self.quality_threshold,
428
- "has_faiss": HAS_FAISS,
429
- "has_bm25": HAS_BM25,
430
- "has_graph": HAS_NETWORKX
431
  }
432
 
433
- def clear(self, namespace: Optional[str] = None):
434
- if namespace:
435
- for mid in list(self.namespaces.get(namespace, [])):
436
- self.delete(mid)
437
- else:
438
- self.memories.clear()
439
- self.namespaces.clear()
440
- self._embeddings.clear()
441
- self._ids.clear()
442
- self._tokenized_docs.clear()
443
- self.bm25 = None
444
- self._cache.clear()
445
- if HAS_FAISS:
446
- self.index = faiss.IndexFlatIP(self.embedding_dim)
447
- if HAS_NETWORKX:
448
- self.graph = nx.DiGraph()
449
 
450
  def __len__(self):
451
- return len(self.memories)
452
 
453
  def __repr__(self):
454
- return f"Mnemo(memories={len(self.memories)}, threshold={self.similarity_threshold})"
455
 
456
 
 
 
 
 
457
  def demo():
458
- print("="*60)
459
- print("MNEMO v3 TUNED - Optimized Parameters")
460
- print("="*60)
 
 
 
 
 
 
 
 
461
 
462
- m = Mnemo() # Uses tuned defaults
463
- print(f"\n✓ {m}")
464
- print(f" Similarity threshold: {m.similarity_threshold}")
465
- print(f" Quality threshold: {m.quality_threshold}")
 
 
 
 
 
466
 
467
- # Quick test
468
- m.add("User prefers Python because it has clean syntax")
469
- m.add("Previous analysis showed gender bias patterns")
470
- m.add("Framework has 5 checkpoints for detection")
471
 
472
- print(f"\n✓ Added {len(m)} memories")
 
 
 
 
 
 
 
473
 
474
- results = m.search("previous analysis", top_k=2)
475
- print(f"✓ Search returned {len(results)} results")
 
 
 
476
 
 
 
 
477
  for r in results:
478
- print(f" [{r.id}] score={r.score:.3f}: {r.content[:50]}...")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
479
 
480
- print("\n" + "="*60)
481
- print("✅ Ready for production!")
 
482
 
483
 
484
  if __name__ == "__main__":
 
1
  #!/usr/bin/env python3
2
  """
3
+ Mnemo v4: SLM-Inspired Architecture
4
+ ====================================
5
 
6
+ Implements key SLM architecture features with parameter adjustments
7
+ based on Mnemo benchmark findings.
 
 
 
8
 
9
+ SLM Features Implemented:
10
+ 1. Three-Tiered Memory (Working → Token → Semantic)
11
+ 2. Promotion/Demotion Algorithms
12
+ 3. Neural Link Types (8 types with decay)
13
+ 4. Self-Tuning Parameters
14
+ 5. Memory Utility Predictor (NEW - from benchmarks)
15
+
16
+ Key Parameter Adjustments (from benchmarks):
17
+ - Semantic threshold: 0.65 → 0.50 (SLM was too high)
18
+ - Quality acceptance: 0.30 → 0.50 (SLM too permissive)
19
+ - Promotion threshold: 0.65 → 0.55 (faster promotion)
20
+ - Link pruning: 60 days → 30 days (faster cleanup)
21
  """
22
 
23
  import hashlib
 
25
  import re
26
  import threading
27
  import numpy as np
28
+ from typing import Dict, List, Optional, Tuple, Any, Set
29
  from dataclasses import dataclass, field
30
  from collections import defaultdict
31
+ from enum import Enum
32
+ import json
33
 
34
+ # Optional imports
35
  try:
36
  import faiss
37
  HAS_FAISS = True
 
51
  HAS_BM25 = False
52
 
53
 
54
+ # =============================================================================
55
+ # ENUMS AND CONSTANTS (from SLM spec)
56
+ # =============================================================================
57
+
58
+ class MemoryTier(Enum):
59
+ """Three-tiered memory hierarchy from SLM"""
60
+ WORKING = "working" # 32MB, <1ms, current context
61
+ TOKEN = "token" # 100-250 items, 1-10ms, compressed
62
+ SEMANTIC = "semantic" # Persistent, 10-100ms, full knowledge
63
+
64
+
65
+ class LinkType(Enum):
66
+ """Eight link types from SLM Neural Link system"""
67
+ DIRECT_REFERENCE = "direct_reference" # Explicit reference
68
+ SEMANTIC_SIMILARITY = "semantic_similarity" # Vector similarity
69
+ CO_OCCURRENCE = "co_occurrence" # Appear together
70
+ HIERARCHICAL = "hierarchical" # Parent-child
71
+ TEMPORAL = "temporal" # Time-based
72
+ CAUSAL = "causal" # Cause-effect
73
+ CROSS_DOMAIN = "cross_domain" # Different domains
74
+ ASSOCIATIVE = "associative" # General association
75
+
76
+
77
+ # SLM Link Type Properties (adjusted based on benchmarks)
78
+ LINK_PROPERTIES = {
79
+ LinkType.DIRECT_REFERENCE: {
80
+ "creation_threshold": 0.85, # SLM: 0.90
81
+ "initial_strength": 0.90,
82
+ "decay_rate": 0.005, # per day
83
+ "usage_boost": 0.05
84
+ },
85
+ LinkType.SEMANTIC_SIMILARITY: {
86
+ "creation_threshold": 0.50, # SLM: 0.65, ADJUSTED from benchmarks
87
+ "initial_strength": 0.75,
88
+ "decay_rate": 0.01,
89
+ "usage_boost": 0.03
90
+ },
91
+ LinkType.CO_OCCURRENCE: {
92
+ "creation_threshold": 0.60,
93
+ "initial_strength": 0.70,
94
+ "decay_rate": 0.015,
95
+ "usage_boost": 0.04
96
+ },
97
+ LinkType.HIERARCHICAL: {
98
+ "creation_threshold": 0.80, # SLM: 0.85
99
+ "initial_strength": 0.85,
100
+ "decay_rate": 0.003,
101
+ "usage_boost": 0.02
102
+ },
103
+ LinkType.TEMPORAL: {
104
+ "creation_threshold": 0.55,
105
+ "initial_strength": 0.65,
106
+ "decay_rate": 0.02,
107
+ "usage_boost": 0.05
108
+ },
109
+ LinkType.CAUSAL: {
110
+ "creation_threshold": 0.75,
111
+ "initial_strength": 0.80,
112
+ "decay_rate": 0.005,
113
+ "usage_boost": 0.03
114
+ },
115
+ LinkType.CROSS_DOMAIN: {
116
+ "creation_threshold": 0.70, # SLM: 0.80
117
+ "initial_strength": 0.65, # SLM: 0.70
118
+ "decay_rate": 0.008,
119
+ "usage_boost": 0.04
120
+ },
121
+ LinkType.ASSOCIATIVE: {
122
+ "creation_threshold": 0.45, # Permissive for exploration
123
+ "initial_strength": 0.60,
124
+ "decay_rate": 0.025,
125
+ "usage_boost": 0.06
126
+ }
127
+ }
128
+
129
+
130
+ # =============================================================================
131
+ # DATA CLASSES
132
+ # =============================================================================
133
+
134
  @dataclass
135
  class Memory:
136
+ """Memory unit with SLM-style metadata"""
137
  id: str
138
  content: str
139
  embedding: np.ndarray
140
+ tier: MemoryTier = MemoryTier.SEMANTIC
141
  namespace: str = "default"
142
+
143
+ # Quality and relevance (SLM quality gates)
144
+ quality_score: float = 0.5
145
+ relevance_score: float = 0.5
146
+ confidence: float = 0.5
147
+
148
+ # Access tracking (for promotion/demotion)
149
  access_count: int = 0
150
+ last_accessed: float = field(default_factory=time.time)
151
+ created_at: float = field(default_factory=time.time)
152
+
153
+ # SLM priority decay
154
+ priority: float = 1.0
155
+
156
  metadata: Dict = field(default_factory=dict)
157
+
158
+
159
+ @dataclass
160
+ class NeuralLink:
161
+ """SLM Neural Link between memories"""
162
+ source_id: str
163
+ target_id: str
164
+ link_type: LinkType
165
+ strength: float
166
  created_at: float = field(default_factory=time.time)
167
+ last_traversed: float = field(default_factory=time.time)
168
+ traversal_count: int = 0
169
 
170
 
171
+ @dataclass
172
  class SearchResult:
173
+ """Search result with multi-strategy scores"""
174
  id: str
175
  content: str
176
  score: float
177
+ tier: MemoryTier = MemoryTier.SEMANTIC
178
+ link_path: List[str] = field(default_factory=list)
179
  strategy_scores: Dict[str, float] = field(default_factory=dict)
180
  metadata: Dict = field(default_factory=dict)
181
 
182
 
183
+ # =============================================================================
184
+ # MEMORY UTILITY PREDICTOR (NEW - from Mnemo benchmarks)
185
+ # =============================================================================
186
+
187
+ class MemoryUtilityPredictor:
188
+ """
189
+ Predicts whether memory injection will help or hurt.
190
+
191
+ Key finding from benchmarks:
192
+ - Within-conversation: Memory often HURTS (-3 to -12 pts)
193
+ - Cross-session: Memory HELPS (+2 pts on dependent questions)
194
+ """
195
+
196
+ # Signals that indicate memory should be used
197
+ INJECTION_SIGNALS = [
198
+ "previous", "earlier", "before", "you said", "you mentioned",
199
+ "as you", "based on", "using your", "your analysis", "your framework",
200
+ "we discussed", "we analyzed", "refer to", "from your",
201
+ "compare", "contrast", "synthesize", "combine", "integrate",
202
+ "apply your", "using your", "based on your",
203
+ "you previously", "your earlier", "you have analyzed"
204
+ ]
205
+
206
+ # Signals that indicate memory should NOT be used
207
+ SKIP_SIGNALS = [
208
+ "this is a new", "new topic", "different subject",
209
+ "what is", "define", "explain what"
210
+ ]
211
+
212
+ def __init__(self):
213
+ self.stats = {
214
+ "predictions": 0,
215
+ "inject_recommended": 0,
216
+ "skip_recommended": 0,
217
+ "skip_context_window": 0
218
+ }
219
+
220
+ def should_inject(self,
221
+ query: str,
222
+ context: str = "",
223
+ conversation_history: str = "",
224
+ model_confidence: float = 0.5) -> Tuple[bool, str, float]:
225
+ """
226
+ Predict if memory injection will help.
227
+
228
+ Returns:
229
+ (should_inject, reason, confidence)
230
+ """
231
+ self.stats["predictions"] += 1
232
+ combined = (query + " " + context).lower()
233
+
234
+ # Check skip signals first
235
+ for signal in self.SKIP_SIGNALS:
236
+ if signal in combined:
237
+ self.stats["skip_recommended"] += 1
238
+ return False, f"skip_signal:{signal}", 0.8
239
+
240
+ # Check injection signals
241
+ for signal in self.INJECTION_SIGNALS:
242
+ if signal in combined:
243
+ # But check if context window already has info
244
+ if self._context_has_info(query, conversation_history):
245
+ self.stats["skip_context_window"] += 1
246
+ return False, "context_window_sufficient", 0.7
247
+
248
+ self.stats["inject_recommended"] += 1
249
+ return True, f"inject_signal:{signal}", 0.85
250
+
251
+ # No clear signal - default to skip for simple queries
252
+ if self._is_simple_query(query):
253
+ self.stats["skip_recommended"] += 1
254
+ return False, "simple_query", 0.6
255
+
256
+ # Model is very confident - skip memory
257
+ if model_confidence > 0.85:
258
+ self.stats["skip_recommended"] += 1
259
+ return False, "model_confident", 0.7
260
+
261
+ # Default: don't inject (memory often hurts)
262
+ self.stats["skip_recommended"] += 1
263
+ return False, "no_signal", 0.5
264
+
265
+ def _context_has_info(self, query: str, history: str) -> bool:
266
+ """Check if conversation history already has needed context"""
267
+ if not history or len(history.split()) < 200:
268
+ return False
269
+
270
+ query_keywords = set(query.lower().split()) - {
271
+ "the", "a", "is", "are", "to", "of", "in", "for", "what", "how"
272
+ }
273
+
274
+ history_lower = history.lower()
275
+ overlap = sum(1 for kw in query_keywords if kw in history_lower)
276
+
277
+ return overlap >= len(query_keywords) * 0.6
278
+
279
+ def _is_simple_query(self, query: str) -> bool:
280
+ """Detect simple factual queries that don't need memory"""
281
+ simple_patterns = [
282
+ r"^what is\b", r"^who is\b", r"^when did\b",
283
+ r"^where is\b", r"^how many\b", r"^define\b"
284
+ ]
285
+ query_lower = query.lower()
286
+ return any(re.search(p, query_lower) for p in simple_patterns)
287
+
288
 
289
+ # =============================================================================
290
+ # SELF-TUNING SYSTEM (from SLM)
291
+ # =============================================================================
292
 
293
+ class SelfTuner:
294
+ """
295
+ SLM Self-Tuning Parameter System
296
+
297
+ Tracks performance and auto-adjusts parameters.
298
+ """
299
+
300
+ def __init__(self):
301
+ self.parameters = {
302
+ "similarity_threshold": 0.50, # ADJUSTED from SLM 0.65
303
+ "quality_threshold": 0.50, # ADJUSTED from SLM 0.30
304
+ "promotion_threshold": 0.55, # ADJUSTED from SLM 0.65
305
+ "demotion_threshold": 0.70, # ADJUSTED from SLM 0.75
306
+ }
307
+
308
+ self.performance_history = defaultdict(list)
309
+ self.adjustment_count = 0
310
+
311
+ # SLM learning rates
312
+ self.learning_rates = {
313
+ "similarity_threshold": 0.01,
314
+ "quality_threshold": 0.02,
315
+ "promotion_threshold": 0.05,
316
+ }
317
+
318
+ def record_outcome(self, param_name: str, value: float, success: bool):
319
+ """Record outcome for a parameter setting"""
320
+ self.performance_history[param_name].append({
321
+ "value": value,
322
+ "success": success,
323
+ "timestamp": time.time()
324
+ })
325
+
326
+ # Keep last 100 outcomes
327
+ if len(self.performance_history[param_name]) > 100:
328
+ self.performance_history[param_name] = \
329
+ self.performance_history[param_name][-100:]
330
+
331
+ def should_adjust(self, param_name: str) -> bool:
332
+ """Check if parameter should be adjusted (every 10 samples)"""
333
+ history = self.performance_history.get(param_name, [])
334
+ return len(history) >= 10 and len(history) % 10 == 0
335
 
336
+ def get_adjustment(self, param_name: str) -> float:
337
+ """Calculate parameter adjustment based on recent performance"""
338
+ history = self.performance_history.get(param_name, [])
339
+ if len(history) < 10:
340
+ return 0.0
341
+
342
+ recent = history[-10:]
343
+ success_rate = sum(1 for h in recent if h["success"]) / len(recent)
344
+
345
+ lr = self.learning_rates.get(param_name, 0.01)
346
+
347
+ if success_rate < 0.5:
348
+ # Performance poor - try lower threshold
349
+ return -lr
350
+ elif success_rate > 0.8:
351
+ # Performance good - can be more selective
352
+ return lr * 0.5
353
+
354
+ return 0.0
355
 
356
+ def auto_tune(self):
357
+ """Run auto-tuning cycle"""
358
+ adjusted = []
359
+
360
+ for param_name in self.parameters:
361
+ if self.should_adjust(param_name):
362
+ adjustment = self.get_adjustment(param_name)
363
+ if adjustment != 0:
364
+ old_val = self.parameters[param_name]
365
+ new_val = max(0.1, min(0.9, old_val + adjustment))
366
+ self.parameters[param_name] = new_val
367
+ adjusted.append((param_name, old_val, new_val))
368
+ self.adjustment_count += 1
369
+
370
+ return adjusted
371
+
372
 
373
+ # =============================================================================
374
+ # THREE-TIERED MEMORY MANAGER (from SLM)
375
+ # =============================================================================
376
 
377
+ class TieredMemoryManager:
378
+ """
379
+ SLM Three-Tiered Memory Hierarchy
380
+
381
+ Working Memory (32MB, <1ms):
382
+ - Currently active info
383
+ - Priority decay: 0.95/minute
384
+ - Eviction threshold: 0.2
385
+
386
+ Token Memory (100-250 items, 1-10ms):
387
+ - Compressed representations
388
+ - Loop-based organization
389
+ - Merging at 0.8 similarity
390
+
391
+ Semantic Memory (persistent, 10-100ms):
392
+ - Full knowledge representations
393
+ - Partition-based organization
394
+ """
395
+
396
+ # SLM spec values (some adjusted based on benchmarks)
397
+ WORKING_MEMORY_SIZE = 50 # items (simplified from 32MB)
398
+ TOKEN_LOOP_CAPACITY = 100 # default
399
+ TOKEN_LOOP_MAX = 250 # expandable
400
+
401
+ PRIORITY_DECAY = 0.95 # per access cycle
402
+ EVICTION_THRESHOLD = 0.2
403
+ LOOP_MERGE_THRESHOLD = 0.8
404
+
405
+ def __init__(self, tuner: SelfTuner):
406
+ self.tuner = tuner
407
+
408
+ # Three tiers
409
+ self.working_memory: Dict[str, Memory] = {}
410
+ self.token_loops: Dict[str, List[str]] = defaultdict(list) # namespace -> ids
411
+ self.semantic_memory: Dict[str, Memory] = {}
412
+
413
+ self.stats = {
414
+ "promotions": 0,
415
+ "demotions": 0,
416
+ "evictions": 0
417
+ }
418
 
419
+ def add_to_tier(self, memory: Memory, tier: MemoryTier):
420
+ """Add memory to specific tier"""
421
+ memory.tier = tier
422
+
423
+ if tier == MemoryTier.WORKING:
424
+ self._add_to_working(memory)
425
+ elif tier == MemoryTier.TOKEN:
426
+ self._add_to_token(memory)
427
+ else:
428
+ self.semantic_memory[memory.id] = memory
429
+
430
+ def _add_to_working(self, memory: Memory):
431
+ """Add to working memory with eviction if needed"""
432
+ if len(self.working_memory) >= self.WORKING_MEMORY_SIZE:
433
+ self._evict_from_working()
434
+
435
+ memory.priority = 1.0
436
+ self.working_memory[memory.id] = memory
437
+
438
+ def _add_to_token(self, memory: Memory):
439
+ """Add to token memory loop"""
440
+ loop = self.token_loops[memory.namespace]
441
+
442
+ if len(loop) >= self.TOKEN_LOOP_CAPACITY:
443
+ # Demote oldest to semantic
444
+ oldest_id = loop.pop(0)
445
+ if oldest_id in self.semantic_memory:
446
+ self.semantic_memory[oldest_id].tier = MemoryTier.SEMANTIC
447
+
448
+ loop.append(memory.id)
449
+ self.semantic_memory[memory.id] = memory # Store actual data in semantic
450
+ memory.tier = MemoryTier.TOKEN
451
+
452
+ def _evict_from_working(self):
453
+ """Evict lowest priority items from working memory"""
454
+ if not self.working_memory:
455
+ return
456
+
457
+ # Find lowest priority
458
+ min_id = min(self.working_memory, key=lambda k: self.working_memory[k].priority)
459
+ evicted = self.working_memory.pop(min_id)
460
+
461
+ # Demote to token memory
462
+ self._add_to_token(evicted)
463
+ self.stats["evictions"] += 1
464
+
465
+ def decay_priorities(self):
466
+ """Apply SLM priority decay (0.95 per cycle)"""
467
+ for memory in self.working_memory.values():
468
+ memory.priority *= self.PRIORITY_DECAY
469
+
470
+ # Evict if below threshold
471
+ if memory.priority < self.EVICTION_THRESHOLD:
472
+ self._evict_from_working()
473
 
474
+ def calculate_promotion_score(self, memory: Memory, query_relevance: float) -> float:
475
+ """
476
+ SLM Promotion Score:
477
+ PromotionScore = (QueryRelevance * 0.6) + (AccessFrequency * 0.3) + (RecencyScore * 0.1)
478
+ """
479
+ # Normalize access frequency (0-1)
480
+ access_freq = min(memory.access_count / 10, 1.0)
481
+
482
+ # Recency score (higher = more recent)
483
+ age_hours = (time.time() - memory.last_accessed) / 3600
484
+ recency = max(0, 1 - (age_hours / 24)) # Decay over 24 hours
485
+
486
+ return (query_relevance * 0.6) + (access_freq * 0.3) + (recency * 0.1)
487
 
488
+ def calculate_demotion_score(self, memory: Memory, query_relevance: float) -> float:
489
+ """
490
+ SLM Demotion Score:
491
+ DemotionScore = (1-QueryRelevance)*0.5 + (1-AccessFrequency)*0.3 + (Age/MAX_AGE)*0.2
492
+ """
493
+ access_freq = min(memory.access_count / 10, 1.0)
494
+
495
+ age_hours = (time.time() - memory.created_at) / 3600
496
+ age_score = min(age_hours / 168, 1.0) # MAX_AGE = 1 week
497
+
498
+ return ((1 - query_relevance) * 0.5) + ((1 - access_freq) * 0.3) + (age_score * 0.2)
499
 
500
+ def try_promote(self, memory_id: str, query_relevance: float) -> bool:
501
+ """Try to promote memory to higher tier"""
502
+ if memory_id not in self.semantic_memory:
503
+ return False
504
+
505
+ memory = self.semantic_memory[memory_id]
506
+ score = self.calculate_promotion_score(memory, query_relevance)
507
+ threshold = self.tuner.parameters["promotion_threshold"]
508
+
509
+ if score > threshold:
510
+ if memory.tier == MemoryTier.SEMANTIC:
511
+ self._add_to_token(memory)
512
+ self.stats["promotions"] += 1
513
+ return True
514
+ elif memory.tier == MemoryTier.TOKEN:
515
+ self._add_to_working(memory)
516
+ self.stats["promotions"] += 1
517
+ return True
518
+
519
+ return False
520
 
521
+ def try_demote(self, memory_id: str, query_relevance: float) -> bool:
522
+ """Try to demote memory to lower tier"""
523
+ if memory_id in self.working_memory:
524
+ memory = self.working_memory[memory_id]
525
+ score = self.calculate_demotion_score(memory, query_relevance)
526
+ threshold = self.tuner.parameters["demotion_threshold"]
527
+
528
+ # Also check capacity (SLM: demote if >80% capacity)
529
+ capacity_pressure = len(self.working_memory) / self.WORKING_MEMORY_SIZE
530
+
531
+ if score > threshold and capacity_pressure > 0.8:
532
+ self.working_memory.pop(memory_id)
533
+ self._add_to_token(memory)
534
+ self.stats["demotions"] += 1
535
+ return True
536
+
537
+ return False
538
 
539
+ def get_all_memories(self) -> Dict[str, Memory]:
540
+ """Get all memories across tiers"""
541
+ return {**self.semantic_memory, **self.working_memory}
542
+
543
+ def get_tier_stats(self) -> Dict:
544
+ """Get tier statistics"""
545
+ return {
546
+ "working_memory_count": len(self.working_memory),
547
+ "working_memory_capacity": self.WORKING_MEMORY_SIZE,
548
+ "token_loops": {ns: len(ids) for ns, ids in self.token_loops.items()},
549
+ "semantic_memory_count": len(self.semantic_memory),
550
+ "promotions": self.stats["promotions"],
551
+ "demotions": self.stats["demotions"],
552
+ "evictions": self.stats["evictions"]
553
+ }
554
 
555
 
556
+ # =============================================================================
557
+ # NEURAL LINK MANAGER (from SLM)
558
+ # =============================================================================
559
+
560
class NeuralLinkManager:
    """
    SLM Neural Link Pathway System.

    Maintains typed, weighted, directed links between memories, supports
    bounded path finding across them, and applies decay/pruning maintenance.
    """

    # SLM path finding limits (adjusted based on benchmarks)
    MAX_PATH_DEPTH = 4         # SLM: 4 standard, 6 exhaustive
    MIN_PATH_STRENGTH = 0.40   # SLM: 0.45
    PATH_STRENGTH_DECAY = 0.9  # SLM: 0.9 per hop
    MAX_BRANCHING = 12         # SLM: 12

    # Pruning (adjusted based on benchmarks)
    PRUNE_STRENGTH_THRESHOLD = 0.25  # SLM: 0.30
    PRUNE_AGE_DAYS = 30              # SLM: 60, ADJUSTED

    def __init__(self):
        self.links: Dict[str, NeuralLink] = {}                 # link_id -> NeuralLink
        self.outgoing: Dict[str, Set[str]] = defaultdict(set)  # source -> link_ids
        self.incoming: Dict[str, Set[str]] = defaultdict(set)  # target -> link_ids

        self.stats = {
            "links_created": 0,
            "links_pruned": 0,
            "traversals": 0
        }

    def _link_id(self, source: str, target: str, link_type: LinkType) -> str:
        """Deterministic id for a (source, target, type) triple."""
        return f"{source}:{target}:{link_type.value}"

    def create_link(self, source_id: str, target_id: str,
                    link_type: LinkType, similarity: float) -> Optional[str]:
        """
        Create (or strengthen) a link if similarity exceeds the type-specific threshold.

        SLM LinkScore = (VectorSimilarity * 0.6) + (CoOccurrence * 0.25) + (DomainRelatedness * 0.15)
        Simplified here to just similarity.

        Returns the link id, or None when similarity is below the creation threshold.
        """
        props = LINK_PROPERTIES[link_type]

        if similarity < props["creation_threshold"]:
            return None

        link_id = self._link_id(source_id, target_id, link_type)

        if link_id in self.links:
            # Strengthen the existing link instead of duplicating it.
            self.links[link_id].strength = min(
                1.0,
                self.links[link_id].strength + props["usage_boost"]
            )
            return link_id

        # Create new link at its type's initial strength.
        link = NeuralLink(
            source_id=source_id,
            target_id=target_id,
            link_type=link_type,
            strength=props["initial_strength"]
        )

        self.links[link_id] = link
        self.outgoing[source_id].add(link_id)
        self.incoming[target_id].add(link_id)
        self.stats["links_created"] += 1

        return link_id

    def traverse_link(self, link_id: str) -> Optional[NeuralLink]:
        """Traverse a link, strengthening it; returns None for unknown ids."""
        if link_id not in self.links:
            return None

        link = self.links[link_id]
        link.traversal_count += 1
        link.last_traversed = time.time()

        # Strengthen on traversal (up to daily max)
        props = LINK_PROPERTIES[link.link_type]
        link.strength = min(1.0, link.strength + props["usage_boost"])

        self.stats["traversals"] += 1
        return link

    def find_paths(self, source_id: str, target_id: str,
                   max_depth: Optional[int] = None) -> List[List[str]]:
        """
        Find link paths between two memories (SLM path finding).

        Depth-first search bounded by depth, cumulative path strength
        (decayed per hop), and a branching factor.

        Fix: the original limited branching via ``list(set)[:MAX_BRANCHING]``,
        whose order is arbitrary, making both branch selection and results
        nondeterministic. Branches are now explored strongest-first so output
        is stable and the highest-strength pathways are preferred.
        """
        max_depth = max_depth or self.MAX_PATH_DEPTH
        paths: List[List[str]] = []

        def dfs(current: str, target: str, path: List[str],
                strength: float, depth: int):
            if depth > max_depth or strength < self.MIN_PATH_STRENGTH:
                return

            if current == target:
                paths.append(path.copy())
                return

            # Deterministic, strongest-first branch selection.
            candidates = [self.links[lid]
                          for lid in self.outgoing.get(current, set())
                          if lid in self.links]
            candidates.sort(key=lambda link: link.strength, reverse=True)

            for link in candidates[:self.MAX_BRANCHING]:
                if link.target_id not in path:
                    new_strength = strength * link.strength * self.PATH_STRENGTH_DECAY
                    path.append(link.target_id)
                    dfs(link.target_id, target, path, new_strength, depth + 1)
                    path.pop()

        dfs(source_id, target_id, [source_id], 1.0, 0)
        return paths

    def get_connected(self, memory_id: str,
                      link_types: Optional[List[LinkType]] = None) -> List[str]:
        """Return ids of memories this one links to, optionally filtered by link type."""
        connected = []

        for link_id in self.outgoing.get(memory_id, set()):
            link = self.links.get(link_id)
            if link:
                if link_types is None or link.link_type in link_types:
                    connected.append(link.target_id)

        return connected

    def decay_links(self):
        """Apply the per-type daily decay factor to every link's strength."""
        for link in self.links.values():
            props = LINK_PROPERTIES[link.link_type]
            link.strength *= (1 - props["decay_rate"])

    def prune_weak_links(self) -> int:
        """Remove links that are both weak AND unused for too long; return the count."""
        to_prune = []
        now = time.time()
        age_threshold = self.PRUNE_AGE_DAYS * 24 * 3600

        for link_id, link in self.links.items():
            age = now - link.last_traversed
            if link.strength < self.PRUNE_STRENGTH_THRESHOLD and age > age_threshold:
                to_prune.append(link_id)

        for link_id in to_prune:
            link = self.links.pop(link_id)
            self.outgoing[link.source_id].discard(link_id)
            self.incoming[link.target_id].discard(link_id)
            self.stats["links_pruned"] += 1

        return len(to_prune)

    def get_stats(self) -> Dict:
        """Link-count totals, per-type breakdown, and lifetime counters."""
        return {
            "total_links": len(self.links),
            "links_by_type": {
                lt.value: sum(1 for l in self.links.values() if l.link_type == lt)
                for lt in LinkType
            },
            **self.stats
        }
721
+
722
 
723
+ # =============================================================================
724
+ # MAIN MNEMO v4 CLASS
725
+ # =============================================================================
726
 
727
  class Mnemo:
728
  """
729
+ Mnemo v4: SLM-Inspired Memory System
730
 
731
+ Implements:
732
+ - Three-tiered memory hierarchy
733
+ - Neural link pathways (8 types)
734
+ - Self-tuning parameters
735
+ - Memory utility prediction
736
 
737
+ With parameter adjustments based on Mnemo benchmarks.
738
+ """
 
739
 
740
  STOP_WORDS = {"a", "an", "the", "is", "are", "was", "were", "be", "been",
741
  "to", "of", "in", "for", "on", "with", "at", "by", "from",
742
  "and", "but", "or", "not", "this", "that", "i", "me", "my"}
743
 
744
+ def __init__(self, embedding_dim: int = 384):
 
 
 
 
 
 
 
745
  self.embedding_dim = embedding_dim
746
+
747
+ # Core components
748
+ self.tuner = SelfTuner()
749
+ self.memory_manager = TieredMemoryManager(self.tuner)
750
+ self.link_manager = NeuralLinkManager()
751
+ self.utility_predictor = MemoryUtilityPredictor()
752
+
753
+ # Vector index
754
  self._embeddings: List[np.ndarray] = []
755
  self._ids: List[str] = []
756
 
 
759
  else:
760
  self.index = None
761
 
762
+ # BM25
763
  self.bm25 = None
764
  self._tokenized_docs: List[List[str]] = []
765
 
766
+ # Knowledge Graph
767
  if HAS_NETWORKX:
768
  self.graph = nx.DiGraph()
769
  else:
770
  self.graph = None
771
 
772
+ # Cache
 
 
773
  self._cache: Dict[str, Any] = {}
774
  self._cache_lock = threading.Lock()
775
 
776
+ # Stats
777
  self.stats = {
778
+ "adds": 0,
779
+ "adds_rejected": 0,
780
+ "searches": 0,
781
+ "cache_hits": 0,
782
+ "cache_misses": 0
783
  }
784
 
785
  def _get_embedding(self, text: str) -> np.ndarray:
786
+ """Generate embedding (hash-based for POC)"""
787
  cache_key = f"emb:{hashlib.md5(text.encode()).hexdigest()}"
788
+
789
  with self._cache_lock:
790
  if cache_key in self._cache:
791
  self.stats["cache_hits"] += 1
792
  return self._cache[cache_key]
793
  self.stats["cache_misses"] += 1
794
 
795
+ # Hash-based embedding
796
  embedding = np.zeros(self.embedding_dim, dtype=np.float32)
797
  words = text.lower().split()
798
  for i, word in enumerate(words):
 
808
 
809
  return embedding
810
 
811
+ def _estimate_quality(self, content: str) -> float:
812
+ """Estimate content quality (SLM quality gates)"""
813
+ score = 0.5
814
+ words = len(content.split())
815
 
816
+ if words < 5:
817
+ score -= 0.3
818
+ elif words > 20:
819
+ score += 0.1
820
+
821
+ if any(r in content.lower() for r in ["because", "therefore", "shows"]):
822
+ score += 0.2
823
 
824
+ if re.search(r'\d+', content):
825
+ score += 0.1
826
+
827
+ if any(v in content.lower() for v in ["something", "stuff", "maybe"]):
828
+ score -= 0.2
829
+
830
+ return max(0.0, min(1.0, score))
831
+
832
+ def should_inject(self, query: str, context: str = "",
833
+ conversation_history: str = "",
834
+ model_confidence: float = 0.5) -> bool:
835
+ """
836
+ Memory Utility Predictor - should we inject memory?
837
+
838
+ Based on benchmark findings that memory often hurts performance.
839
+ """
840
+ should, reason, confidence = self.utility_predictor.should_inject(
841
+ query, context, conversation_history, model_confidence
842
+ )
843
  return should
844
 
845
  def add(self, content: str, namespace: str = "default",
846
  metadata: Dict = None, skip_quality_check: bool = False) -> Optional[str]:
847
+ """Add memory with SLM quality gates"""
848
+ quality = self._estimate_quality(content)
849
+ threshold = self.tuner.parameters["quality_threshold"]
850
 
851
+ if not skip_quality_check and quality < threshold:
 
 
852
  self.stats["adds_rejected"] += 1
853
+ self.tuner.record_outcome("quality_threshold", threshold, False)
854
  return None
855
 
856
  memory_id = f"mem_{hashlib.md5(content.encode()).hexdigest()[:8]}"
 
865
  metadata=metadata or {}
866
  )
867
 
868
+ # Add to semantic memory (lowest tier)
869
+ self.memory_manager.add_to_tier(memory, MemoryTier.SEMANTIC)
870
+
871
+ # Update indices
872
  self._embeddings.append(embedding)
873
  self._ids.append(memory_id)
874
 
 
880
  if HAS_BM25:
881
  self.bm25 = BM25Okapi(self._tokenized_docs)
882
 
883
+ # Create links to similar memories
884
+ self._create_links_for_new_memory(memory_id, embedding)
 
 
 
 
 
 
885
 
886
  self.stats["adds"] += 1
887
+ self.tuner.record_outcome("quality_threshold", threshold, True)
888
+
889
  return memory_id
890
 
891
+ def _create_links_for_new_memory(self, memory_id: str, embedding: np.ndarray):
892
+ """Create neural links to similar memories"""
893
+ if len(self._ids) < 2:
894
+ return
895
+
896
+ # Find similar memories
897
+ similarities = []
898
+ for other_id, other_emb in zip(self._ids, self._embeddings):
899
+ if other_id != memory_id:
900
+ sim = float(np.dot(embedding, other_emb))
901
+ similarities.append((other_id, sim))
902
+
903
+ # Sort by similarity
904
+ similarities.sort(key=lambda x: x[1], reverse=True)
905
+
906
+ # Create links for top matches
907
+ for other_id, sim in similarities[:5]:
908
+ # Try different link types
909
+ self.link_manager.create_link(
910
+ memory_id, other_id, LinkType.SEMANTIC_SIMILARITY, sim
911
+ )
912
+ self.link_manager.create_link(
913
+ other_id, memory_id, LinkType.SEMANTIC_SIMILARITY, sim
914
+ )
915
+
916
+ def search(self, query: str, top_k: int = 5,
917
+ namespace: Optional[str] = None,
918
+ use_links: bool = True) -> List[SearchResult]:
919
+ """
920
+ Search with multi-strategy retrieval + neural links
921
+ """
922
+ if not self.memory_manager.semantic_memory:
923
  return []
924
 
925
  self.stats["searches"] += 1
926
  query_embedding = self._get_embedding(query)
927
+ threshold = self.tuner.parameters["similarity_threshold"]
928
 
929
+ # Strategy 1: Vector similarity
930
  semantic_scores = {}
931
  if HAS_FAISS and self.index is not None and self.index.ntotal > 0:
932
  k = min(top_k * 3, self.index.ntotal)
 
935
  if 0 <= idx < len(self._ids):
936
  semantic_scores[self._ids[idx]] = float(score)
937
  else:
938
+ for mem_id, emb in zip(self._ids, self._embeddings):
939
+ semantic_scores[mem_id] = float(np.dot(query_embedding, emb))
940
 
941
+ # Strategy 2: BM25
942
  bm25_scores = {}
943
  if HAS_BM25 and self.bm25 is not None:
944
  tokens = query.lower().split()
 
948
  if score > 0.1 * max_score:
949
  bm25_scores[self._ids[idx]] = float(score / max_score)
950
 
951
+ # Strategy 3: Neural link traversal
952
+ link_scores = {}
953
+ if use_links:
954
+ # Find top semantic matches and traverse their links
955
+ top_semantic = sorted(semantic_scores.items(), key=lambda x: x[1], reverse=True)[:3]
956
+ for mem_id, _ in top_semantic:
957
+ connected = self.link_manager.get_connected(mem_id)
958
+ for conn_id in connected[:5]:
959
+ link_scores[conn_id] = link_scores.get(conn_id, 0) + 0.3
 
960
 
961
+ # Combine scores (SLM-style weighting)
962
+ all_ids = set(semantic_scores.keys()) | set(bm25_scores.keys()) | set(link_scores.keys())
963
 
964
  if namespace:
965
+ # Filter by namespace
966
+ all_ids = {mid for mid in all_ids
967
+ if mid in self.memory_manager.semantic_memory
968
+ and self.memory_manager.semantic_memory[mid].namespace == namespace}
969
 
970
  results = []
971
  for mem_id in all_ids:
972
  strat = {
973
  "semantic": semantic_scores.get(mem_id, 0),
974
  "bm25": bm25_scores.get(mem_id, 0),
975
+ "links": link_scores.get(mem_id, 0)
976
  }
977
 
978
  combined = (
979
+ strat["semantic"] * 0.5 +
980
+ strat["bm25"] * 0.3 +
981
+ strat["links"] * 0.2
982
  )
983
 
984
+ memory = self.memory_manager.semantic_memory.get(mem_id)
985
+ if memory and combined >= threshold:
986
+ # Update access tracking
987
+ memory.access_count += 1
988
+ memory.last_accessed = time.time()
989
+
990
+ # Try promotion
991
+ self.memory_manager.try_promote(mem_id, combined)
992
+
993
+ results.append(SearchResult(
994
+ id=mem_id,
995
+ content=memory.content,
996
+ score=combined,
997
+ tier=memory.tier,
998
+ strategy_scores=strat,
999
+ metadata=memory.metadata
1000
+ ))
1001
 
1002
+ self.tuner.record_outcome("similarity_threshold", threshold, True)
1003
+ else:
1004
+ self.tuner.record_outcome("similarity_threshold", threshold, False)
 
 
 
 
 
1005
 
1006
  results.sort(key=lambda x: x.score, reverse=True)
 
 
 
 
 
1007
  return results[:top_k]
1008
 
1009
+ def get_context(self, query: str, top_k: int = 3,
1010
+ namespace: Optional[str] = None) -> str:
1011
+ """Get formatted context for prompt injection"""
1012
  results = self.search(query, top_k=top_k, namespace=namespace)
1013
 
1014
  if not results:
 
1016
 
1017
  parts = ["[RELEVANT CONTEXT FROM MEMORY]"]
1018
  for r in results:
1019
+ tier_marker = f"[{r.tier.value.upper()}]" if r.tier != MemoryTier.SEMANTIC else ""
1020
+ parts.append(f"โ€ข {tier_marker} {r.content}")
1021
  parts.append("[END CONTEXT]\n")
1022
 
1023
  return "\n".join(parts)
1024
 
1025
  def feedback(self, query: str, memory_id: str, relevance: float):
1026
+ """Record feedback for learning"""
1027
  relevance = max(-1, min(1, relevance))
1028
+
1029
+ if memory_id in self.memory_manager.semantic_memory:
1030
+ memory = self.memory_manager.semantic_memory[memory_id]
1031
+
1032
+ # Update relevance score
1033
+ memory.relevance_score = 0.7 * memory.relevance_score + 0.3 * ((relevance + 1) / 2)
1034
+
1035
+ # Strengthen/weaken links based on feedback
1036
+ for link_id in self.link_manager.outgoing.get(memory_id, set()):
1037
+ link = self.link_manager.links.get(link_id)
1038
+ if link:
1039
+ link.strength = max(0, min(1, link.strength + relevance * 0.05))
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1040
 
1041
+ def maintenance_cycle(self):
1042
+ """Run SLM maintenance operations"""
1043
+ # Decay priorities in working memory
1044
+ self.memory_manager.decay_priorities()
1045
+
1046
+ # Decay link strengths
1047
+ self.link_manager.decay_links()
1048
+
1049
+ # Prune weak links
1050
+ pruned = self.link_manager.prune_weak_links()
1051
+
1052
+ # Auto-tune parameters
1053
+ adjustments = self.tuner.auto_tune()
1054
+
1055
+ return {
1056
+ "links_pruned": pruned,
1057
+ "parameter_adjustments": adjustments
1058
+ }
1059
 
1060
  def get_stats(self) -> Dict:
1061
+ """Get comprehensive statistics"""
1062
  return {
1063
+ "memories": {
1064
+ "total": len(self.memory_manager.semantic_memory),
1065
+ **self.memory_manager.get_tier_stats()
1066
+ },
1067
+ "links": self.link_manager.get_stats(),
1068
+ "utility_predictor": self.utility_predictor.stats,
1069
+ "tuner": {
1070
+ "parameters": self.tuner.parameters,
1071
+ "adjustments": self.tuner.adjustment_count
1072
+ },
1073
+ "operations": self.stats
 
1074
  }
1075
 
1076
    def clear(self):
        """Clear all memory: rebuild the stateful subsystems and empty every index.

        NOTE: the existing SelfTuner instance (and its learned parameters) is
        deliberately kept and handed to the fresh TieredMemoryManager.
        """
        self.memory_manager = TieredMemoryManager(self.tuner)
        self.link_manager = NeuralLinkManager()
        self._embeddings.clear()
        self._ids.clear()
        self._tokenized_docs.clear()
        self.bm25 = None
        self._cache.clear()

        # Rebuild the FAISS index so no stale vectors linger.
        if HAS_FAISS:
            self.index = faiss.IndexFlatIP(self.embedding_dim)
 
 
 
 
1088
 
1089
    def __len__(self):
        """Total stored memories (the semantic store backs every tier)."""
        return len(self.memory_manager.semantic_memory)
1091
 
1092
    def __repr__(self):
        # Compact debug summary: memory count plus neural-link count.
        return f"Mnemo(memories={len(self)}, links={len(self.link_manager.links)})"
1094
 
1095
 
1096
+ # =============================================================================
1097
+ # DEMO
1098
+ # =============================================================================
1099
+
1100
def demo():
    """Console walkthrough of the v4 features: tuned parameters, quality-gated
    adds, utility prediction, multi-strategy search, neural links, and stats."""
    print("="*70)
    print("MNEMO v4: SLM-INSPIRED ARCHITECTURE")
    print("="*70)

    m = Mnemo()
    print(f"\nโœ“ Initialized: {m}")

    # Show tuned parameters
    print("\n๐Ÿ“Š Tuned Parameters (adjusted from SLM):")
    for param, value in m.tuner.parameters.items():
        print(f"  {param}: {value}")

    # Add memories (some may be rejected by the quality gate)
    print("\n๐Ÿ“ Adding memories...")
    memories = [
        "User prefers Python because it has clean syntax and good libraries",
        "Previous analysis showed gender bias in Victorian psychiatry diagnoses",
        "Framework has 5 checkpoints for detecting historical medical bias",
        "The project deadline is March 15th for the API redesign",
        "User's coffee preference is cappuccino with oat milk"
    ]

    for mem in memories:
        result = m.add(mem)
        # add() returns None when the quality gate rejects the content.
        status = "โœ“" if result else "โœ—"
        print(f"  {status} {mem[:50]}...")

    # Test memory utility predictor against expected inject/skip decisions
    print("\n๐Ÿง  Memory Utility Predictions:")
    tests = [
        ("What is Python?", False),
        ("Based on your previous analysis...", True),
        ("Compare to your earlier findings", True),
        ("This is a NEW topic", False),
    ]

    for query, expected in tests:
        result = m.should_inject(query)
        status = "โœ“" if result == expected else "โœ—"
        action = "INJECT" if result else "SKIP"
        print(f"  {status} {action}: {query}")

    # Search (multi-strategy: vector + BM25 + neural links)
    print("\n๐Ÿ” Search Results:")
    results = m.search("previous analysis framework", top_k=3)
    for r in results:
        print(f"  [{r.tier.value}] score={r.score:.3f}: {r.content[:50]}...")

    # Show neural links created between similar memories
    print("\n๐Ÿ”— Neural Links:")
    link_stats = m.link_manager.get_stats()
    print(f"  Total links: {link_stats['total_links']}")
    for lt, count in link_stats['links_by_type'].items():
        if count > 0:
            print(f"  {lt}: {count}")

    # Full stats across all subsystems
    print("\n๐Ÿ“Š Full Statistics:")
    stats = m.get_stats()
    print(f"  Memories: {stats['memories']['total']}")
    print(f"  Working memory: {stats['memories']['working_memory_count']}")
    print(f"  Links: {stats['links']['total_links']}")
    print(f"  Utility predictions: {stats['utility_predictor']['predictions']}")

    print("\n" + "="*70)
    print("โœ… Demo complete!")
    print("="*70)
1168
 
1169
 
1170
  if __name__ == "__main__":