""" MnemoCore Subconscious Daemon ========================= Continuous background processing using Gemma 1B via Ollama. Performs: concept extraction, parallel drawing, memory valuation, thought sorting. Integrates with Redis Subconscious Bus to publish insights. """ import asyncio import aiohttp import json import random import time from datetime import datetime, timezone from typing import List, Dict, Any, Optional import sys import os sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))) from mnemocore.core.engine import HAIMEngine from mnemocore.core.async_storage import AsyncRedisStorage from mnemocore.core.config import get_config from mnemocore.meta.learning_journal import LearningJournal from mnemocore.core.node import MemoryNode from mnemocore.core.metrics import ( DREAM_LOOP_TOTAL, DREAM_LOOP_ITERATION_SECONDS, DREAM_LOOP_INSIGHTS_GENERATED, DREAM_LOOP_ACTIVE ) # Default Config (overridden by config.yaml) DEFAULT_OLLAMA_URL = "http://localhost:11434/api/generate" DEFAULT_MODEL = "gemma3:1b" HAIM_DATA_PATH = "./data/memory.jsonl" DEFAULT_CYCLE_INTERVAL = 60 # seconds between thought cycles LOG_PATH = "/tmp/subconscious.log" EVOLUTION_STATE_PATH = "./data/subconscious_evolution.json" def _write_state_to_disk(state: Dict[str, Any], filepath: str): """Write state to disk synchronously (to be used in executor).""" os.makedirs(os.path.dirname(filepath), exist_ok=True) with open(filepath, "w") as f: json.dump(state, f, indent=2) class SubconsciousDaemon: """The always-running background mind.""" def __init__(self, storage: Optional[AsyncRedisStorage] = None, config: Optional[Any] = None): """ Initialize SubconsciousDaemon with optional dependency injection. Args: storage: AsyncRedisStorage instance. If None, creates one in run(). config: Configuration object. If None, loads from get_config(). """ # Load configuration self._config = config or get_config() # Dream loop configuration from config.yaml dream_loop_config = getattr(self._config, 'dream_loop', None) if dream_loop_config: self.ollama_url = getattr(dream_loop_config, 'ollama_url', DEFAULT_OLLAMA_URL) self.model = getattr(dream_loop_config, 'model', DEFAULT_MODEL) self.frequency_seconds = getattr(dream_loop_config, 'frequency_seconds', DEFAULT_CYCLE_INTERVAL) self.batch_size = getattr(dream_loop_config, 'batch_size', 10) self.max_iterations = getattr(dream_loop_config, 'max_iterations', 0) self.dream_loop_enabled = getattr(dream_loop_config, 'enabled', True) else: self.ollama_url = DEFAULT_OLLAMA_URL self.model = DEFAULT_MODEL self.frequency_seconds = DEFAULT_CYCLE_INTERVAL self.batch_size = 10 self.max_iterations = 0 self.dream_loop_enabled = True self.engine = HAIMEngine(persist_path=HAIM_DATA_PATH) self.journal = LearningJournal() # Graceful shutdown support using asyncio.Event self._stop_event = asyncio.Event() self.running = False self.cycle_count = 0 self.insights_generated = 0 self.current_cycle_interval = self.frequency_seconds self.schedule = { "concept_every": 5, "parallel_every": 3, "value_every": 10, "meta_every": 7, "cleanup_every": 20 } self.activity_window: List[int] = [] self.low_activity_streak = 0 self.last_cycle_metrics: Dict[str, Any] = {} self._load_evolution_state() # Async Redis Storage (injected or initialized in run) self.storage: Optional[AsyncRedisStorage] = storage def _should_stop(self) -> bool: """Check if the daemon should stop (non-blocking check).""" return self._stop_event.is_set() async def request_stop(self): """Request graceful stop of the daemon (async-safe).""" self._stop_event.set() self.running = False def log(self, msg: str): timestamp = datetime.now().strftime("%Y-%m-%d %H:%M:%S") line = f"[{timestamp}] {msg}" print(line) with open(LOG_PATH, "a") as f: f.write(line + "\n") def _load_evolution_state(self): """Load persistent evolution state from disk.""" if not os.path.exists(EVOLUTION_STATE_PATH): return try: with open(EVOLUTION_STATE_PATH, "r") as f: state = json.load(f) self.cycle_count = int(state.get("cycle_count", self.cycle_count)) self.insights_generated = int(state.get("insights_generated", self.insights_generated)) self.current_cycle_interval = int(state.get("current_cycle_interval", self.current_cycle_interval)) saved_schedule = state.get("schedule", {}) if isinstance(saved_schedule, dict): for k in self.schedule: if k in saved_schedule: self.schedule[k] = max(2, int(saved_schedule[k])) self.activity_window = list(state.get("activity_window", []))[-12:] self.low_activity_streak = int(state.get("low_activity_streak", 0)) except Exception as e: self.log(f"Failed to load evolution state: {e}") async def _save_evolution_state(self): """Persist state so evolution continues across restarts.""" state = { "updated_at": datetime.now(timezone.utc).isoformat(), "cycle_count": self.cycle_count, "insights_generated": self.insights_generated, "current_cycle_interval": self.current_cycle_interval, "schedule": self.schedule, "activity_window": self.activity_window[-12:], "low_activity_streak": self.low_activity_streak, "last_cycle_metrics": self.last_cycle_metrics, } try: loop = asyncio.get_running_loop() await loop.run_in_executor(None, _write_state_to_disk, state, EVOLUTION_STATE_PATH) except Exception as e: self.log(f"Failed to save evolution state: {e}") def _compute_surprise(self, metrics: Dict[str, Any]) -> float: """Estimate surprise from novelty/output dynamics.""" score = 0.0 score += 0.12 * metrics.get("concepts", 0) score += 0.20 * metrics.get("parallels", 0) score += 0.30 * metrics.get("meta_insights", 0) if metrics.get("adaptation") and metrics.get("adaptation") != "none": score += 0.25 return min(1.0, score) def _adapt_evolution_policy(self, metrics: Dict[str, Any]): """ Adapt cadence and schedule so the subconscious keeps evolving. Low activity -> stimulate exploration. High sustained activity -> stabilize to preserve quality. """ activity_score = ( metrics.get("concepts", 0) + metrics.get("parallels", 0) + metrics.get("meta_insights", 0) ) self.activity_window.append(activity_score) self.activity_window = self.activity_window[-12:] if activity_score == 0: self.low_activity_streak += 1 else: self.low_activity_streak = 0 adaptation = "none" avg_activity = sum(self.activity_window) / max(1, len(self.activity_window)) if self.low_activity_streak >= 4: self.schedule["concept_every"] = max(2, self.schedule["concept_every"] - 1) self.schedule["parallel_every"] = max(2, self.schedule["parallel_every"] - 1) self.schedule["meta_every"] = max(3, self.schedule["meta_every"] - 1) self.current_cycle_interval = max(35, self.current_cycle_interval - 5) self.low_activity_streak = 0 adaptation = "stimulate" elif avg_activity >= 2.0: self.current_cycle_interval = min(90, self.current_cycle_interval + 5) self.schedule["value_every"] = min(15, self.schedule["value_every"] + 1) adaptation = "stabilize" metrics["activity_score"] = activity_score metrics["avg_activity"] = round(avg_activity, 3) metrics["adaptation"] = adaptation def _record_cycle_learning(self, metrics: Dict[str, Any]): """Write periodic learning traces so evolution is continuous and explicit.""" should_record = ( self.cycle_count % 5 == 0 or metrics.get("meta_insights", 0) > 0 or metrics.get("adaptation", "none") != "none" ) if not should_record: return surprise = self._compute_surprise(metrics) lesson = ( f"Cycle {self.cycle_count}: concepts={metrics.get('concepts', 0)}, " f"parallels={metrics.get('parallels', 0)}, meta={metrics.get('meta_insights', 0)}, " f"adaptation={metrics.get('adaptation', 'none')}, interval={self.current_cycle_interval}s." ) context = ( f"memories={metrics.get('memories', 0)}, synapses={metrics.get('synapses', 0)}, " f"schedule={self.schedule}" ) self.journal.record( lesson=lesson, context=context, outcome="success", confidence=0.7, tags=["subconscious", "continuous-evolution"], surprise=surprise, ) async def query_ollama(self, prompt: str, max_tokens: int = 200) -> str: """Query local Gemma model.""" payload = { "model": self.model, "prompt": prompt, "stream": False, "options": { "num_predict": max_tokens, "temperature": 0.7 } } try: async with aiohttp.ClientSession() as session: async with session.post(self.ollama_url, json=payload, timeout=30) as resp: if resp.status == 200: data = await resp.json() return data.get("response", "").strip() else: self.log(f"Ollama error: {resp.status}") return "" except Exception as e: self.log(f"Ollama connection error: {e}") return "" async def extract_concepts(self, memories: List[MemoryNode]) -> List[Dict]: """Extract concepts from recent memories.""" if not memories: return [] # Sample up to 5 memories sample = random.sample(memories, min(5, len(memories))) contents = [m.content[:200] for m in sample] prompt = f"""Analyze these memory fragments and extract key concepts. Output JSON array of concepts with attributes. Memories: {chr(10).join(f'- {c}' for c in contents)} Output format: [{{"name": "concept", "category": "type", "connections": ["related1", "related2"]}}] Only output valid JSON array, nothing else.""" response = await self.query_ollama(prompt, max_tokens=300) try: # Try to parse JSON if "[" in response: start = response.index("[") end = response.rindex("]") + 1 concepts = json.loads(response[start:end]) return concepts except: pass return [] async def draw_parallels(self, memories: List[MemoryNode]) -> List[str]: """Find unexpected connections between memories.""" if len(memories) < 2: return [] # Pick 2 random memories sample = random.sample(memories, 2) prompt = f"""Find a non-obvious parallel or connection between these two ideas: 1: {sample[0].content[:200]} 2: {sample[1].content[:200]} Output ONE insight about how these connect. Be creative but logical. Max 50 words.""" response = await self.query_ollama(prompt, max_tokens=100) if response and len(response) > 20: return [response] return [] async def value_memories(self, memories: List[MemoryNode]) -> Dict[str, float]: """Re-evaluate memory importance based on patterns.""" if not memories: return {} # Sample memories for valuation sample = random.sample(memories, min(10, len(memories))) prompt = f"""Rate each memory's strategic value (0.0-1.0) for a tech entrepreneur focused on expansion. Memories: {chr(10).join(f'{i+1}. {m.content[:100]}' for i, m in enumerate(sample))} Output format: {{"1": 0.8, "2": 0.3, ...}} Only output valid JSON object.""" response = await self.query_ollama(prompt, max_tokens=200) try: if "{" in response: start = response.index("{") end = response.rindex("}") + 1 values = json.loads(response[start:end]) # Map back to memory IDs result = {} for i, m in enumerate(sample): key = str(i + 1) if key in values: result[m.id] = float(values[key]) return result except: pass return {} async def generate_insight(self, memories: List[MemoryNode]) -> Optional[str]: """Generate a meta-insight from memory patterns.""" if len(memories) < 3: return None sample = random.sample(memories, min(8, len(memories))) contents = [m.content[:150] for m in sample] prompt = f"""You are analyzing patterns in an entrepreneur's memory system. Recent memories: {chr(10).join(f'- {c}' for c in contents)} Generate ONE actionable insight or pattern you notice. Focus on: - Recurring themes - Opportunities being missed - Contradictions to resolve - Strategic blind spots Output just the insight, max 60 words.""" response = await self.query_ollama(prompt, max_tokens=120) if response and len(response) > 30: return response return None async def store_insight(self, content: str, meta: Dict[str, Any]): """Helper to store insight and publish event.""" # Store in Engine (Sync) # Offload sync I/O to thread to avoid blocking loop mem_id = await asyncio.to_thread(self.engine.store, content, metadata=meta) # Publish Event (Async) if self.storage: try: await self.storage.publish_event( "insight.generated", {"id": mem_id, "type": meta.get("type", "insight"), "content": content[:50]} ) except Exception as e: self.log(f"Failed to publish event: {e}") return mem_id async def run_cycle(self): """Execute one thought cycle.""" iteration_start_time = time.time() self.cycle_count += 1 self.log(f"=== Cycle {self.cycle_count} ===") metrics: Dict[str, Any] = { "concepts": 0, "parallels": 0, "meta_insights": 0, "valuations": 0, "memories": len(self.engine.tier_manager.hot), "synapses": len(self.engine.synapses), } # Get all hot memories as list (references only, no copy) memories = list(self.engine.tier_manager.hot.values()) if not memories: self.log("No memories to process") metrics["adaptation"] = "none" self.last_cycle_metrics = metrics await self._save_evolution_state() # Record metrics DREAM_LOOP_TOTAL.labels(status="success").inc() return self.log(f"Processing {len(memories)} memories") # 1. Extract concepts (every 5 cycles) if self.cycle_count % self.schedule["concept_every"] == 0: concepts = await self.extract_concepts(memories) for concept in concepts: if "name" in concept: attrs = {k: str(v) for k, v in concept.items() if k != "name"} self.engine.define_concept(concept["name"], attrs) metrics["concepts"] += 1 self.log(f"Concept extracted: {concept['name']}") # Record insight metric DREAM_LOOP_INSIGHTS_GENERATED.labels(type="concept").inc() # Publish concept event? if self.storage: await self.storage.publish_event("concept.extracted", {"name": concept["name"]}) # 2. Draw parallels (every 3 cycles) if self.cycle_count % self.schedule["parallel_every"] == 0: parallels = await self.draw_parallels(memories) for p in parallels: # Store parallel as new memory await self.store_insight( f"[PARALLEL] {p}", meta={"type": "insight", "source": "subconscious", "cycle": self.cycle_count} ) self.insights_generated += 1 metrics["parallels"] += 1 self.log(f"Parallel found: {p[:80]}...") # Record insight metric DREAM_LOOP_INSIGHTS_GENERATED.labels(type="parallel").inc() # 3. Value memories (every 10 cycles) if self.cycle_count % self.schedule["value_every"] == 0: values = await self.value_memories(memories) for mem_id, value in values.items(): if mem_id in self.engine.tier_manager.hot: self.engine.tier_manager.hot[mem_id].pragmatic_value = value metrics["valuations"] += 1 self.log(f"Valued {len(values)} memories") # 4. Generate meta-insight (every 7 cycles) if self.cycle_count % self.schedule["meta_every"] == 0: insight = await self.generate_insight(memories) if insight: await self.store_insight( f"[META-INSIGHT] {insight}", meta={"type": "meta", "source": "subconscious", "cycle": self.cycle_count} ) self.insights_generated += 1 metrics["meta_insights"] += 1 self.log(f"Meta-insight: {insight[:80]}...") # Record insight metric DREAM_LOOP_INSIGHTS_GENERATED.labels(type="meta").inc() # 5. Cleanup decayed synapses (every 20 cycles) if self.cycle_count % self.schedule["cleanup_every"] == 0: before = len(self.engine.synapses) self.engine.cleanup_decay(threshold=0.1) removed = max(0, before - len(self.engine.synapses)) self.log(f"Synapse cleanup complete (removed {removed})") metrics["memories"] = len(self.engine.tier_manager.hot) metrics["synapses"] = len(self.engine.synapses) self._adapt_evolution_policy(metrics) self._record_cycle_learning(metrics) self.last_cycle_metrics = metrics await self._save_evolution_state() # Record iteration duration metric iteration_duration = time.time() - iteration_start_time DREAM_LOOP_ITERATION_SECONDS.observe(iteration_duration) DREAM_LOOP_TOTAL.labels(status="success").inc() self.log( "Cycle complete. " f"Insights={self.insights_generated} " f"(concepts={metrics['concepts']}, parallels={metrics['parallels']}, meta={metrics['meta_insights']}) " f"adaptation={metrics.get('adaptation', 'none')} interval={self.current_cycle_interval}s " f"duration={iteration_duration:.2f}s" ) async def _consume_events(self): """Consume events from the Subconscious Bus (Redis Stream).""" if not self.storage: return last_id = "$" # New events only config = get_config() stream_key = config.redis.stream_key self.log(f"Starting event consumer on {stream_key}") while self.running: try: # XREAD is blocking streams = await self.storage.redis_client.xread( {stream_key: last_id}, count=1, block=1000 ) if not streams: await asyncio.sleep(0.1) continue for _, events in streams: for event_id, event_data in events: last_id = event_id await self._process_event(event_data) except Exception as e: self.log(f"Event consumer error: {e}") await asyncio.sleep(1) async def _process_event(self, event_data: Dict[str, Any]): """Handle incoming events.""" event_type = event_data.get("type") if event_type == "memory.created": mem_id = event_data.get("id") if not mem_id: return # Check if we already have it (created by us?) if mem_id in self.engine.tier_manager.hot: return self.log(f"Received sync event: memory.created ({mem_id})") # Fetch full memory from Redis data = await self.storage.retrieve_memory(mem_id) if not data: self.log(f"Could not retrieve memory {mem_id} from storage") return # Reconstruct and add to Engine try: # Need to handle HDV reconstruction. # For now, we might need to load it via Engine's logic or construct manually. # Engine's logic is best to ensure consistency. # But Engine doesn't have a "load_from_redis" method readily available on single node. # TierManager has _load_from_warm, but that's for Qdrant/File. # We can manually reconstruct ephemeral node for HOT tier. # Check if it has HDV vector in Redis? # AsyncRedisStorage store_memory stores metadata + content. # It does NOT store the vector currently in the metadata payload in `store_memory` in `api/main.py`. # API calls engine.store -> which creates node -> then API calls storage.store_memory. # The node in engine has the vector. # But Daemon is a separate process. It needs the vector. # Critical Gap: Redis payload doesn't have the vector. # We need to fetch it from Qdrant/Warm if it was persisted there? # Engine.store puts it in HOT (RAM) and Appends to `memory.jsonl` (Legacy). # It does NOT immediately put it in Qdrant (Warm). # So Daemon cannot load it from Qdrant yet. # It can load it from `memory.jsonl` if it reads the file? # Or we must include the vector in the Redis payload or `memory.created` event? # Including vector in Redis event is heavy. # Option A: Read from `memory.jsonl` tail? # Option B: Pass vector in Redis (might be large). # Option C: API should also save to Qdrant immediately if we want shared state? # But TierManager logic says "Starts in HOT". # Workaround for Phase 3.5: # Since Engine appends to `memory.jsonl`, we can try to re-load from there. # Or, we update API to include the vector/seed in Redis? # Re-encoding in Daemon is an option if we have the content. # HAIM is distinct: Same content = Same Vector (if deterministic). # Let's use re-encoding for now. content = data.get("content", "") if content: # Encode hdv = self.engine.encode_content(content) # Create Node node = MemoryNode( id=data["id"], hdv=hdv, content=content, metadata=data.get("metadata", {}) ) node.ltp_strength = float(data.get("ltp_strength", 0.5)) node.created_at = datetime.fromisoformat(data["created_at"]) # Add to Daemon's Engine self.engine.tier_manager.add_memory(node) self.log(f"Synced memory {mem_id} to HOT tier") except Exception as e: self.log(f"Failed to process sync for {mem_id}: {e}") async def run(self): """Main daemon loop.""" if not self.dream_loop_enabled: self.log("Dream loop is disabled in configuration. Exiting.") return # Clear stop event for restart support self._stop_event.clear() self.running = True DREAM_LOOP_ACTIVE.set(1) if not self.storage: # Create storage from config if not injected config = get_config() self.storage = AsyncRedisStorage( url=config.redis.url, stream_key=config.redis.stream_key, max_connections=config.redis.max_connections, socket_timeout=config.redis.socket_timeout, password=config.redis.password, ) self.log("Subconscious daemon starting...") self.log(f"Model: {self.model} | Cycle interval: {self.frequency_seconds}s | Max iterations: {self.max_iterations or 'unlimited'}") # Start event consumer task asyncio.create_task(self._consume_events()) iterations = 0 while self.running and not self._should_stop(): # Check max_iterations limit (0 = unlimited) if self.max_iterations > 0 and iterations >= self.max_iterations: self.log(f"Reached max iterations ({self.max_iterations}). Stopping.") break try: await self.run_cycle() iterations += 1 except Exception as e: self.log(f"Cycle error: {e}") DREAM_LOOP_TOTAL.labels(status="error").inc() # Non-blocking sleep with periodic stop check sleep_interval = self.current_cycle_interval sleep_remaining = sleep_interval check_interval = 0.5 # Check for stop every 0.5 seconds while sleep_remaining > 0 and not self._should_stop(): sleep_time = min(check_interval, sleep_remaining) await asyncio.sleep(sleep_time) sleep_remaining -= sleep_time self.running = False DREAM_LOOP_ACTIVE.set(0) self.log("Daemon stopped.") def stop(self): """Request daemon stop (can be called from signal handler).""" self._stop_event.set() self.running = False self.log("Daemon stop requested...") async def main(): daemon = SubconsciousDaemon() # Handle graceful shutdown import signal def shutdown(sig, frame): daemon.stop() signal.signal(signal.SIGINT, shutdown) signal.signal(signal.SIGTERM, shutdown) await daemon.run() if __name__ == "__main__": asyncio.run(main())