Spaces:

ruslanmv
/

HomePilot

Running

HomePilot Deploy Bot

chore(hf): sync HomePilot to HF Space

23b413b 1 day ago

22.4 kB

	"""
	Memory V2 — Brain-inspired hierarchical memory engine (additive).

	Implements Working -> Consolidation -> Semantic memory with:
	- Exponential decay (activation fades over time)
	- Reinforcement (accessed/confirmed memories grow stronger)
	- Consolidation (repeated working items promote to semantic)
	- Pruning (low-activation + low-importance semantic items are forgotten)
	- Persona Integrity Kernel isolation (never modifies persona identity)

	Memory types:
	P = Pinned (user-approved "core memories"; never auto-pruned, tau=infinity)
	S = Semantic (stable facts/preferences; slow decay tau~30 days; prunable)
	W = Working (short-lived context traces; fast decay tau~6 hours)
	A = Anchor (profile/persona kernel — not stored here; injected from profile.py)

	IMPORTANT: This module is additive-only.
	- Reuses the existing persona_memory table
	- Adds optional columns via safe ALTER TABLE (ignored by V1 code)
	- V1 (ltm.py) continues to work unchanged
	- V2 is opt-in via memoryEngine='v2' in settings

	IMPORTANT: Persona identity is NEVER learned/changed here.
	This stores only user-overlay memories (facts about the user, preferences,
	boundaries). The persona's voice/role/rules remain immutable in the
	PersonalityAgent definitions.
	"""
	from __future__ import annotations

	import hashlib
	import math
	import re
	import sqlite3
	import time
	from dataclasses import dataclass
	from typing import Any, Dict, List, Optional, Tuple

	from .storage import _get_db_path


	# ---------------------------------------------------------------------------
	# Configuration
	# ---------------------------------------------------------------------------

	@dataclass
	class V2Config:
	    """Tunable parameters for the V2 memory engine (all fields have defaults)."""

	    # --- Decay: time constants in seconds for A(t) = s * exp(-dt / tau) ---
	    tau_working: float = 21_600.0  # 6 hours
	    tau_semantic: float = 2_592_000.0  # 30 days

	    # --- Reinforcement: eta in the saturating update s <- 1-(1-s)*e^{-eta} ---
	    eta_user_confirmed: float = 0.25
	    eta_inferred: float = 0.05

	    # --- Consolidation: all three must hold to promote Working -> Semantic ---
	    consolidate_min_repeats: int = 2
	    consolidate_min_importance: float = 0.45
	    consolidate_min_activation: float = 0.25

	    # --- Pruning: applies to Semantic entries only; Pinned are never pruned ---
	    prune_activation_thresh: float = 0.05
	    prune_importance_thresh: float = 0.25

	    # --- Retrieval: how many items of each type go into the prompt ---
	    top_pinned: int = 4
	    top_semantic: int = 8
	    top_working: int = 1

	    # --- Safety: upper bound on the length of a stored value ---
	    max_value_chars: int = 600

	    # --- Throttle: minimum seconds between consolidation/pruning passes ---
	    maintenance_interval: float = 30.0


	# ---------------------------------------------------------------------------
	# Math helpers
	# ---------------------------------------------------------------------------

	def _now() -> float:
	return time.time()


	def _clamp(x: float, lo: float, hi: float) -> float:
	return max(lo, min(hi, x))


	def _activation(strength: float, last_access_at: float, tau: float) -> float:
	    """Return retrievability A(t) = s * exp(-dt / tau).

	    ``dt`` is the number of seconds since ``last_access_at``; a falsy
	    timestamp (0 / None) is treated as "just now", and negative elapsed
	    time is floored at zero.
	    """
	    current = _now()
	    reference = last_access_at if last_access_at else _now()
	    elapsed = current - reference
	    if elapsed < 0.0:
	        elapsed = 0.0
	    decay_factor = math.exp(-elapsed / tau)
	    return float(strength) * decay_factor


	def _reinforce(strength: float, eta: float) -> float:
	"""Saturating reinforcement: s <- 1 - (1-s) * exp(-eta)."""
	s = _clamp(float(strength), 0.0, 1.0)
	return 1.0 - (1.0 - s) * math.exp(-float(eta))


	def _stable_hash(text: str) -> str:
	"""Deterministic hash (stable across Python restarts, unlike hash())."""
	return hashlib.md5(text.encode("utf-8", errors="replace")).hexdigest()[:12]


	def _clean_value(s: str, max_chars: int) -> str:
	s2 = (s or "").strip()
	s2 = re.sub(r"\s+", " ", s2)
	if len(s2) > max_chars:
	s2 = s2[:max_chars - 1].rstrip() + "..."
	return s2


	def _keyword_score(query: str, text: str) -> float:
	"""Lightweight relevance: normalized token overlap."""
	q = set(re.findall(r"[a-z0-9]{3,}", (query or "").lower()))
	t = set(re.findall(r"[a-z0-9]{3,}", (text or "").lower()))
	if not q or not t:
	return 0.0
	overlap = len(q.intersection(t))
	return overlap / max(1, min(len(q), 8))


	# ---------------------------------------------------------------------------
	# Explicit "remember this" detector (conservative — avoids false positives)
	# ---------------------------------------------------------------------------

	_RE_REMEMBER = re.compile(
	r"\b(remember this\|remember that\|don't forget\|do not forget\|please remember)\b",
	re.I,
	)


	# ---------------------------------------------------------------------------
	# Schema extension (additive ALTER TABLE — safe to run repeatedly)
	# ---------------------------------------------------------------------------

	def ensure_v2_columns() -> None:
	    """Add the V2-specific columns to the ``persona_memory`` table.

	    Reads the current column list via ``PRAGMA table_info`` and issues an
	    ``ALTER TABLE ... ADD COLUMN`` only for columns that are missing, so it
	    can be called on every startup. The connection is always closed, even
	    when a statement raises.

	    NOTE(review): the original note says V1 code ignores these columns
	    (SELECT * with sqlite3.Row); that is not verifiable from this module.

	    Raises:
	        sqlite3.Error: Propagated from SQLite (e.g. the table is missing).
	    """
	    # (column name, SQL type + default). Names are fixed constants, so
	    # interpolating them into the ALTER statement is safe.
	    additions = [
	        ("mem_type", "TEXT DEFAULT 'S'"),  # P/S/W
	        ("strength", "REAL DEFAULT 0.5"),  # reinforcement strength
	        ("importance", "REAL DEFAULT 0.3"),  # importance score
	        ("last_access_at", "REAL DEFAULT 0"),  # unix timestamp of last retrieval
	        ("access_count", "INTEGER DEFAULT 0"),  # how many times retrieved/reinforced
	        ("last_seen_at", "REAL DEFAULT 0"),  # unix timestamp when last ingested/seen
	    ]

	    con = sqlite3.connect(_get_db_path())
	    try:
	        cur = con.cursor()
	        cur.execute("PRAGMA table_info(persona_memory)")
	        # Row layout of table_info: index 1 holds the column name.
	        existing = {row[1] for row in cur.fetchall()}

	        for col_name, col_def in additions:
	            if col_name not in existing:
	                cur.execute(f"ALTER TABLE persona_memory ADD COLUMN {col_name} {col_def}")

	        con.commit()
	    finally:
	        con.close()


	# ---------------------------------------------------------------------------
	# DB helpers (using sqlite3.Row for safe column-name access)
	# ---------------------------------------------------------------------------

	def _connect() -> sqlite3.Connection:
	    """Open the memory database with rows addressable by column name."""
	    db_path = _get_db_path()
	    connection = sqlite3.connect(db_path)
	    # sqlite3.Row lets callers convert rows to dicts keyed by column name.
	    connection.row_factory = sqlite3.Row
	    return connection


	def _select_memories(project_id: str, user_id: Optional[str] = None) -> List[Dict[str, Any]]:
	    """Fetch every ``persona_memory`` row for a project as plain dicts.

	    Args:
	        project_id: Project whose rows are returned.
	        user_id: When truthy, only rows with this ``user_id`` are returned;
	            ``None`` or ``""`` returns rows for all users of the project.

	    Returns:
	        One dict per row, keyed by column name.
	    """
	    con = _connect()
	    try:
	        cur = con.cursor()
	        if user_id:
	            cur.execute(
	                "SELECT * FROM persona_memory WHERE project_id = ? AND user_id = ?",
	                (project_id, user_id),
	            )
	        else:
	            cur.execute("SELECT * FROM persona_memory WHERE project_id = ?", (project_id,))
	        return [dict(r) for r in cur.fetchall()]
	    finally:
	        # Release the connection even if the query raises.
	        con.close()


	def _upsert_memory(
	    project_id: str,
	    category: str,
	    key: str,
	    value: str,
	    mem_type: str,
	    source_type: str,
	    confidence: float,
	    strength: float,
	    importance: float,
	    seen_now: bool = True,
	    reinforce_eta: Optional[float] = None,
	    user_id: Optional[str] = None,
	) -> None:
	    """Insert or update one memory row identified by (project_id, category, key).

	    An UPDATE is attempted first; it refreshes value/confidence/source_type
	    and ``updated_at`` while leaving already-set V2 fields (mem_type,
	    strength, importance) untouched. If no row matched, a new row is
	    inserted with strength and importance clamped to [0, 1]. Optionally the
	    row is then reinforced with the saturating update
	    ``s <- 1 - (1 - s) * exp(-eta)``.

	    Args:
	        project_id, category, key: Identify the row.
	        value: Memory text; cleaned and capped at 600 characters.
	        mem_type: 'P', 'S' or 'W'; only applied when the row has none yet.
	        source_type: Stored as-is.
	        confidence: Stored as a float.
	        strength: Initial strength for a newly inserted row.
	        importance: Importance; only applied when the row has none yet.
	        seen_now: When true, ``last_seen_at`` is set to the current time.
	        reinforce_eta: When not ``None``, reinforce the row with this eta
	            and bump ``last_access_at`` / ``access_count``.
	        user_id: Owner stored on insert (not changed on update).

	    Raises:
	        sqlite3.Error: Propagated from SQLite; the connection is closed first.
	    """
	    now_ts = _now()
	    now_dt = time.strftime("%Y-%m-%d %H:%M:%S")
	    value = _clean_value(value, max_chars=600)

	    con = sqlite3.connect(_get_db_path())
	    try:
	        cur = con.cursor()

	        # Try update first
	        cur.execute(
	            """
	            UPDATE persona_memory
	            SET
	            value = ?,
	            confidence = ?,
	            source_type = ?,
	            updated_at = ?,
	            mem_type = COALESCE(mem_type, ?),
	            strength = COALESCE(strength, 0.5),
	            importance = COALESCE(importance, ?),
	            last_seen_at = CASE WHEN ? THEN ? ELSE COALESCE(last_seen_at, 0) END
	            WHERE project_id = ? AND category = ? AND key = ?
	            """,
	            (value, float(confidence), source_type, now_dt,
	             mem_type, float(importance),
	             1 if seen_now else 0, now_ts,
	             project_id, category, key),
	        )

	        if cur.rowcount == 0:
	            # Nothing matched: insert a new row.
	            cur.execute(
	                """
	                INSERT INTO persona_memory
	                (project_id, category, key, value, confidence, source_session,
	                source_type, created_at, updated_at,
	                mem_type, strength, importance, last_access_at, access_count, last_seen_at,
	                user_id)
	                VALUES
	                (?, ?, ?, ?, ?, NULL,
	                ?, ?, ?,
	                ?, ?, ?, 0, 0, ?,
	                ?)
	                """,
	                (project_id, category, key, value, float(confidence),
	                 source_type, now_dt, now_dt,
	                 mem_type, float(_clamp(strength, 0.0, 1.0)),
	                 float(_clamp(importance, 0.0, 1.0)),
	                 now_ts if seen_now else 0.0,
	                 user_id),
	            )

	        # Reinforce if requested (on existing or just-inserted row)
	        if reinforce_eta is not None:
	            # exp(-eta) is computed in Python: the SQL EXP() function is
	            # only present in SQLite builds with math functions enabled.
	            shrink = math.exp(-float(reinforce_eta))
	            cur.execute(
	                """
	                UPDATE persona_memory
	                SET
	                strength = MIN(1.0, 1.0 - (1.0 - COALESCE(strength, 0.5)) * ?),
	                last_access_at = ?,
	                access_count = COALESCE(access_count, 0) + 1
	                WHERE project_id = ? AND category = ? AND key = ?
	                """,
	                (shrink, now_ts, project_id, category, key),
	            )

	        con.commit()
	    finally:
	        # Always release the connection, including on SQL errors.
	        con.close()


	def _touch_access(project_id: str, mem_id: int, eta: float) -> None:
	    """Reinforce one memory row by id (light touch on retrieval).

	    Applies ``s <- 1 - (1 - s) * exp(-eta)`` (capped at 1.0), sets
	    ``last_access_at`` to the current time and increments ``access_count``.

	    Args:
	        project_id: Project the row must belong to.
	        mem_id: Row id.
	        eta: Reinforcement increment.

	    Raises:
	        sqlite3.Error: Propagated from SQLite; the connection is closed first.
	    """
	    now_ts = _now()
	    # exp(-eta) is computed in Python: the SQL EXP() function is only
	    # present in SQLite builds with math functions enabled.
	    shrink = math.exp(-float(eta))

	    con = sqlite3.connect(_get_db_path())
	    try:
	        con.execute(
	            """
	            UPDATE persona_memory
	            SET
	            strength = MIN(1.0, 1.0 - (1.0 - COALESCE(strength, 0.5)) * ?),
	            last_access_at = ?,
	            access_count = COALESCE(access_count, 0) + 1
	            WHERE project_id = ? AND id = ?
	            """,
	            (shrink, now_ts, project_id, int(mem_id)),
	        )
	        con.commit()
	    finally:
	        con.close()


	def _delete_by_id(project_id: str, mem_id: int) -> None:
	    """Delete one memory row, matched on both project and row id.

	    Deleting a row that does not exist is a no-op.

	    Raises:
	        sqlite3.Error: Propagated from SQLite; the connection is closed first.
	    """
	    con = sqlite3.connect(_get_db_path())
	    try:
	        con.execute(
	            "DELETE FROM persona_memory WHERE project_id = ? AND id = ?",
	            (project_id, int(mem_id)),
	        )
	        con.commit()
	    finally:
	        # Release the connection even if the DELETE raises.
	        con.close()


	def purge_memories_by_keyword(project_id: str, keyword: str) -> int:
	    """Delete non-pinned memories of a project whose value mentions ``keyword``.

	    Matching is a case-insensitive substring test on the stored value.
	    Rows whose ``mem_type`` is 'P' (pinned) are never deleted; rows without
	    a ``mem_type`` are treated as semantic ('S').

	    Per the original note, this is called when an outfit/item is removed
	    from the wardrobe so stale references do not linger.

	    Args:
	        project_id: Project whose memories are scanned.
	        keyword: Text to look for; blank or ``None`` deletes nothing.

	    Returns:
	        Number of rows selected for deletion.

	    Raises:
	        sqlite3.Error: Propagated from SQLite; the connection is closed first.
	    """
	    if not keyword or not keyword.strip():
	        return 0
	    needle = keyword.strip().lower()

	    con = sqlite3.connect(_get_db_path())
	    try:
	        con.row_factory = sqlite3.Row
	        cur = con.cursor()
	        cur.execute(
	            "SELECT id, value, mem_type FROM persona_memory WHERE project_id = ?",
	            (project_id,),
	        )
	        doomed: List[int] = [
	            int(row["id"])
	            for row in cur.fetchall()
	            # Never auto-delete pinned memories.
	            if (row["mem_type"] or "S").upper() != "P"
	            and needle in (row["value"] or "").lower()
	        ]
	        # Single batched delete, scoped to the project like _delete_by_id.
	        cur.executemany(
	            "DELETE FROM persona_memory WHERE project_id = ? AND id = ?",
	            [(project_id, mem_id) for mem_id in doomed],
	        )
	        con.commit()
	    finally:
	        con.close()
	    return len(doomed)


	# ---------------------------------------------------------------------------
	# V2 Engine
	# ---------------------------------------------------------------------------

	class MemoryV2Engine:
	    """Working -> Semantic memory engine on top of the ``persona_memory`` table.

	    Public entry points:
	    - ``ingest_user_text``: store a user message as Pinned or Working memory.
	    - ``consolidate``: promote or merge Working items into Semantic memory.
	    - ``prune``: forget weak Semantic items and trim Working noise.
	    - ``build_context``: render a memory block for the system prompt.
	    """

	    # Words suggesting a message states a lasting preference or boundary.
	    # Alternatives are separated by a bare "|" (an escaped "\|" would match a
	    # literal pipe and the heuristic would never fire).
	    _IMPORTANCE_RE = re.compile(
	        r"\b(prefer|always|never|important|boundary|hate|love)\b",
	        re.I,
	    )

	    def __init__(self, config: Optional[V2Config] = None) -> None:
	        """Create an engine with ``config`` (defaults to ``V2Config()``)."""
	        self.cfg = config or V2Config()
	        self._last_maintenance: Dict[str, float] = {}  # project_id -> timestamp

	    # ---- ingest (called per user message) ----

	    def ingest_user_text(self, project_id: str, user_text: str, user_id: Optional[str] = None) -> None:
	        """Store one user message as memory.

	        Two paths:
	        1. Explicit "remember this" -> Pinned (P), reinforced immediately.
	        2. Default -> Working trace (W), fast decay.
	        After a Working insert, consolidation + pruning run on a throttled
	        schedule (not on every message). Text shorter than 5 characters
	        after cleaning is ignored.
	        """
	        t = _clean_value(user_text, self.cfg.max_value_chars)
	        if not t or len(t) < 5:
	            return

	        # Path 1: Explicit "remember" -> pinned
	        if _RE_REMEMBER.search(t):
	            _upsert_memory(
	                project_id=project_id,
	                category="user",
	                key=f"pinned:{_stable_hash(t)}",
	                value=t,
	                mem_type="P",
	                source_type="user",
	                confidence=1.0,
	                strength=1.0,
	                importance=0.95,
	                reinforce_eta=self.cfg.eta_user_confirmed,
	                user_id=user_id,
	            )
	            return

	        # Path 2: Working trace (fast decay, cheap to store)
	        _upsert_memory(
	            project_id=project_id,
	            category="working",
	            key=f"w:{_stable_hash(t)}",
	            value=t,
	            mem_type="W",
	            source_type="user",
	            confidence=0.5,
	            strength=0.5,
	            importance=0.25,
	            reinforce_eta=None,
	            user_id=user_id,
	        )

	        # Throttled maintenance (consolidation + pruning)
	        self._maybe_maintain(project_id, user_id=user_id)

	    # ---- throttled maintenance ----

	    def _maybe_maintain(self, project_id: str, user_id: Optional[str] = None) -> None:
	        """Run consolidation + pruning at most once per ``maintenance_interval``.

	        The throttle is tracked per ``project_id``. Failures are reported on
	        stdout and never propagate to the caller.
	        """
	        now = _now()
	        last = self._last_maintenance.get(project_id, 0.0)
	        if now - last < self.cfg.maintenance_interval:
	            return
	        # Record the attempt up front so a failing pass is not retried at once.
	        self._last_maintenance[project_id] = now
	        try:
	            self.consolidate(project_id, user_id=user_id)
	            self.prune(project_id, user_id=user_id)
	        except Exception as e:
	            print(f"[MEMORY_V2] Maintenance warning (non-fatal): {e}")

	    # ---- consolidate (promote W -> S when reinforced) ----

	    def consolidate(self, project_id: str, user_id: Optional[str] = None) -> None:
	        """Promote or merge recent Working items into Semantic memory.

	        Only the 15 most recently seen Working items are considered. For each:
	        - If it overlaps an existing Semantic entry (keyword score >= 0.45),
	          that Semantic entry is reinforced and the item is left as is.
	        - Otherwise it is promoted to a new Semantic entry and removed from
	          Working when all hold: enough similar Working items
	          (``consolidate_min_repeats``), enough importance
	          (``consolidate_min_importance``) and enough activation
	          (``consolidate_min_activation``).
	        """
	        mem = _select_memories(project_id, user_id=user_id)
	        working = [m for m in mem if (m.get("mem_type") or "S") == "W"]
	        semantic = [m for m in mem if (m.get("mem_type") or "S") == "S"]

	        if not working:
	            return

	        # Recent working items only
	        working_sorted = sorted(
	            working,
	            key=lambda x: float(x.get("last_seen_at") or 0),
	            reverse=True,
	        )[:15]

	        for w in working_sorted:
	            w_text = w.get("value") or ""
	            w_strength = float(w.get("strength") or 0.5)
	            w_last = float(w.get("last_access_at") or w.get("last_seen_at") or 0.0)
	            if w_last <= 0:
	                # No usable timestamp: treat the item as fresh.
	                w_last = _now()

	            # Activation in working space
	            act = _activation(w_strength, w_last, self.cfg.tau_working)

	            # Repetition: count similar W items
	            rep = 0
	            for w2 in working_sorted:
	                if w2["id"] == w["id"]:
	                    continue
	                if _keyword_score(w2.get("value") or "", w_text) >= 0.6:
	                    rep += 1

	            # Importance heuristic: preference/boundary words raise it to 0.5
	            imp = float(w.get("importance") or 0.25)
	            if self._IMPORTANCE_RE.search(w_text):
	                imp = max(imp, 0.5)

	            # Check overlap with existing semantic entries
	            best_sem = None
	            best_score = 0.0
	            for s in semantic:
	                sc = _keyword_score(w_text, s.get("value") or "")
	                if sc > best_score:
	                    best_score = sc
	                    best_sem = s

	            # If it maps to existing semantic, reinforce that entry
	            if best_sem and best_score >= 0.45:
	                _touch_access(project_id, int(best_sem["id"]), self.cfg.eta_inferred)
	                continue

	            # Otherwise: promote W -> S if thresholds met
	            if (
	                rep >= self.cfg.consolidate_min_repeats
	                and imp >= self.cfg.consolidate_min_importance
	                and act >= self.cfg.consolidate_min_activation
	            ):
	                _upsert_memory(
	                    project_id=project_id,
	                    category="semantic",
	                    key=f"s:{_stable_hash(w_text)}",
	                    value=f"Stable note: {w_text}",
	                    mem_type="S",
	                    source_type="inferred",
	                    confidence=0.55,
	                    strength=0.55,
	                    importance=_clamp(imp, 0.0, 1.0),
	                    reinforce_eta=self.cfg.eta_inferred,
	                    user_id=user_id,
	                )
	                # Clean up promoted working item
	                _delete_by_id(project_id, int(w["id"]))

	    # ---- prune (human-like forgetting) ----

	    def prune(self, project_id: str, user_id: Optional[str] = None) -> None:
	        """Forget weak Semantic entries and trim Working noise.

	        A Semantic entry is deleted only when both its activation and its
	        importance are below the configured prune thresholds. Pinned (P)
	        entries are never touched. Working entries beyond the 25 most
	        recently seen are deleted.
	        """
	        mem = _select_memories(project_id, user_id=user_id)

	        # Prune semantic (decay-based)
	        for s in mem:
	            if (s.get("mem_type") or "S") != "S":
	                continue
	            strength = float(s.get("strength") or 0.5)
	            last = float(s.get("last_access_at") or s.get("last_seen_at") or 0.0)
	            if last <= 0:
	                # No usable timestamp: treat the entry as fresh.
	                last = _now()
	            imp = float(s.get("importance") or 0.3)
	            act = _activation(strength, last, self.cfg.tau_semantic)
	            if act < self.cfg.prune_activation_thresh and imp < self.cfg.prune_importance_thresh:
	                _delete_by_id(project_id, int(s["id"]))

	        # Trim Working noise: keep only latest ~25
	        working = [m for m in mem if (m.get("mem_type") or "S") == "W"]
	        if len(working) > 25:
	            working_sorted = sorted(
	                working,
	                key=lambda x: float(x.get("last_seen_at") or 0.0),
	                reverse=True,
	            )
	            for w in working_sorted[25:]:
	                _delete_by_id(project_id, int(w["id"]))

	    # ---- retrieve (build context for system prompt injection) ----

	    def build_context(self, project_id: str, query: str, user_id: Optional[str] = None) -> str:
	        """Build a compact memory block for the system prompt.

	        Selects the top Pinned entries (by importance, then recency), the top
	        Semantic entries (score = 0.55*relevance + 0.30*activation +
	        0.15*importance) and the most recent Working entries, limited by the
	        ``top_*`` settings. Selected Semantic entries are reinforced as a
	        best-effort side effect.

	        Returns:
	            The rendered text, or ``""`` when there is nothing to show.
	        """
	        mem = _select_memories(project_id, user_id=user_id)

	        pinned = [m for m in mem if (m.get("mem_type") or "S") == "P"]
	        sem = [m for m in mem if (m.get("mem_type") or "S") == "S"]
	        working = [m for m in mem if (m.get("mem_type") or "S") == "W"]

	        # Rank pinned by importance then recency
	        pinned_sorted = sorted(
	            pinned,
	            key=lambda x: (
	                float(x.get("importance") or 0.9),
	                float(x.get("last_seen_at") or 0.0),
	            ),
	            reverse=True,
	        )[:self.cfg.top_pinned]

	        # Rank semantic by composite score: relevance + activation + importance
	        scored_sem: List[Tuple[float, Dict[str, Any]]] = []
	        for s in sem:
	            strength = float(s.get("strength") or 0.5)
	            last = float(s.get("last_access_at") or s.get("last_seen_at") or 0.0)
	            if last <= 0:
	                last = _now()
	            imp = float(s.get("importance") or 0.3)
	            act = _activation(strength, last, self.cfg.tau_semantic)
	            rel = _keyword_score(query, s.get("value") or "")
	            score = 0.55 * rel + 0.30 * act + 0.15 * imp
	            scored_sem.append((score, s))
	        scored_sem.sort(key=lambda x: x[0], reverse=True)
	        sem_top = [s for _, s in scored_sem[:self.cfg.top_semantic]]

	        # Reinforce retrieved semantic memories (light touch). Retrieval must
	        # not fail because of this, so errors are reported and skipped.
	        for s in sem_top:
	            try:
	                _touch_access(project_id, int(s["id"]), self.cfg.eta_inferred)
	            except Exception as e:
	                print(f"[MEMORY_V2] Reinforcement warning (non-fatal): {e}")

	        # Working: keep the most recent item(s)
	        working_sorted = sorted(
	            working,
	            key=lambda x: float(x.get("last_seen_at") or 0.0),
	            reverse=True,
	        )[:self.cfg.top_working]

	        # Build output
	        lines: List[str] = []

	        if pinned_sorted:
	            lines.append("PINNED MEMORY (user-approved, permanent):")
	            for m in pinned_sorted:
	                lines.append(f" - {m.get('value')}")
	            lines.append("")

	        if sem_top:
	            lines.append("LEARNED MEMORY (semantic, long-term):")
	            for m in sem_top:
	                conf = float(m.get("confidence") or 0.5)
	                tag = "" if conf >= 0.8 else " (uncertain)"
	                lines.append(f" - {m.get('value')}{tag}")
	            lines.append("")

	        if working_sorted:
	            lines.append("WORKING CONTEXT (short-lived):")
	            for m in working_sorted:
	                lines.append(f" - {m.get('value')}")
	            lines.append("")

	        return "\n".join(lines).strip()


	# ---------------------------------------------------------------------------
	# Singleton (lazy)
	# ---------------------------------------------------------------------------

	# Process-wide engine instance; stays None until first requested.
	_engine: Optional[MemoryV2Engine] = None


	def get_memory_v2() -> MemoryV2Engine:
	    """Return the shared ``MemoryV2Engine``, creating it on first use."""
	    global _engine
	    instance = _engine
	    if instance is None:
	        instance = MemoryV2Engine()
	        _engine = instance
	    return instance