File size: 3,926 Bytes
266dba2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
import { ScoredMemory, MemoryConfig, DEFAULT_MEMORY_CONFIG, MemoryType } from './types';
import { applyDecayWeighting } from './memoryDecay';
import { formatMemoriesByType } from './typedMemory';

type QueryComplexity = 'simple' | 'moderate' | 'complex';

export function estimateQueryComplexity(query: string): QueryComplexity {
  const wc = query.split(/\s+/).length;
  if (wc <= 5) return 'simple';
  if (/\b(what('s|\s+is)\s+my|am\s+i|do\s+i|where\s+do\s+i)\b/i.test(query)) return 'simple';
  if (wc >= 15) return 'complex';
  if (/\b(plan|schedule|organize|considering|taking\s+into\s+account|based\s+on)\b/i.test(query)) return 'complex';
  if (/\band\b.*\band\b/i.test(query)) return 'complex';
  return 'moderate';
}

export function inferRelevantMemoryTypes(query: string): MemoryType[] {
  const types: MemoryType[] = []; const q = query.toLowerCase();
  if (/\b(yesterday|last|when|recently|remember\s+when|did\s+we|did\s+i|what\s+happened)\b/.test(q)) types.push('episodic');
  if (/\b(how\s+(should|do)|what's\s+the\s+rule|format|style|remind|procedure)\b/.test(q)) types.push('procedural');
  if (/\b(what('s|\s+is)\s+my|suggest|recommend|prefer|like|allergic|favorite|do\s+i\s+(like|have|live))\b/.test(q)) types.push('semantic');
  return types.length ? types : ['semantic', 'episodic', 'procedural'];
}

export interface RetrievalParams { topK: number; similarityThreshold: number; maxTokenBudget: number; priorityTypes: MemoryType[]; boostRecent: boolean; }

export function computeRetrievalParams(query: string, config: MemoryConfig = DEFAULT_MEMORY_CONFIG): RetrievalParams {
  const complexity = estimateQueryComplexity(query);
  const priorityTypes = inferRelevantMemoryTypes(query);
  const boostRecent = /\b(today|just|now|this\s+(morning|afternoon|evening)|recently|latest)\b/i.test(query);
  switch (complexity) {
    case 'simple': return { topK: 3, similarityThreshold: 0.50, maxTokenBudget: 100, priorityTypes, boostRecent };
    case 'moderate': return { topK: config.defaultTopK, similarityThreshold: config.minSimilarityThreshold, maxTokenBudget: config.maxContextTokens, priorityTypes, boostRecent };
    case 'complex': return { topK: 12, similarityThreshold: 0.35, maxTokenBudget: 500, priorityTypes, boostRecent };
  }
}

export function buildDynamicRetrievalQuery(embedding: number[], params: RetrievalParams) {
  const typeFilter = params.priorityTypes.length < 3 ? `AND type IN (${params.priorityTypes.map(() => '?').join(',')})` : '';
  const orderClause = params.boostRecent
    ? `ORDER BY (1 - vec_distance_cosine(embedding, vec_f32(?))) * (1 + 0.2 * CASE WHEN (julianday('now') - julianday(last_accessed_at / 1000, 'unixepoch')) < 1 THEN 1 ELSE 0 END) DESC`
    : `ORDER BY vec_distance_cosine(embedding, vec_f32(?)) ASC`;
  const sql = `SELECT id, text, embedding, type, source, created_at, last_accessed_at, access_count, importance, (1 - vec_distance_cosine(embedding, vec_f32(?))) AS similarity FROM memories WHERE (1 - vec_distance_cosine(embedding, vec_f32(?))) >= ? ${typeFilter} ${orderClause} LIMIT ?`;
  const queryParams: unknown[] = [JSON.stringify(embedding), JSON.stringify(embedding), params.similarityThreshold, ...params.priorityTypes.length < 3 ? params.priorityTypes : [], JSON.stringify(embedding), params.topK];
  return { sql, queryParams };
}

export function processRetrievedMemories(rawResults: Array<{ record: any; cosineSimilarity: number }>, params: RetrievalParams, config: MemoryConfig = DEFAULT_MEMORY_CONFIG) {
  const scored = applyDecayWeighting(rawResults, config);
  let tokenCount = 0; const selected: ScoredMemory[] = [];
  for (const m of scored) { const t = Math.ceil(m.text.length / 4); if (tokenCount + t > params.maxTokenBudget) break; selected.push(m); tokenCount += t; }
  return { formattedContext: formatMemoriesByType(selected.map(m => ({ text: m.text, type: m.type, source: m.source }))), memoriesUsed: selected.map(m => m.id) };
}