| import { ScoredMemory, MemoryConfig, DEFAULT_MEMORY_CONFIG, MemoryType } from './types'; |
| import { applyDecayWeighting } from './memoryDecay'; |
| import { formatMemoriesByType } from './typedMemory'; |
|
|
| type QueryComplexity = 'simple' | 'moderate' | 'complex'; |
|
|
| export function estimateQueryComplexity(query: string): QueryComplexity { |
| const wc = query.split(/\s+/).length; |
| if (wc <= 5) return 'simple'; |
| if (/\b(what('s|\s+is)\s+my|am\s+i|do\s+i|where\s+do\s+i)\b/i.test(query)) return 'simple'; |
| if (wc >= 15) return 'complex'; |
| if (/\b(plan|schedule|organize|considering|taking\s+into\s+account|based\s+on)\b/i.test(query)) return 'complex'; |
| if (/\band\b.*\band\b/i.test(query)) return 'complex'; |
| return 'moderate'; |
| } |
|
|
| export function inferRelevantMemoryTypes(query: string): MemoryType[] { |
| const types: MemoryType[] = []; const q = query.toLowerCase(); |
| if (/\b(yesterday|last|when|recently|remember\s+when|did\s+we|did\s+i|what\s+happened)\b/.test(q)) types.push('episodic'); |
| if (/\b(how\s+(should|do)|what's\s+the\s+rule|format|style|remind|procedure)\b/.test(q)) types.push('procedural'); |
| if (/\b(what('s|\s+is)\s+my|suggest|recommend|prefer|like|allergic|favorite|do\s+i\s+(like|have|live))\b/.test(q)) types.push('semantic'); |
| return types.length ? types : ['semantic', 'episodic', 'procedural']; |
| } |
|
|
| export interface RetrievalParams { topK: number; similarityThreshold: number; maxTokenBudget: number; priorityTypes: MemoryType[]; boostRecent: boolean; } |
|
|
| export function computeRetrievalParams(query: string, config: MemoryConfig = DEFAULT_MEMORY_CONFIG): RetrievalParams { |
| const complexity = estimateQueryComplexity(query); |
| const priorityTypes = inferRelevantMemoryTypes(query); |
| const boostRecent = /\b(today|just|now|this\s+(morning|afternoon|evening)|recently|latest)\b/i.test(query); |
| switch (complexity) { |
| case 'simple': return { topK: 3, similarityThreshold: 0.50, maxTokenBudget: 100, priorityTypes, boostRecent }; |
| case 'moderate': return { topK: config.defaultTopK, similarityThreshold: config.minSimilarityThreshold, maxTokenBudget: config.maxContextTokens, priorityTypes, boostRecent }; |
| case 'complex': return { topK: 12, similarityThreshold: 0.35, maxTokenBudget: 500, priorityTypes, boostRecent }; |
| } |
| } |
|
|
| export function buildDynamicRetrievalQuery(embedding: number[], params: RetrievalParams) { |
| const typeFilter = params.priorityTypes.length < 3 ? `AND type IN (${params.priorityTypes.map(() => '?').join(',')})` : ''; |
| const orderClause = params.boostRecent |
| ? `ORDER BY (1 - vec_distance_cosine(embedding, vec_f32(?))) * (1 + 0.2 * CASE WHEN (julianday('now') - julianday(last_accessed_at / 1000, 'unixepoch')) < 1 THEN 1 ELSE 0 END) DESC` |
| : `ORDER BY vec_distance_cosine(embedding, vec_f32(?)) ASC`; |
| const sql = `SELECT id, text, embedding, type, source, created_at, last_accessed_at, access_count, importance, (1 - vec_distance_cosine(embedding, vec_f32(?))) AS similarity FROM memories WHERE (1 - vec_distance_cosine(embedding, vec_f32(?))) >= ? ${typeFilter} ${orderClause} LIMIT ?`; |
| const queryParams: unknown[] = [JSON.stringify(embedding), JSON.stringify(embedding), params.similarityThreshold, ...params.priorityTypes.length < 3 ? params.priorityTypes : [], JSON.stringify(embedding), params.topK]; |
| return { sql, queryParams }; |
| } |
|
|
| export function processRetrievedMemories(rawResults: Array<{ record: any; cosineSimilarity: number }>, params: RetrievalParams, config: MemoryConfig = DEFAULT_MEMORY_CONFIG) { |
| const scored = applyDecayWeighting(rawResults, config); |
| let tokenCount = 0; const selected: ScoredMemory[] = []; |
| for (const m of scored) { const t = Math.ceil(m.text.length / 4); if (tokenCount + t > params.maxTokenBudget) break; selected.push(m); tokenCount += t; } |
| return { formattedContext: formatMemoriesByType(selected.map(m => ({ text: m.text, type: m.type, source: m.source }))), memoriesUsed: selected.map(m => m.id) }; |
| } |
|
|