Spaces:

mishig
/

chat-ui

Running on CPU Upgrade

App Files Files Community

victor HF Staff committed on Dec 21, 2025

Commit

2d994c9

unverified ·

1 Parent(s): d4e1a40

fix(mcp): reduce Exa API context size sent to LLM (#2026)

Browse files

Use highlights instead of full page text to minimize context size.
The previous implementation requested `text: true`, which returned
entire page contents (5-20K+ chars per result), overwhelming the LLM context.

Now uses:
- highlights: 2 per URL, 3 sentences each (concise, query-relevant)
- text fallback: max 500 chars (always requested, but only used when highlights are empty)

This matches what the MCP server at mcp.exa.ai likely returns.

Files changed (1) hide show

src/lib/server/mcp/exaDirect.ts +17 -6

src/lib/server/mcp/exaDirect.ts CHANGED Viewed

@@ -140,6 +140,7 @@ interface ExaSearchResponse {
 /**
  * Format Exa search results as human-readable text
  */
 function formatSearchResultsAsText(results: ExaSearchResult[]): string {
 	if (results.length === 0) {
@@ -154,10 +155,11 @@ function formatSearchResultsAsText(results: ExaSearchResult[]): string {
 				parts.push(`   Published: ${result.publishedDate}`);
 			}
-			if (result.text) {
-				parts.push(`   ${result.text}`);
-			} else if (result.highlights && result.highlights.length > 0) {
 				parts.push(`   ${result.highlights.join(" ... ")}`);
 			}
 			return parts.join("\n");
@@ -186,13 +188,22 @@ export async function callExaDirectApi(
 		throw new Error("Missing required parameter: query");
 	}
-	// Build request body - pass through all args, ensure query exists and request text content
 	const requestBody: Record<string, unknown> = {
 		...args,
 		query,
-		// Required to get page text content, not just metadata
 		contents: {
-			text: true,
 		},
 	};

 /**
  * Format Exa search results as human-readable text
+ * Prioritizes highlights (concise snippets) over full text to minimize LLM context
  */
 function formatSearchResultsAsText(results: ExaSearchResult[]): string {
 	if (results.length === 0) {
 				parts.push(`   Published: ${result.publishedDate}`);
 			}
+			// Prefer highlights (concise, query-relevant) over full text
+			if (result.highlights && result.highlights.length > 0) {
 				parts.push(`   ${result.highlights.join(" ... ")}`);
+			} else if (result.text) {
+				parts.push(`   ${result.text}`);
 			}
 			return parts.join("\n");
 		throw new Error("Missing required parameter: query");
 	}
+	// Build request body - pass through all args, ensure query exists
+	// Use highlights (not full text) to minimize context size sent to LLM
+	// This likely matches what the MCP server at mcp.exa.ai returns (not verified)
 	const requestBody: Record<string, unknown> = {
 		...args,
 		query,
 		contents: {
+			// Use highlights for concise, query-relevant snippets (much smaller than full text)
+			highlights: {
+				numSentences: 3,
+				highlightsPerUrl: 2,
+			},
+			// Also get limited text as fallback if highlights are empty
+			text: {
+				maxCharacters: 500,
+			},
 		},
 	};