Spaces:

devjhawar
/

policylens-rag-api

Running

DEVJHAWAR11

sync: deploy to HuggingFace Space

5b7955a 2 months ago

1.58 kB

	"""Build the final context string fed to the LLM from retrieved chunks."""

	from __future__ import annotations

	from rag_engine.utils.logger import get_logger

	logger = get_logger(__name__)

	_TOKEN_MULTIPLIER = 1.3 # rough word → token ratio


	class ContextBuilder:
	"""Assemble a formatted context block from scored retrieval results."""

	def build(self, results: list[dict], max_tokens: int = 3000) -> str:
	"""Format results into a single context string, respecting max_tokens."""
	parts: list[str] = []
	token_estimate = 0.0
	used = 0

	for i, result in enumerate(results):
	metadata = result.get("metadata", {})
	score = result.get("rerank_score", result.get("score", 0))
	content = result.get("content", "")

	block = (
	f"--- Source {i + 1} ---\n"
	f"Section: {metadata.get('section_name', 'Unknown')}\n"
	f"Clause Type: {metadata.get('clause_type', 'Unknown')}\n"
	f"Relevance: {score:.3f}\n\n"
	f"{content}\n"
	)

	block_tokens = len(block.split()) * _TOKEN_MULTIPLIER
	if token_estimate + block_tokens > max_tokens and used > 0:
	break

	parts.append(block)
	token_estimate += block_tokens
	used += 1

	context = "\n".join(parts)
	logger.info(
	"Context built: %d/%d chunks, ~%d tokens",
	used,
	len(results),
	int(token_estimate),
	)
	return context