Spaces:
Running
Running
| """Build the final context string fed to the LLM from retrieved chunks.""" | |
| from __future__ import annotations | |
| from rag_engine.utils.logger import get_logger | |
| logger = get_logger(__name__) | |
| _TOKEN_MULTIPLIER = 1.3 # rough word → token ratio | |
| class ContextBuilder: | |
| """Assemble a formatted context block from scored retrieval results.""" | |
| def build(self, results: list[dict], max_tokens: int = 3000) -> str: | |
| """Format *results* into a single context string, respecting *max_tokens*.""" | |
| parts: list[str] = [] | |
| token_estimate = 0.0 | |
| used = 0 | |
| for i, result in enumerate(results): | |
| metadata = result.get("metadata", {}) | |
| score = result.get("rerank_score", result.get("score", 0)) | |
| content = result.get("content", "") | |
| block = ( | |
| f"--- Source {i + 1} ---\n" | |
| f"Section: {metadata.get('section_name', 'Unknown')}\n" | |
| f"Clause Type: {metadata.get('clause_type', 'Unknown')}\n" | |
| f"Relevance: {score:.3f}\n\n" | |
| f"{content}\n" | |
| ) | |
| block_tokens = len(block.split()) * _TOKEN_MULTIPLIER | |
| if token_estimate + block_tokens > max_tokens and used > 0: | |
| break | |
| parts.append(block) | |
| token_estimate += block_tokens | |
| used += 1 | |
| context = "\n".join(parts) | |
| logger.info( | |
| "Context built: %d/%d chunks, ~%d tokens", | |
| used, | |
| len(results), | |
| int(token_estimate), | |
| ) | |
| return context | |