Spaces:
Running
Running
fahmiaziz98
committed on
Commit
·
fb8f5fc
1
Parent(s):
9958d9a
[DEBUG]
Browse files
- src/api/routers/rerank.py +36 -21
- src/models/embeddings/rank.py +74 -34
src/api/routers/rerank.py
CHANGED
|
@@ -80,37 +80,52 @@ async def rerank_documents(
|
|
| 80 |
detail=f"Model '{request.model_id}' is not a rerank model. Type: {config.type}",
|
| 81 |
)
|
| 82 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 83 |
start = time.time()
|
| 84 |
|
| 85 |
-
#
|
| 86 |
-
|
|
|
|
|
|
|
|
|
|
| 87 |
query=request.query,
|
| 88 |
-
documents=
|
| 89 |
top_k=request.top_k,
|
| 90 |
**kwargs,
|
| 91 |
)
|
| 92 |
|
| 93 |
processing_time = time.time() - start
|
| 94 |
|
| 95 |
-
#
|
| 96 |
-
logger.debug(f"
|
| 97 |
-
|
| 98 |
-
|
| 99 |
-
logger.debug(f"Top K: {request.top_k}")
|
| 100 |
|
| 101 |
-
#
|
| 102 |
-
|
| 103 |
-
logger.debug(f"Sample scores: {scores[:5] if scores else 'None'}")
|
| 104 |
-
|
| 105 |
-
# Build results with original indices
|
| 106 |
-
original_indices, documents_list = zip(*valid_docs)
|
| 107 |
results = []
|
| 108 |
-
|
| 109 |
-
for
|
| 110 |
-
|
| 111 |
-
|
| 112 |
-
|
| 113 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 114 |
|
| 115 |
logger.info(
|
| 116 |
f"Reranked {len(results)} documents in {processing_time:.3f}s "
|
|
@@ -135,4 +150,4 @@ async def rerank_documents(
|
|
| 135 |
raise HTTPException(
|
| 136 |
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
|
| 137 |
detail=f"Failed to rerank documents: {str(e)}",
|
| 138 |
-
)
|
|
|
|
| 80 |
detail=f"Model '{request.model_id}' is not a rerank model. Type: {config.type}",
|
| 81 |
)
|
| 82 |
|
| 83 |
+
# Debug logs BEFORE calling rank_document
|
| 84 |
+
logger.debug(f"Rerank request - Query: '{request.query}'")
|
| 85 |
+
logger.debug(f"Documents to rank: {len(valid_docs)}")
|
| 86 |
+
if valid_docs:
|
| 87 |
+
logger.debug(f"First document: {valid_docs[0][1][:100]}...")
|
| 88 |
+
logger.debug(f"Top K: {request.top_k}")
|
| 89 |
+
|
| 90 |
start = time.time()
|
| 91 |
|
| 92 |
+
# Extract documents for ranking
|
| 93 |
+
documents_list = [doc for _, doc in valid_docs]
|
| 94 |
+
|
| 95 |
+
# Call rank_document - returns only top_k results
|
| 96 |
+
ranking_results = model.rank_document(
|
| 97 |
query=request.query,
|
| 98 |
+
documents=documents_list,
|
| 99 |
top_k=request.top_k,
|
| 100 |
**kwargs,
|
| 101 |
)
|
| 102 |
|
| 103 |
processing_time = time.time() - start
|
| 104 |
|
| 105 |
+
# Debug logs AFTER rank_document
|
| 106 |
+
logger.debug(f"Ranking returned {len(ranking_results)} results")
|
| 107 |
+
if ranking_results:
|
| 108 |
+
logger.debug(f"Top result score: {ranking_results[0]}")
|
|
|
|
| 109 |
|
| 110 |
+
# Build results from ranking_results
|
| 111 |
+
# ranking_results already contains top_k items with scores
|
|
|
|
|
|
|
|
|
|
|
|
|
| 112 |
results = []
|
| 113 |
+
|
| 114 |
+
for rank_result in ranking_results:
|
| 115 |
+
# Get original index from valid_docs
|
| 116 |
+
doc_idx = rank_result.get('corpus_id', 0) # Index in filtered list
|
| 117 |
+
if doc_idx < len(valid_docs):
|
| 118 |
+
original_idx = valid_docs[doc_idx][0] # Original index
|
| 119 |
+
doc_text = documents_list[doc_idx]
|
| 120 |
+
score = rank_result['score']
|
| 121 |
+
|
| 122 |
+
results.append(
|
| 123 |
+
RerankResult(
|
| 124 |
+
text=doc_text,
|
| 125 |
+
score=score,
|
| 126 |
+
index=original_idx
|
| 127 |
+
)
|
| 128 |
+
)
|
| 129 |
|
| 130 |
logger.info(
|
| 131 |
f"Reranked {len(results)} documents in {processing_time:.3f}s "
|
|
|
|
| 150 |
raise HTTPException(
|
| 151 |
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
|
| 152 |
detail=f"Failed to rerank documents: {str(e)}",
|
| 153 |
+
)
|
src/models/embeddings/rank.py
CHANGED
|
@@ -5,7 +5,7 @@ This module provides the RerankModel class for reranking
|
|
| 5 |
documents using sentence-transformers.
|
| 6 |
"""
|
| 7 |
|
| 8 |
-
from typing import List, Optional
|
| 9 |
from sentence_transformers import CrossEncoder
|
| 10 |
from loguru import logger
|
| 11 |
|
|
@@ -18,18 +18,18 @@ class RerankModel:
|
|
| 18 |
"""
|
| 19 |
Cross-encoder model wrapper using sentence-transformers.
|
| 20 |
|
| 21 |
-
This class wraps sentence-transformers
|
| 22 |
-
|
| 23 |
|
| 24 |
Attributes:
|
| 25 |
config: ModelConfig instance
|
| 26 |
-
model:
|
| 27 |
_loaded: Flag indicating if the model is loaded
|
| 28 |
"""
|
| 29 |
|
| 30 |
def __init__(self, config: ModelConfig):
|
| 31 |
"""
|
| 32 |
-
Initialize the
|
| 33 |
|
| 34 |
Args:
|
| 35 |
config: ModelConfig instance with model configuration
|
|
@@ -48,6 +48,7 @@ class RerankModel:
|
|
| 48 |
"""
|
| 49 |
if self._loaded:
|
| 50 |
logger.debug(f"Model {self.model_id} already loaded")
|
|
|
|
| 51 |
|
| 52 |
logger.info(f"Loading rerank model: {self.config.name}")
|
| 53 |
|
|
@@ -58,7 +59,7 @@ class RerankModel:
|
|
| 58 |
trust_remote_code=self.settings.TRUST_REMOTE_CODE,
|
| 59 |
)
|
| 60 |
self._loaded = True
|
| 61 |
-
logger.success(f"✓ Loaded
|
| 62 |
|
| 63 |
except Exception as e:
|
| 64 |
error_msg = f"Failed to load model: {str(e)}"
|
|
@@ -93,28 +94,44 @@ class RerankModel:
|
|
| 93 |
documents: List[str],
|
| 94 |
top_k: int,
|
| 95 |
**kwargs,
|
| 96 |
-
) -> List[
|
| 97 |
"""
|
| 98 |
Rerank documents using the CrossEncoder model.
|
| 99 |
|
| 100 |
Args:
|
| 101 |
query (str): The search query string.
|
| 102 |
documents (List[str]): List of documents to be reranked.
|
| 103 |
-
top_k (int): top
|
| 104 |
-
**kwargs
|
| 105 |
|
| 106 |
Returns:
|
| 107 |
-
List[
|
|
|
|
| 108 |
|
| 109 |
-
Raises
|
| 110 |
-
|
| 111 |
"""
|
| 112 |
if not self._loaded or self.model is None:
|
| 113 |
self.load()
|
|
|
|
| 114 |
try:
|
| 115 |
-
|
| 116 |
-
|
| 117 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 118 |
|
| 119 |
except Exception as e:
|
| 120 |
error_msg = f"Reranking documents failed: {str(e)}"
|
|
@@ -122,34 +139,57 @@ class RerankModel:
|
|
| 122 |
raise RerankingDocumentError(self.model_id, error_msg)
|
| 123 |
|
| 124 |
def _normalize_rerank_scores(
|
| 125 |
-
self,
|
| 126 |
-
|
|
|
|
|
|
|
| 127 |
"""
|
| 128 |
-
Normalize reranking scores
|
| 129 |
|
| 130 |
Args:
|
| 131 |
-
rankings: List of ranking dictionaries
|
| 132 |
-
|
|
|
|
| 133 |
|
| 134 |
Returns:
|
| 135 |
-
List
|
| 136 |
"""
|
|
|
|
|
|
|
|
|
|
|
|
|
| 137 |
raw_scores = [ranking["score"] for ranking in rankings]
|
| 138 |
-
|
| 139 |
-
# Min-Max normalization
|
| 140 |
min_score = min(raw_scores)
|
| 141 |
max_score = max(raw_scores)
|
| 142 |
-
|
|
|
|
| 143 |
if max_score == min_score:
|
| 144 |
-
return [
|
| 145 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 146 |
target_min, target_max = target_range
|
| 147 |
-
|
| 148 |
-
|
| 149 |
-
|
| 150 |
-
|
| 151 |
-
|
| 152 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 153 |
|
| 154 |
@property
|
| 155 |
def is_loaded(self) -> bool:
|
|
@@ -177,7 +217,7 @@ class RerankModel:
|
|
| 177 |
Get the model type.
|
| 178 |
|
| 179 |
Returns:
|
| 180 |
-
Model type ('
|
| 181 |
"""
|
| 182 |
return self.config.type
|
| 183 |
|
|
@@ -188,4 +228,4 @@ class RerankModel:
|
|
| 188 |
f"id={self.model_id}, "
|
| 189 |
f"type={self.model_type}, "
|
| 190 |
f"loaded={self.is_loaded})"
|
| 191 |
-
)
|
|
|
|
| 5 |
documents using sentence-transformers.
|
| 6 |
"""
|
| 7 |
|
| 8 |
+
from typing import List, Optional, Dict
|
| 9 |
from sentence_transformers import CrossEncoder
|
| 10 |
from loguru import logger
|
| 11 |
|
|
|
|
| 18 |
"""
|
| 19 |
Cross-encoder model wrapper using sentence-transformers.
|
| 20 |
|
| 21 |
+
This class wraps sentence-transformers CrossEncoder models
|
| 22 |
+
for ranking documents
|
| 23 |
|
| 24 |
Attributes:
|
| 25 |
config: ModelConfig instance
|
| 26 |
+
model: CrossEncoder instance
|
| 27 |
_loaded: Flag indicating if the model is loaded
|
| 28 |
"""
|
| 29 |
|
| 30 |
def __init__(self, config: ModelConfig):
|
| 31 |
"""
|
| 32 |
+
Initialize the rerank model.
|
| 33 |
|
| 34 |
Args:
|
| 35 |
config: ModelConfig instance with model configuration
|
|
|
|
| 48 |
"""
|
| 49 |
if self._loaded:
|
| 50 |
logger.debug(f"Model {self.model_id} already loaded")
|
| 51 |
+
return
|
| 52 |
|
| 53 |
logger.info(f"Loading rerank model: {self.config.name}")
|
| 54 |
|
|
|
|
| 59 |
trust_remote_code=self.settings.TRUST_REMOTE_CODE,
|
| 60 |
)
|
| 61 |
self._loaded = True
|
| 62 |
+
logger.success(f"✓ Loaded rerank model: {self.model_id}")
|
| 63 |
|
| 64 |
except Exception as e:
|
| 65 |
error_msg = f"Failed to load model: {str(e)}"
|
|
|
|
| 94 |
documents: List[str],
|
| 95 |
top_k: int,
|
| 96 |
**kwargs,
|
| 97 |
+
) -> List[Dict]:
|
| 98 |
"""
|
| 99 |
Rerank documents using the CrossEncoder model.
|
| 100 |
|
| 101 |
Args:
|
| 102 |
query (str): The search query string.
|
| 103 |
documents (List[str]): List of documents to be reranked.
|
| 104 |
+
top_k (int): Number of top documents to return
|
| 105 |
+
**kwargs: Additional arguments passed to model.rank()
|
| 106 |
|
| 107 |
Returns:
|
| 108 |
+
List[Dict]: List of ranking results with 'corpus_id' and 'score'.
|
| 109 |
+
Returns top_k results sorted by score (highest first).
|
| 110 |
|
| 111 |
+
Raises:
|
| 112 |
+
RerankingDocumentError: If reranking fails.
|
| 113 |
"""
|
| 114 |
if not self._loaded or self.model is None:
|
| 115 |
self.load()
|
| 116 |
+
|
| 117 |
try:
|
| 118 |
+
# model.rank returns List[Dict] with 'corpus_id' and 'score'
|
| 119 |
+
# Already sorted by score (highest first) and limited to top_k
|
| 120 |
+
ranking_results = self.model.rank(
|
| 121 |
+
query,
|
| 122 |
+
documents,
|
| 123 |
+
top_k=top_k,
|
| 124 |
+
**kwargs
|
| 125 |
+
)
|
| 126 |
+
|
| 127 |
+
# Normalize scores to 0-1 range for consistency
|
| 128 |
+
normalized_results = self._normalize_rerank_scores(ranking_results)
|
| 129 |
+
|
| 130 |
+
logger.debug(
|
| 131 |
+
f"Reranked {len(documents)} docs, returned top {len(normalized_results)}"
|
| 132 |
+
)
|
| 133 |
+
|
| 134 |
+
return normalized_results
|
| 135 |
|
| 136 |
except Exception as e:
|
| 137 |
error_msg = f"Reranking documents failed: {str(e)}"
|
|
|
|
| 139 |
raise RerankingDocumentError(self.model_id, error_msg)
|
| 140 |
|
| 141 |
def _normalize_rerank_scores(
|
| 142 |
+
self,
|
| 143 |
+
rankings: List[Dict],
|
| 144 |
+
target_range: tuple = (0, 1)
|
| 145 |
+
) -> List[Dict]:
|
| 146 |
"""
|
| 147 |
+
Normalize reranking scores using min-max normalization.
|
| 148 |
|
| 149 |
Args:
|
| 150 |
+
rankings: List of ranking dictionaries from cross-encoder
|
| 151 |
+
Format: [{'corpus_id': int, 'score': float}, ...]
|
| 152 |
+
target_range: Target range for normalization (min, max)
|
| 153 |
|
| 154 |
Returns:
|
| 155 |
+
List[Dict]: Rankings with normalized scores
|
| 156 |
"""
|
| 157 |
+
if not rankings:
|
| 158 |
+
return []
|
| 159 |
+
|
| 160 |
+
# Extract raw scores
|
| 161 |
raw_scores = [ranking["score"] for ranking in rankings]
|
| 162 |
+
|
| 163 |
+
# Min-Max normalization
|
| 164 |
min_score = min(raw_scores)
|
| 165 |
max_score = max(raw_scores)
|
| 166 |
+
|
| 167 |
+
# If all scores are the same, return max target value
|
| 168 |
if max_score == min_score:
|
| 169 |
+
return [
|
| 170 |
+
{
|
| 171 |
+
"corpus_id": r["corpus_id"],
|
| 172 |
+
"score": target_range[1]
|
| 173 |
+
}
|
| 174 |
+
for r in rankings
|
| 175 |
+
]
|
| 176 |
+
|
| 177 |
+
# Normalize to target range
|
| 178 |
target_min, target_max = target_range
|
| 179 |
+
normalized_rankings = []
|
| 180 |
+
|
| 181 |
+
for ranking in rankings:
|
| 182 |
+
score = ranking["score"]
|
| 183 |
+
normalized_score = (
|
| 184 |
+
target_min +
|
| 185 |
+
(score - min_score) * (target_max - target_min) / (max_score - min_score)
|
| 186 |
+
)
|
| 187 |
+
normalized_rankings.append({
|
| 188 |
+
"corpus_id": ranking["corpus_id"],
|
| 189 |
+
"score": float(normalized_score)
|
| 190 |
+
})
|
| 191 |
+
|
| 192 |
+
return normalized_rankings
|
| 193 |
|
| 194 |
@property
|
| 195 |
def is_loaded(self) -> bool:
|
|
|
|
| 217 |
Get the model type.
|
| 218 |
|
| 219 |
Returns:
|
| 220 |
+
Model type ('rerank')
|
| 221 |
"""
|
| 222 |
return self.config.type
|
| 223 |
|
|
|
|
| 228 |
f"id={self.model_id}, "
|
| 229 |
f"type={self.model_type}, "
|
| 230 |
f"loaded={self.is_loaded})"
|
| 231 |
+
)
|