Spaces:
Running
Running
Update src/Algorithms/vector_search.py
Browse files
src/Algorithms/vector_search.py
CHANGED
|
@@ -1,17 +1,22 @@
|
|
| 1 |
"""
|
| 2 |
-
MODULE: VECTOR SEARCH ENGINE (OG-RAG
|
| 3 |
-
===========================================
|
|
|
|
| 4 |
"""
|
| 5 |
import faiss
|
| 6 |
import numpy as np
|
| 7 |
from sentence_transformers import SentenceTransformer
|
|
|
|
| 8 |
|
| 9 |
class SemanticIndex:
|
| 10 |
def __init__(self, model_name='all-MiniLM-L6-v2'):
|
|
|
|
|
|
|
| 11 |
self.model = SentenceTransformer(model_name)
|
| 12 |
self.index = None
|
| 13 |
self.uris = []
|
| 14 |
-
self.content_map = {}
|
|
|
|
| 15 |
|
| 16 |
def build_from_ontology_blocks(self, blocks):
|
| 17 |
"""Vectorise les Hyper-blocs enrichis"""
|
|
@@ -20,6 +25,7 @@ class SemanticIndex:
|
|
| 20 |
corpus = [b['text'] for b in blocks]
|
| 21 |
self.uris = [b['uri'] for b in blocks]
|
| 22 |
self.content_map = {b['uri']: b['text'] for b in blocks}
|
|
|
|
| 23 |
|
| 24 |
embeddings = self.model.encode(corpus, show_progress_bar=True)
|
| 25 |
dimension = embeddings.shape[1]
|
|
@@ -28,18 +34,24 @@ class SemanticIndex:
|
|
| 28 |
|
| 29 |
print("✅ [VECTOR] Index OG-RAG prêt.")
|
| 30 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 31 |
def search(self, query, top_k=3):
|
| 32 |
if not self.index: return []
|
| 33 |
query_vec = self.model.encode([query]).astype('float32')
|
| 34 |
dist, indices = self.index.search(query_vec, top_k)
|
| 35 |
|
| 36 |
results = []
|
| 37 |
-
for idx in indices[0]:
|
| 38 |
if idx != -1:
|
| 39 |
uri = self.uris[idx]
|
| 40 |
results.append({
|
| 41 |
"uri": uri,
|
| 42 |
-
"text": self.content_map
|
| 43 |
-
"
|
|
|
|
| 44 |
})
|
| 45 |
return results
|
|
|
|
| 1 |
"""
|
| 2 |
+
MODULE: VECTOR SEARCH ENGINE (OG-RAG FIXED)
|
| 3 |
+
===========================================
|
| 4 |
+
Correction : Ajout de la gestion des métadonnées (meta_map) pour éviter le KeyError.
|
| 5 |
"""
|
| 6 |
import faiss
|
| 7 |
import numpy as np
|
| 8 |
from sentence_transformers import SentenceTransformer
|
| 9 |
+
import os
|
| 10 |
|
| 11 |
class SemanticIndex:
|
| 12 |
def __init__(self, model_name='all-MiniLM-L6-v2'):
    """Load the sentence-embedding model and reset all index state.

    Args:
        model_name: SentenceTransformer model identifier
            (defaults to the lightweight 'all-MiniLM-L6-v2').
    """
    # Suppress the Hugging Face Hub symlink warning some platforms emit
    # while the model cache is populated (set before the model loads).
    os.environ['HF_HUB_DISABLE_SYMLINKS_WARNING'] = '1'
    self.model = SentenceTransformer(model_name)

    # The FAISS index is built lazily by build_from_ontology_blocks().
    self.index = None

    # Parallel lookup structures, all keyed/ordered by block URI.
    self.meta_map = {}      # URI -> metadata dict (avoids KeyError in search)
    self.content_map = {}   # URI -> raw block text
    self.uris = []          # FAISS row position -> URI
|
| 20 |
|
| 21 |
def build_from_ontology_blocks(self, blocks):
|
| 22 |
"""Vectorise les Hyper-blocs enrichis"""
|
|
|
|
| 25 |
corpus = [b['text'] for b in blocks]
|
| 26 |
self.uris = [b['uri'] for b in blocks]
|
| 27 |
self.content_map = {b['uri']: b['text'] for b in blocks}
|
| 28 |
+
self.meta_map = {b['uri']: b['metadata'] for b in blocks} # <--- ON STOCKE LES METAS
|
| 29 |
|
| 30 |
embeddings = self.model.encode(corpus, show_progress_bar=True)
|
| 31 |
dimension = embeddings.shape[1]
|
|
|
|
| 34 |
|
| 35 |
print("✅ [VECTOR] Index OG-RAG prêt.")
|
| 36 |
|
| 37 |
+
def build_from_networkx(self, G):
    """Backward-compatibility entry point for Phase 1 graph input.

    Intentionally a no-op: kept so legacy callers passing a NetworkX
    graph do not break. Always returns None.
    """
    # A simplified fallback implementation could go here if ever needed.
    return None
|
| 41 |
+
|
| 42 |
def search(self, query, top_k=3):
    """Return the top_k indexed blocks most similar to *query*.

    Args:
        query: Free-text query string.
        top_k: Maximum number of hits to return (default 3).

    Returns:
        List of dicts with keys "uri", "text", "meta" and "score"
        (L2 distance from FAISS — lower is more similar). Empty list
        when the index has not been built yet.
    """
    # Explicit None check (PEP 8): self.index is either None or a built
    # FAISS index; relying on object truthiness here is fragile.
    if self.index is None:
        return []

    query_vec = self.model.encode([query]).astype('float32')
    dist, indices = self.index.search(query_vec, top_k)

    results = []
    for i, idx in enumerate(indices[0]):
        # FAISS pads the result row with -1 when fewer than top_k
        # vectors exist in the index — skip those slots.
        if idx != -1:
            uri = self.uris[idx]
            results.append({
                "uri": uri,
                "text": self.content_map.get(uri, ""),
                "meta": self.meta_map.get(uri, {"type": "Unknown", "label": "?"}),
                "score": float(dist[0][i])
            })
    return results
|