Spaces:

rishadaz
/

amazon_retriever

Sleeping

App Files Community

github-actions[bot] committed on Apr 22

Commit

2ef07e4

1 Parent(s): 05b9d1b

chore: sync app/ and src/ from GitHub

Browse files

Files changed (2) hide show

app/app.py +10 -8
src/semantic.py +18 -15

app/app.py CHANGED Viewed

@@ -55,15 +55,17 @@ def load_vector_store_cached():
     login(token=HF_TOKEN, add_to_git_credential=False)
     VECTOR_STORE_DIR.mkdir(parents=True, exist_ok=True)
-    snapshot_path = snapshot_download(
-        repo_id="rishadaz/amazon_retriever-storage",
-        repo_type="dataset",
-        local_dir=str(VECTOR_STORE_DIR),
-        split='full',
-        token=HF_TOKEN,
-    )
-    mini_index_path = Path(snapshot_path) / "tokenisation" / "bm25_index_mini.pkl"
     embeddings_dir  = Path(snapshot_path) / "embeddings"
     vector_store    = load_vector_store(embeddings_dir)

     login(token=HF_TOKEN, add_to_git_credential=False)
     VECTOR_STORE_DIR.mkdir(parents=True, exist_ok=True)
+    if not any(VECTOR_STORE_DIR.iterdir()):
+        snapshot_path = Path(snapshot_download(
+            repo_id="rishadaz/amazon_retriever-storage",
+            repo_type="dataset",
+            local_dir=str(VECTOR_STORE_DIR),
+            token=HF_TOKEN,
+        ))
+    else:
+        snapshot_path = VECTOR_STORE_DIR
+    mini_index_path = Path(snapshot_path) / "tokenisation" / "bm25_index.pkl"
     embeddings_dir  = Path(snapshot_path) / "embeddings"
     vector_store    = load_vector_store(embeddings_dir)

src/semantic.py CHANGED Viewed

@@ -17,6 +17,7 @@ Typical usage
 import logging
 from typing import Any
 import torch
 import json, os, sys
@@ -45,17 +46,19 @@ DEFAULT_TOP_REVIEWS = 5
 DEFAULT_TOP_K = 5
 DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
-EMBEDDINGS = HuggingFaceEmbeddings(
-    model_name=DEFAULT_EMBEDDING_MODEL,
-    model_kwargs={
-        "device": DEVICE,
-        "model_kwargs": {"torch_dtype": torch.float16},
-    },
-    encode_kwargs={
-        "batch_size": 128 if DEVICE == 'cpu' else 512,
-        "normalize_embeddings": True,
-    },
-)
 # ---------------------------------------------------------------------------
 # Document construction
@@ -178,11 +181,11 @@ def build_vector_store(
     # --- Create new store if needed ---
     if existing_store is None:
-        dim = len(EMBEDDINGS.embed_query("probe"))
         index = faiss.IndexFlatL2(dim)
         vector_store = FAISS(
-            embedding_function=EMBEDDINGS,
             index=index,
             docstore=InMemoryDocstore(),
             index_to_docstore_id={},
@@ -208,7 +211,7 @@ def build_and_save_vector_store(
     # --- Resume / initialize ---
     if os.path.exists(os.path.join(save_path, "index.faiss")):
         vector_store = FAISS.load_local(
-            save_path, EMBEDDINGS, allow_dangerous_deserialization=True
         )
         already_indexed = set(vector_store.index_to_docstore_id.values())
         print(f"Resuming — {len(already_indexed)} docs already indexed.")
@@ -297,6 +300,6 @@ def load_vector_store(
     return FAISS.load_local(
         load_path,
-        embeddings=EMBEDDINGS,
         allow_dangerous_deserialization=True,
     )

 import logging
 from typing import Any
+import streamlit as st
 import torch
 import json, os, sys
 DEFAULT_TOP_K = 5
 DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
+@st.cache_resource(show_spinner=False)
+def get_embeddings():
+    return HuggingFaceEmbeddings(
+        model_name=DEFAULT_EMBEDDING_MODEL,
+        model_kwargs={
+            "device": DEVICE,
+            "model_kwargs": {"torch_dtype": torch.float16},
+        },
+        encode_kwargs={
+            "batch_size": 128 if DEVICE == "cpu" else 512,
+            "normalize_embeddings": True,
+        },
+    )
 # ---------------------------------------------------------------------------
 # Document construction
     # --- Create new store if needed ---
     if existing_store is None:
+        dim = len(get_embeddings().embed_query("probe"))
         index = faiss.IndexFlatL2(dim)
         vector_store = FAISS(
+            embedding_function=get_embeddings(),
             index=index,
             docstore=InMemoryDocstore(),
             index_to_docstore_id={},
     # --- Resume / initialize ---
     if os.path.exists(os.path.join(save_path, "index.faiss")):
         vector_store = FAISS.load_local(
+            save_path, get_embeddings(), allow_dangerous_deserialization=True
         )
         already_indexed = set(vector_store.index_to_docstore_id.values())
         print(f"Resuming — {len(already_indexed)} docs already indexed.")
     return FAISS.load_local(
         load_path,
+        embeddings=get_embeddings(),
         allow_dangerous_deserialization=True,
     )