NimrodDev commited on
Commit
2aa887d
·
1 Parent(s): 286debb

use pre-installed MiniLM (no cache, no internet)

Browse files
Files changed (1) hide show
  1. rag.py +3 -11
rag.py CHANGED
@@ -103,23 +103,15 @@ def get_texts() -> List[str]:
103
  print(f"⚠ Dataset fetch failed: {e} – using empty corpus")
104
  return []
105
 
 
106
  # ------------------------------------------------------------------
107
  @lru_cache(maxsize=1)
108
  def get_vectorstore() -> FAISS:
109
  texts = get_texts()
110
 
111
- # --- FINAL: load local MiniLM (no internet, no cache) -----------------
112
- import os
113
- local_model_path = os.path.abspath(
114
- os.path.join(os.path.dirname(__file__), "st_model")
115
- )
116
-
117
- # force transformers to read local files only
118
- os.environ["TRANSFORMERS_OFFLINE"] = "1"
119
- os.environ["HF_DATASETS_OFFLINE"] = "1"
120
-
121
  from sentence_transformers import SentenceTransformer
122
- model = SentenceTransformer(local_model_path, device="cpu", cache_folder=None)
123
 
124
  from langchain.embeddings import SentenceTransformerEmbeddings
125
  embeddings = SentenceTransformerEmbeddings(model=model)
 
103
  print(f"⚠ Dataset fetch failed: {e} – using empty corpus")
104
  return []
105
 
106
+ # ------------------------------------------------------------------
107
  # ------------------------------------------------------------------
108
  @lru_cache(maxsize=1)
109
  def get_vectorstore() -> FAISS:
110
  texts = get_texts()
111
 
112
+ # --- FINAL: use pre-installed MiniLM (no cache, no internet) ----------
 
 
 
 
 
 
 
 
 
113
  from sentence_transformers import SentenceTransformer
114
+ model = SentenceTransformer("all-MiniLM-L6-v2", device="cpu", cache_folder=None)
115
 
116
  from langchain.embeddings import SentenceTransformerEmbeddings
117
  embeddings = SentenceTransformerEmbeddings(model=model)