Spaces:

projectsorg
/

digital-twin-backend

Sleeping

AlexKurian committed on Jan 16

Commit

a2f12e1

1 Parent(s): d7b3396

Disable RAG model download for instant startup (Light Mode)

Files changed (1) hide show

policy_engine.py CHANGED Viewed

@@ -77,41 +77,28 @@ class PolicyEngine:
     def __init__(self):
         """Initialize FAISS index and LLM."""
-        from huggingface_hub import snapshot_download
-        print(f"Initializing PolicyEngine with model: {config.EMBEDDINGS_MODEL}")
-        # Robust download with retries
-        try:
-            snapshot_download(
-                repo_id=config.EMBEDDINGS_MODEL,
-                resume_download=True,
-                etag_timeout=60,
-                ignore_patterns=["*.onnx", "*.tflite", "*.ot", "*.h5", "*.msgpack", "*.safetensors"]
-            )
-        except Exception as e:
-             print(f"Standard download failed, retrying without hf_transfer: {e}")
-             os.environ["HF_HUB_ENABLE_HF_TRANSFER"] = "0"
-             # Fallback
-             pass
-        self.embeddings = HuggingFaceEmbeddings(
-            model_name=config.EMBEDDINGS_MODEL,
-            model_kwargs={'device': 'cpu'},
-            encode_kwargs={'normalize_embeddings': True}
-        )
-        try:
-            self.db = FAISS.load_local(
-                str(config.FAISS_INDEX_PATH),
-                self.embeddings,
-                allow_dangerous_deserialization=True
-            )
-        except Exception as e:
-            print(f"Warning: FAISS index not found at {config.FAISS_INDEX_PATH}")
-            print(f"Error: {e}")
-            self.db = None
         self.llm = ChatGroq(
             model=config.LLM_MODEL,
             temperature=0.5,

     def __init__(self):
         """Initialize FAISS index and LLM."""
+        # SKIP EMBEDDINGS DOWNLOAD: "Can we not do it at all?"
+        # User requested instant startup without RAG.
+        # -----------------------------------------------------------------
+        # from huggingface_hub import snapshot_download
+        print("\n[INFO] RAG/Embeddings initialization SKIPPED by configuration.")
+        print("[INFO] Policy Engine running in 'Direct Query' mode (LLM only).")
+        self.embeddings = None
+        self.db = None
+        # -----------------------------------------------------------------
+        # Original logic commented out to prevent 400MB+ download on Spaces:
+        #
+        # print(f"Initializing PolicyEngine with model: {config.EMBEDDINGS_MODEL}")
+        # try:
+        #     snapshot_download(...)
+        # except Exception: ...
+        # self.embeddings = HuggingFaceEmbeddings(...)
+        # self.db = FAISS.load_local(...)
+        # -----------------------------------------------------------------
         self.llm = ChatGroq(
             model=config.LLM_MODEL,
             temperature=0.5,