Spaces:
Sleeping
Sleeping
Update rag.py
Browse files
rag.py
CHANGED
|
@@ -16,11 +16,19 @@ from llama_index.core.agent import ReActAgent
|
|
| 16 |
from chromadb import PersistentClient
|
| 17 |
|
| 18 |
# writable cache directories
|
| 19 |
-
|
| 20 |
-
os.
|
| 21 |
-
|
|
|
|
| 22 |
|
| 23 |
-
os.makedirs(
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 24 |
|
| 25 |
@st.cache_resource
|
| 26 |
def setup_rag_system(debug=False):
|
|
@@ -40,7 +48,11 @@ def setup_rag_system(debug=False):
|
|
| 40 |
)
|
| 41 |
|
| 42 |
# Embeddings
|
| 43 |
-
embedding_model = HuggingFaceEmbedding(
|
|
|
|
|
|
|
|
|
|
|
|
|
| 44 |
|
| 45 |
# Persisted vector DBs
|
| 46 |
persist_dirs = [
|
|
@@ -80,7 +92,7 @@ def setup_rag_system(debug=False):
|
|
| 80 |
hybrid_retriever = RecursiveRetriever(
|
| 81 |
"vector",
|
| 82 |
retriever_dict={"vector": vector_retriever, "bm25": bm25_retriever},
|
| 83 |
-
verbose=
|
| 84 |
)
|
| 85 |
hybrid_retrievers.append(hybrid_retriever)
|
| 86 |
|
|
@@ -166,7 +178,7 @@ def setup_rag_system(debug=False):
|
|
| 166 |
agent = ReActAgent(
|
| 167 |
tools=retriever_tools,
|
| 168 |
llm=llm,
|
| 169 |
-
verbose=
|
| 170 |
max_iterations=20,
|
| 171 |
system_prompt=system_prompt
|
| 172 |
)
|
|
|
|
| 16 |
from chromadb import PersistentClient
|
| 17 |
|
| 18 |
# writable cache directories
|
| 19 |
+
# Fixed locations under /app used for model caches, the vector store and
# Streamlit's config directory.
CACHE_DIR = "/app/.cache"
HUGGINGFACE_CACHE = os.path.join(CACHE_DIR, "huggingface")
VECTORDb_DIR = "/app/vectordb"
STREAMLIT_CONFIG = "/app/.streamlit"

# Create every directory up front; exist_ok=True keeps repeated runs from
# failing when a directory is already present.
for _writable_dir in (HUGGINGFACE_CACHE, VECTORDb_DIR, STREAMLIT_CONFIG):
    os.makedirs(_writable_dir, exist_ok=True)
del _writable_dir  # keep the module namespace free of the loop variable

# Point the cache-related environment variables at the locations above.
# NOTE(review): these are assigned after the module's imports have run, so a
# library that reads them at import time may not see the values - confirm.
# NOTE(review): verify that Streamlit actually honors STREAMLIT_HOME.
os.environ.update(
    {
        "TRANSFORMERS_CACHE": CACHE_DIR,
        "HF_HOME": CACHE_DIR,
        "XDG_CACHE_HOME": CACHE_DIR,
        "STREAMLIT_HOME": STREAMLIT_CONFIG,
    }
)
|
| 32 |
|
| 33 |
@st.cache_resource
|
| 34 |
def setup_rag_system(debug=False):
|
|
|
|
| 48 |
)
|
| 49 |
|
| 50 |
# Embeddings
|
| 51 |
+
embedding_model = HuggingFaceEmbedding(
|
| 52 |
+
model_name="sentence-transformers/all-MiniLM-L6-v2",
|
| 53 |
+
cache_folder=HUGGINGFACE_CACHE
|
| 54 |
+
)
|
| 55 |
+
|
| 56 |
|
| 57 |
# Persisted vector DBs
|
| 58 |
persist_dirs = [
|
|
|
|
| 92 |
hybrid_retriever = RecursiveRetriever(
|
| 93 |
"vector",
|
| 94 |
retriever_dict={"vector": vector_retriever, "bm25": bm25_retriever},
|
| 95 |
+
verbose=False
|
| 96 |
)
|
| 97 |
hybrid_retrievers.append(hybrid_retriever)
|
| 98 |
|
|
|
|
| 178 |
agent = ReActAgent(
|
| 179 |
tools=retriever_tools,
|
| 180 |
llm=llm,
|
| 181 |
+
verbose=False,
|
| 182 |
max_iterations=20,
|
| 183 |
system_prompt=system_prompt
|
| 184 |
)
|