Spaces:
Sleeping
Sleeping
Update rag.py
Browse files
rag.py
CHANGED
|
@@ -1,4 +1,5 @@
|
|
| 1 |
import os
|
|
|
|
| 2 |
import streamlit as st
|
| 3 |
from dotenv import load_dotenv
|
| 4 |
import pickle
|
|
@@ -15,20 +16,7 @@ from llama_index.core import get_response_synthesizer
|
|
| 15 |
from llama_index.core.agent import ReActAgent
|
| 16 |
from chromadb import PersistentClient
|
| 17 |
|
| 18 |
-
|
| 19 |
-
CACHE_DIR = "/app/.cache"
|
| 20 |
-
HUGGINGFACE_CACHE = os.path.join(CACHE_DIR, "huggingface")
|
| 21 |
-
VECTORDb_DIR = "/app/vectordb"
|
| 22 |
-
STREAMLIT_CONFIG = "/app/.streamlit"
|
| 23 |
-
|
| 24 |
-
os.makedirs(HUGGINGFACE_CACHE, exist_ok=True)
|
| 25 |
-
os.makedirs(VECTORDb_DIR, exist_ok=True)
|
| 26 |
-
os.makedirs(STREAMLIT_CONFIG, exist_ok=True)
|
| 27 |
-
|
| 28 |
-
os.environ["TRANSFORMERS_CACHE"] = CACHE_DIR
|
| 29 |
-
os.environ["HF_HOME"] = CACHE_DIR
|
| 30 |
-
os.environ["XDG_CACHE_HOME"] = CACHE_DIR
|
| 31 |
-
os.environ["STREAMLIT_HOME"] = STREAMLIT_CONFIG
|
| 32 |
|
| 33 |
@st.cache_resource
|
| 34 |
def setup_rag_system(debug=False):
|
|
@@ -48,11 +36,7 @@ def setup_rag_system(debug=False):
|
|
| 48 |
)
|
| 49 |
|
| 50 |
# Embeddings
|
| 51 |
-
embedding_model = HuggingFaceEmbedding(
|
| 52 |
-
model_name="sentence-transformers/all-MiniLM-L6-v2",
|
| 53 |
-
cache_folder=HUGGINGFACE_CACHE
|
| 54 |
-
)
|
| 55 |
-
|
| 56 |
|
| 57 |
# Persisted vector DBs
|
| 58 |
persist_dirs = [
|
|
@@ -92,7 +76,7 @@ def setup_rag_system(debug=False):
|
|
| 92 |
hybrid_retriever = RecursiveRetriever(
|
| 93 |
"vector",
|
| 94 |
retriever_dict={"vector": vector_retriever, "bm25": bm25_retriever},
|
| 95 |
-
verbose=
|
| 96 |
)
|
| 97 |
hybrid_retrievers.append(hybrid_retriever)
|
| 98 |
|
|
@@ -178,11 +162,13 @@ def setup_rag_system(debug=False):
|
|
| 178 |
agent = ReActAgent(
|
| 179 |
tools=retriever_tools,
|
| 180 |
llm=llm,
|
| 181 |
-
verbose=
|
| 182 |
max_iterations=20,
|
| 183 |
system_prompt=system_prompt
|
| 184 |
)
|
| 185 |
|
|
|
|
|
|
|
| 186 |
if debug:
|
| 187 |
return agent, llm, hybrid_retrievers
|
| 188 |
|
|
|
|
| 1 |
import os
|
| 2 |
+
import logging
|
| 3 |
import streamlit as st
|
| 4 |
from dotenv import load_dotenv
|
| 5 |
import pickle
|
|
|
|
| 16 |
from llama_index.core.agent import ReActAgent
|
| 17 |
from chromadb import PersistentClient
|
| 18 |
|
| 19 |
+
logger = logging.getLogger(__name__)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 20 |
|
| 21 |
@st.cache_resource
|
| 22 |
def setup_rag_system(debug=False):
|
|
|
|
| 36 |
)
|
| 37 |
|
| 38 |
# Embeddings
|
| 39 |
+
embedding_model = HuggingFaceEmbedding(model_name="sentence-transformers/all-MiniLM-L6-v2")
|
|
|
|
|
|
|
|
|
|
|
|
|
| 40 |
|
| 41 |
# Persisted vector DBs
|
| 42 |
persist_dirs = [
|
|
|
|
| 76 |
hybrid_retriever = RecursiveRetriever(
|
| 77 |
"vector",
|
| 78 |
retriever_dict={"vector": vector_retriever, "bm25": bm25_retriever},
|
| 79 |
+
verbose=True
|
| 80 |
)
|
| 81 |
hybrid_retrievers.append(hybrid_retriever)
|
| 82 |
|
|
|
|
| 162 |
agent = ReActAgent(
|
| 163 |
tools=retriever_tools,
|
| 164 |
llm=llm,
|
| 165 |
+
verbose=True,
|
| 166 |
max_iterations=20,
|
| 167 |
system_prompt=system_prompt
|
| 168 |
)
|
| 169 |
|
| 170 |
+
logger.info("RAG system setup complete.")
|
| 171 |
+
|
| 172 |
if debug:
|
| 173 |
return agent, llm, hybrid_retrievers
|
| 174 |
|