NeonSamurai commited on
Commit
3ced916
·
verified ·
1 Parent(s): b2f74d5

Update rag.py

Browse files
Files changed (1) hide show
  1. rag.py +7 -21
rag.py CHANGED
@@ -1,4 +1,5 @@
1
  import os
 
2
  import streamlit as st
3
  from dotenv import load_dotenv
4
  import pickle
@@ -15,20 +16,7 @@ from llama_index.core import get_response_synthesizer
15
  from llama_index.core.agent import ReActAgent
16
  from chromadb import PersistentClient
17
 
18
- # writable cache directories
19
- CACHE_DIR = "/app/.cache"
20
- HUGGINGFACE_CACHE = os.path.join(CACHE_DIR, "huggingface")
21
- VECTORDb_DIR = "/app/vectordb"
22
- STREAMLIT_CONFIG = "/app/.streamlit"
23
-
24
- os.makedirs(HUGGINGFACE_CACHE, exist_ok=True)
25
- os.makedirs(VECTORDb_DIR, exist_ok=True)
26
- os.makedirs(STREAMLIT_CONFIG, exist_ok=True)
27
-
28
- os.environ["TRANSFORMERS_CACHE"] = CACHE_DIR
29
- os.environ["HF_HOME"] = CACHE_DIR
30
- os.environ["XDG_CACHE_HOME"] = CACHE_DIR
31
- os.environ["STREAMLIT_HOME"] = STREAMLIT_CONFIG
32
 
33
  @st.cache_resource
34
  def setup_rag_system(debug=False):
@@ -48,11 +36,7 @@ def setup_rag_system(debug=False):
48
  )
49
 
50
  # Embeddings
51
- embedding_model = HuggingFaceEmbedding(
52
- model_name="sentence-transformers/all-MiniLM-L6-v2",
53
- cache_folder=HUGGINGFACE_CACHE
54
- )
55
-
56
 
57
  # Persisted vector DBs
58
  persist_dirs = [
@@ -92,7 +76,7 @@ def setup_rag_system(debug=False):
92
  hybrid_retriever = RecursiveRetriever(
93
  "vector",
94
  retriever_dict={"vector": vector_retriever, "bm25": bm25_retriever},
95
- verbose=False
96
  )
97
  hybrid_retrievers.append(hybrid_retriever)
98
 
@@ -178,11 +162,13 @@ def setup_rag_system(debug=False):
178
  agent = ReActAgent(
179
  tools=retriever_tools,
180
  llm=llm,
181
- verbose=False,
182
  max_iterations=20,
183
  system_prompt=system_prompt
184
  )
185
 
 
 
186
  if debug:
187
  return agent, llm, hybrid_retrievers
188
 
 
1
  import os
2
+ import logging
3
  import streamlit as st
4
  from dotenv import load_dotenv
5
  import pickle
 
16
  from llama_index.core.agent import ReActAgent
17
  from chromadb import PersistentClient
18
 
19
+ logger = logging.getLogger(__name__)
 
 
 
 
 
 
 
 
 
 
 
 
 
20
 
21
  @st.cache_resource
22
  def setup_rag_system(debug=False):
 
36
  )
37
 
38
  # Embeddings
39
+ embedding_model = HuggingFaceEmbedding(model_name="sentence-transformers/all-MiniLM-L6-v2")
 
 
 
 
40
 
41
  # Persisted vector DBs
42
  persist_dirs = [
 
76
  hybrid_retriever = RecursiveRetriever(
77
  "vector",
78
  retriever_dict={"vector": vector_retriever, "bm25": bm25_retriever},
79
+ verbose=True
80
  )
81
  hybrid_retrievers.append(hybrid_retriever)
82
 
 
162
  agent = ReActAgent(
163
  tools=retriever_tools,
164
  llm=llm,
165
+ verbose=True,
166
  max_iterations=20,
167
  system_prompt=system_prompt
168
  )
169
 
170
+ logger.info("RAG system setup complete.")
171
+
172
  if debug:
173
  return agent, llm, hybrid_retrievers
174