NeonSamurai committed on
Commit
bc6018a
·
verified ·
1 Parent(s): 80ebbd6

Update rag.py

Browse files
Files changed (1) hide show
  1. rag.py +19 -7
rag.py CHANGED
@@ -16,11 +16,19 @@ from llama_index.core.agent import ReActAgent
16
  from chromadb import PersistentClient
17
 
18
  # writable cache directories
19
- os.environ["TRANSFORMERS_CACHE"] = "/app/.cache"
20
- os.environ["HF_HOME"] = "/app/.cache"
21
- os.environ["XDG_CACHE_HOME"] = "/app/.cache" # Some libs use this
 
22
 
23
- os.makedirs("/app/.cache", exist_ok=True)
 
 
 
 
 
 
 
24
 
25
  @st.cache_resource
26
  def setup_rag_system(debug=False):
@@ -40,7 +48,11 @@ def setup_rag_system(debug=False):
40
  )
41
 
42
  # Embeddings
43
- embedding_model = HuggingFaceEmbedding(model_name="sentence-transformers/all-MiniLM-L6-v2")
 
 
 
 
44
 
45
  # Persisted vector DBs
46
  persist_dirs = [
@@ -80,7 +92,7 @@ def setup_rag_system(debug=False):
80
  hybrid_retriever = RecursiveRetriever(
81
  "vector",
82
  retriever_dict={"vector": vector_retriever, "bm25": bm25_retriever},
83
- verbose=True
84
  )
85
  hybrid_retrievers.append(hybrid_retriever)
86
 
@@ -166,7 +178,7 @@ def setup_rag_system(debug=False):
166
  agent = ReActAgent(
167
  tools=retriever_tools,
168
  llm=llm,
169
- verbose=True,
170
  max_iterations=20,
171
  system_prompt=system_prompt
172
  )
 
16
  from chromadb import PersistentClient
17
 
18
  # writable cache directories
19
+ CACHE_DIR = "/app/.cache"
20
+ HUGGINGFACE_CACHE = os.path.join(CACHE_DIR, "huggingface")
21
+ VECTORDb_DIR = "/app/vectordb"
22
+ STREAMLIT_CONFIG = "/app/.streamlit"
23
 
24
+ os.makedirs(HUGGINGFACE_CACHE, exist_ok=True)
25
+ os.makedirs(VECTORDb_DIR, exist_ok=True)
26
+ os.makedirs(STREAMLIT_CONFIG, exist_ok=True)
27
+
28
+ os.environ["TRANSFORMERS_CACHE"] = CACHE_DIR
29
+ os.environ["HF_HOME"] = CACHE_DIR
30
+ os.environ["XDG_CACHE_HOME"] = CACHE_DIR
31
+ os.environ["STREAMLIT_HOME"] = STREAMLIT_CONFIG
32
 
33
  @st.cache_resource
34
  def setup_rag_system(debug=False):
 
48
  )
49
 
50
  # Embeddings
51
+ embedding_model = HuggingFaceEmbedding(
52
+ model_name="sentence-transformers/all-MiniLM-L6-v2",
53
+ cache_folder=HUGGINGFACE_CACHE
54
+ )
55
+
56
 
57
  # Persisted vector DBs
58
  persist_dirs = [
 
92
  hybrid_retriever = RecursiveRetriever(
93
  "vector",
94
  retriever_dict={"vector": vector_retriever, "bm25": bm25_retriever},
95
+ verbose=False
96
  )
97
  hybrid_retrievers.append(hybrid_retriever)
98
 
 
178
  agent = ReActAgent(
179
  tools=retriever_tools,
180
  llm=llm,
181
+ verbose=False,
182
  max_iterations=20,
183
  system_prompt=system_prompt
184
  )