Rahul-Samedavar committed on
Commit
74e17dc
·
1 Parent(s): ade6079

final, all set

Browse files
Files changed (1) hide show
  1. config/config.py +4 -5
config/config.py CHANGED
@@ -20,10 +20,9 @@ BEARER_TOKEN = os.getenv("BEARER_TOKEN")
20
  CHUNK_SIZE = 400 * 4
21
  CHUNK_OVERLAP = 100 * 4
22
 
23
- # Retrieval Settings
24
- TOP_K = 9
25
  SCORE_THRESHOLD = 0.3
26
- RERANK_TOP_K = 7 # 9*400 = 3600, < 4000, some tokens reserved for questions
27
  BM25_WEIGHT = 0.3
28
  SEMANTIC_WEIGHT = 0.7
29
 
@@ -38,8 +37,8 @@ MAX_CONTEXT_LENGTH = 4000*4
38
 
39
  USE_TOTAL_BUDGET_APPROACH = True
40
 
41
- EMBEDDING_MODEL = "all-MiniLM-L6-v2"
42
- BATCH_SIZE = 4
43
 
44
  OUTPUT_DIR = os.getenv("RAG_EMBEDDINGS_PATH", "./RAG/rag_embeddings")
45
 
 
20
  CHUNK_SIZE = 400 * 4
21
  CHUNK_OVERLAP = 100 * 4
22
 
23
+ TOP_K = 12
 
24
  SCORE_THRESHOLD = 0.3
25
+ RERANK_TOP_K = 9
26
  BM25_WEIGHT = 0.3
27
  SEMANTIC_WEIGHT = 0.7
28
 
 
37
 
38
  USE_TOTAL_BUDGET_APPROACH = True
39
 
40
+ EMBEDDING_MODEL ="BAAI/bge-large-en"
41
+ BATCH_SIZE = 8
42
 
43
  OUTPUT_DIR = os.getenv("RAG_EMBEDDINGS_PATH", "./RAG/rag_embeddings")
44