minh-4T committed on
Commit
a802c71
·
verified ·
1 Parent(s): 1eda9e4

Update core/config.py

Browse files
Files changed (1) hide show
  1. core/config.py +21 -11
core/config.py CHANGED
@@ -9,17 +9,27 @@ try:
9
  except Exception:
10
  pass
11
 
12
- # Read configuration from environment (safe for production). Defaults provided for convenience.
13
- GROQ_API_KEY = os.getenv('GROQ_API_KEY')
14
- LLM_MODEL = os.getenv('LLM_MODEL', 'llama-3.1-8b-instant')
15
- EMBED_MODEL = os.getenv('EMBED_MODEL', 'sentence-transformers/all-MiniLM-L6-v2')
16
- CROSS_ENCODER_MODEL = os.getenv('CROSS_ENCODER_MODEL', 'cross-encoder/ms-marco-MiniLM-L-6-v2')
17
- DATA_DIR = os.getenv('DATA_DIR', 'data')
18
- VECTOR_DIR = os.getenv('VECTOR_DIR', 'vectorstore')
19
- CHUNK_SIZE = int(os.getenv('CHUNK_SIZE', '1500'))
20
- CHUNK_OVERLAP = int(os.getenv('CHUNK_OVERLAP', '300'))
21
- TOP_K_RESULTS = int(os.getenv('TOP_K_RESULTS', '10'))
 
 
 
22
  FINAL_TOP_K = int(os.getenv('FINAL_TOP_K', '5'))
 
 
23
  QDRANT_URL = os.getenv('QDRANT_URL')
24
  QDRANT_API_KEY = os.getenv('QDRANT_API_KEY')
25
- DATABASE_URL = os.getenv('DATABASE_URL', 'sqlite:///chat_history.db')
 
 
 
 
 
 
9
  except Exception:
10
  pass
11
 
12
+ GROQ_API_KEYS = os.getenv('GROQ_API_KEYS', os.getenv('GROQ_API_KEY', ''))
13
+ GEMINI_API_KEYS = os.getenv('GEMINI_API_KEYS', '')
14
+
15
+ # Model names
16
+ LLM_MODEL = os.getenv('LLM_MODEL', 'llama-3.1-70b-versatile')
17
+ FAST_LLM_MODEL = os.getenv('FAST_LLM_MODEL', 'llama-3.1-8b-instant')
18
+ EMBED_MODEL = os.getenv('EMBED_MODEL', 'BAAI/bge-m3')
19
+ CROSS_ENCODER_MODEL = os.getenv('CROSS_ENCODER_MODEL', 'BAAI/bge-reranker-base')
20
+
21
+ # Chunking and retrieval settings
22
+ CHUNK_SIZE = int(os.getenv('CHUNK_SIZE', '800'))
23
+ CHUNK_OVERLAP = int(os.getenv('CHUNK_OVERLAP', '150'))
24
+ TOP_K_RESULTS = int(os.getenv('TOP_K_RESULTS', '15'))
25
  FINAL_TOP_K = int(os.getenv('FINAL_TOP_K', '5'))
26
+
27
+ # External service configs
28
  QDRANT_URL = os.getenv('QDRANT_URL')
29
  QDRANT_API_KEY = os.getenv('QDRANT_API_KEY')
30
+ DATABASE_URL = os.getenv('DATABASE_URL')
31
+
32
+ # Context and output limits
33
+ MAX_CONTEXT_CHARS = int(os.getenv('MAX_CONTEXT_CHARS', '12000'))
34
+ MAX_OUT_CHARS = int(os.getenv('MAX_OUT_CHARS', '3000'))
35
+ MAX_HISTORY_MESSAGES = int(os.getenv('MAX_HISTORY_MESSAGES', '20'))