dnj0 committed on
Commit
cffffd0
·
verified ·
1 Parent(s): 7afdcb0

Update src/config.py

Browse files
Files changed (1) hide show
  1. src/config.py +10 -20
src/config.py CHANGED
@@ -1,42 +1,32 @@
1
- """
2
- Configuration file for Multimodal RAG LLM System
3
- """
4
  import os
5
  from pathlib import Path
6
 
7
- # API Configuration
8
  OPENAI_API_KEY = os.getenv("OPENAI_API_KEY", "")
9
- OPENAI_MODEL = "gpt-4o-mini" # Cheaper model variant
10
- USE_CACHE = True # Enable response caching
11
 
12
- # Vector Store Configuration
13
  CHROMA_DB_PATH = "./chroma_db"
14
  DOCSTORE_PATH = "./docstore"
15
  PROCESSED_FILES_LOG = "./processed_files.txt"
16
 
17
- # Embedding Model Configuration
18
  EMBEDDING_MODEL = "sentence-transformers/all-mpnet-base-v2"
19
  EMBEDDING_DIM = 768
20
 
21
- # System Configuration
22
- MAX_CHUNK_SIZE = 500 # Smaller chunks = fewer tokens
23
- CHUNK_OVERLAP = 50 # Less overlap = fewer chunks
24
- TEMPERATURE = 0.3 # Lower = faster, cheaper
25
- MAX_TOKENS = 500 # Limit response size (vs 1500)
26
 
27
- # Language Support
28
  LANGUAGE = "russian"
29
 
30
- # Create necessary directories
31
  Path(CHROMA_DB_PATH).mkdir(exist_ok=True)
32
  Path(DOCSTORE_PATH).mkdir(exist_ok=True)
33
 
34
- # PDF Upload Configuration
35
  UPLOAD_FOLDER = "./uploaded_pdfs"
36
  Path(UPLOAD_FOLDER).mkdir(exist_ok=True)
37
  MAX_PDF_SIZE_MB = 50
38
 
39
- # TOKEN OPTIMIZATION SETTINGS
40
- BATCH_SEARCH_RESULTS = 3 # Return only top 3 (not 5)
41
- CACHE_RESPONSES = True # Cache Q&A responses
42
- SUMMARIZE_FIRST = True # Summarize PDFs once, not per query
 
1
+
 
 
2
  import os
3
  from pathlib import Path
4
 
 
5
  OPENAI_API_KEY = os.getenv("OPENAI_API_KEY", "")
6
+ OPENAI_MODEL = "gpt-4o-mini"
7
+ USE_CACHE = True
8
 
 
9
  CHROMA_DB_PATH = "./chroma_db"
10
  DOCSTORE_PATH = "./docstore"
11
  PROCESSED_FILES_LOG = "./processed_files.txt"
12
 
 
13
  EMBEDDING_MODEL = "sentence-transformers/all-mpnet-base-v2"
14
  EMBEDDING_DIM = 768
15
 
16
+ MAX_CHUNK_SIZE = 500
17
+ CHUNK_OVERLAP = 50
18
+ TEMPERATURE = 0.3
19
+ MAX_TOKENS = 500
 
20
 
 
21
  LANGUAGE = "russian"
22
 
 
23
  Path(CHROMA_DB_PATH).mkdir(exist_ok=True)
24
  Path(DOCSTORE_PATH).mkdir(exist_ok=True)
25
 
 
26
  UPLOAD_FOLDER = "./uploaded_pdfs"
27
  Path(UPLOAD_FOLDER).mkdir(exist_ok=True)
28
  MAX_PDF_SIZE_MB = 50
29
 
30
+ BATCH_SEARCH_RESULTS = 3
31
+ CACHE_RESPONSES = True
32
+ SUMMARIZE_FIRST = True