File size: 406 Bytes
1715fb7
 
4ed3f0a
e8fa82e
1715fb7
 
4ed3f0a
 
1715fb7
4ed3f0a
e8fa82e
4ed3f0a
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
import os

# Module-level settings. Every value below is a plain constant except
# HF_TOKEN, which is read from the process environment at import time.

# --- Filesystem layout ---
# Root directory from which the two derived paths below are built.
BASE_DIR = "/app"
# Both directories sit directly under BASE_DIR.
# NOTE(review): presumably the knowledge-base documents folder and the
# Chroma vector-store folder, judging by the names -- confirm with the callers.
KB_DIR = os.path.join(BASE_DIR, "kb")
CHROMA_DIR = os.path.join(BASE_DIR, "chroma_db")

# --- Hugging Face access ---
# Repo identifier; make sure this points to your NEW docx repo.
HF_DATASET_REPO = "Zubaish/gandhi-kb-docx"
# Value of the HF_TOKEN environment variable, or None when it is not set.
HF_TOKEN = os.environ.get("HF_TOKEN")

# --- Model selection ---
EMBEDDING_MODEL = "sentence-transformers/all-MiniLM-L6-v2"
LLM_TASK = "text-generation"
LLM_MODEL = "Qwen/Qwen2.5-1.5B-Instruct"

# --- Text chunking ---
# NOTE(review): the unit (characters vs. tokens) depends on whichever
# splitter consumes these values -- confirm at the call site.
CHUNK_OVERLAP = 100
CHUNK_SIZE = 1000