File size: 887 Bytes
bb04c5f
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
# Directories to watch and index
watch_paths:
  - './data/scifact'
  - './data/nfcorpus'  # modify this path as needed

# Only files whose extension appears in this list are included
include_extensions:
  # documents
  - '.pdf'
  - '.docx'
  - '.txt'
  - '.md'
  - '.pptx'
  - '.xlsx'
  # source code and notebooks
  - '.py'
  - '.js'
  - '.ipynb'


# Retrieval settings
top_k: 5         # number of final results returned to the user
candidate_k: 20  # number of candidates fetched before reranking

# Query expansion with WordNet synonyms
query_expansion: true
max_synonyms: 5  # maximum number of synonyms to append

# Cross-encoder reranking
reranking_enabled: true
reranker_model: 'cross-encoder/ms-marco-MiniLM-L-6-v2'

# Directory names that are skipped
skip_directories:
  - '.git'
  - 'node_modules'
  - '__pycache__'
  - '.venv'

# Location where index data is stored.
# NOTE(review): every watch_paths entry currently sits under this directory;
# confirm the indexer does not pick up its own index files.
data_dir: './data'

# Name of the embedding model.
# NOTE(review): presumably a sentence-transformers id; confirm in the loader.
embedding_model: 'all-MiniLM-L6-v2'
# Alternative model, currently disabled:
# embedding_model: BAAI/bge-small-en-v1.5

# Debounce interval, in seconds.
# NOTE(review): presumably the wait after a file change before acting; confirm.
debounce_seconds: 5