Spaces:
Sleeping
Sleeping
File size: 887 Bytes
# Directories to index
watch_paths:
  - ./data/scifact
  - ./data/nfcorpus  # modify this

# File extensions to include
include_extensions:
  - ".pdf"
  - ".docx"
  - ".txt"
  - ".md"
  - ".pptx"
  - ".xlsx"
  - ".py"
  - ".js"
  - ".ipynb"

# Retrieval and reranking settings
top_k: 5  # final results returned to user
candidate_k: 20  # candidates fetched before reranking
query_expansion: true  # WordNet synonym expansion
max_synonyms: 5  # max synonyms to append
reranking_enabled: true  # cross-encoder reranking
reranker_model: "cross-encoder/ms-marco-MiniLM-L-6-v2"

# Directories to skip
skip_directories:
  - ".git"
  - "node_modules"
  - "__pycache__"
  - ".venv"

# Where to store index data
data_dir: "./data"

# Embedding model name; an alternative is kept commented out below.
embedding_model: "all-MiniLM-L6-v2"
# embedding_model: BAAI/bge-small-en-v1.5

# Debounce interval in seconds. Must stay a bare integer: any trailing text
# on this line would turn the value into a string.
# NOTE(review): presumably applies to change events under watch_paths;
# confirm against the consuming code.
debounce_seconds: 5