---
# ------------------------------------------------------------------
# RAG CBT QUESTION-ANSWERING SYSTEM CONFIGURATION
# ------------------------------------------------------------------

project:
  name: "cbt-rag-system"
  category: "psychology"
  # NOTE(review): assumed to belong to `project`; confirm against the loader.
  doc_limit: null  # Load all pages from the book

processing:
  # Embedding model used for both vector db and evaluator similarity
  embedding_model: "jinaai/jina-embeddings-v2-small-en"
  # Options: sentence, recursive, semantic, fixed
  technique: "recursive"
  # Jina supports 8192 tokens (~32k chars); using 1000 chars for better context
  chunk_size: 1000
  chunk_overlap: 100

vector_db:
  base_index_name: "cbt-book"
  dimension: 512  # Jina outputs 512 dimensions; must match embedding_model
  metric: "cosine"
  batch_size: 50  # Reduced batch size for CPU processing

retrieval:
  # Options: hybrid, semantic, bm25
  mode: "hybrid"
  # Options: cross-encoder, rrf
  rerank_strategy: "cross-encoder"
  use_mmr: false
  top_k: 50
  final_k: 4

generation:
  temperature: 0.0
  max_new_tokens: 1500
  # NOTE(review): `judge_model` and `models` are assumed to be nested under
  # `generation`; move them to the top level if the loader reads them there.
  # The model used to judge the others (OpenRouter)
  judge_model: "deepseek/deepseek-v3.2"
  # List of contestants in the tournament
  models:
    - "TinyAya"
    - "Llama-3-8B"
    - "Qwen-3.5-9B"
    - "Mistral-7B"