akryldigital committed on
Commit
ff8da5f
·
verified ·
1 Parent(s): aadfbb0

update configs (model routing)

Browse files
src/config/filter_options.json CHANGED
The diff for this file is too large to render. See raw diff
 
src/config/settings.yaml CHANGED
@@ -7,7 +7,7 @@ qdrant:
7
  # url: "https://2c6d0136-b6ca-4400-bac5-1703f58abc43.europe-west3-0.gcp.cloud.qdrant.io"
8
  # Current cluster with BAAI-bge-m3 and colSmol-500M-v2 collections:
9
  url: "${QDRANT_URL}" # Load from environment variable (should be the us-west-1 cluster)
10
- collection_name: "BAAI-bge-m3" # Text-based RAG collection (41175 points)
11
  prefer_grpc: true
12
  api_key: "${QDRANT_API_KEY}" # Load from environment variable
13
 
@@ -57,6 +57,17 @@ reader:
57
  OPENAI:
58
  model: "gpt-4o-mini"
59
 
 
 
 
 
 
 
 
 
 
 
 
60
  OLLAMA:
61
  model: "mistral-small3.1:24b-instruct-2503-q8_0"
62
  base_url: "http://10.1.4.192:11434/"
 
7
  # url: "https://2c6d0136-b6ca-4400-bac5-1703f58abc43.europe-west3-0.gcp.cloud.qdrant.io"
8
  # Current cluster with BAAI-bge-m3 and colSmol-500M-v2 collections:
9
  url: "${QDRANT_URL}" # Load from environment variable (should be the us-west-1 cluster)
10
+ collection_name: "BAAI-bge-m3-full" # Full text-based RAG collection
11
  prefer_grpc: true
12
  api_key: "${QDRANT_API_KEY}" # Load from environment variable
13
 
 
57
  OPENAI:
58
  model: "gpt-4o-mini"
59
 
60
+ OPENAI_STRONG:
61
+ model: "gpt-4.1"
62
+ temperature: 0.2
63
+
64
+ # Optional: dedicated model for final response generation.
65
+ # Uncomment and set to gpt-5 or similar when ready for highest-quality answers.
66
+ # Falls back to OPENAI_STRONG if not set.
67
+ # OPENAI_RESPONSE:
68
+ # model: "gpt-4.1"
69
+ # temperature: 0.3
70
+
71
  OLLAMA:
72
  model: "mistral-small3.1:24b-instruct-2503-q8_0"
73
  base_url: "http://10.1.4.192:11434/"