Spaces:
Running
Running
update configs (model routing)
Browse files
- src/config/filter_options.json +0 -0
- src/config/settings.yaml +12 -1
src/config/filter_options.json
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
src/config/settings.yaml
CHANGED
|
@@ -7,7 +7,7 @@ qdrant:
|
|
| 7 |
# url: "https://2c6d0136-b6ca-4400-bac5-1703f58abc43.europe-west3-0.gcp.cloud.qdrant.io"
|
| 8 |
# Current cluster with BAAI-bge-m3 and colSmol-500M-v2 collections:
|
| 9 |
url: "${QDRANT_URL}" # Load from environment variable (should be the us-west-1 cluster)
|
| 10 |
-
collection_name: "BAAI-bge-m3" #
|
| 11 |
prefer_grpc: true
|
| 12 |
api_key: "${QDRANT_API_KEY}" # Load from environment variable
|
| 13 |
|
|
@@ -57,6 +57,17 @@ reader:
|
|
| 57 |
OPENAI:
|
| 58 |
model: "gpt-4o-mini"
|
| 59 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 60 |
OLLAMA:
|
| 61 |
model: "mistral-small3.1:24b-instruct-2503-q8_0"
|
| 62 |
base_url: "http://10.1.4.192:11434/"
|
|
|
|
| 7 |
# url: "https://2c6d0136-b6ca-4400-bac5-1703f58abc43.europe-west3-0.gcp.cloud.qdrant.io"
|
| 8 |
# Current cluster with BAAI-bge-m3 and colSmol-500M-v2 collections:
|
| 9 |
url: "${QDRANT_URL}" # Load from environment variable (should be the us-west-1 cluster)
|
| 10 |
+
collection_name: "BAAI-bge-m3-full" # Full text-based RAG collection
|
| 11 |
prefer_grpc: true
|
| 12 |
api_key: "${QDRANT_API_KEY}" # Load from environment variable
|
| 13 |
|
|
|
|
| 57 |
OPENAI:
|
| 58 |
model: "gpt-4o-mini"
|
| 59 |
|
| 60 |
+
OPENAI_STRONG:
|
| 61 |
+
model: "gpt-4.1"
|
| 62 |
+
temperature: 0.2
|
| 63 |
+
|
| 64 |
+
# Optional: dedicated model for final response generation.
|
| 65 |
+
# Uncomment and set to gpt-5 or similar when ready for highest-quality answers.
|
| 66 |
+
# Falls back to OPENAI_STRONG if not set.
|
| 67 |
+
# OPENAI_RESPONSE:
|
| 68 |
+
# model: "gpt-4.1"
|
| 69 |
+
# temperature: 0.3
|
| 70 |
+
|
| 71 |
OLLAMA:
|
| 72 |
model: "mistral-small3.1:24b-instruct-2503-q8_0"
|
| 73 |
base_url: "http://10.1.4.192:11434/"
|