Spaces:
Sleeping
Sleeping
Fix: Use MiniLM-L6-v2 to match Qdrant vector dimension (384)
Browse files
app.py
CHANGED
|
@@ -11,6 +11,7 @@ from src.data_pipeline import get_embedding
|
|
| 11 |
COLLECTION_NAME = "dashVector_v1"
|
| 12 |
VECTOR_SIZE = 384 # MiniLM-L6-v2
|
| 13 |
NUM_CLUSTERS = 32
|
|
|
|
| 14 |
|
| 15 |
# --- Initialize Backend ---
|
| 16 |
# We initialize once at startup
|
|
@@ -251,7 +252,7 @@ def run_benchmark(query):
|
|
| 251 |
|
| 252 |
# Generate Embedding
|
| 253 |
print("DEBUG: Generating embedding...")
|
| 254 |
-
query_vec = get_embedding(query)
|
| 255 |
print("DEBUG: Embedding generated.")
|
| 256 |
|
| 257 |
# Router Prediction
|
|
|
|
| 11 |
COLLECTION_NAME = "dashVector_v1"
|
| 12 |
VECTOR_SIZE = 384 # MiniLM-L6-v2
|
| 13 |
NUM_CLUSTERS = 32
|
| 14 |
+
EMBEDDING_MODEL = "sentence-transformers/all-MiniLM-L6-v2"
|
| 15 |
|
| 16 |
# --- Initialize Backend ---
|
| 17 |
# We initialize once at startup
|
|
|
|
| 252 |
|
| 253 |
# Generate Embedding
|
| 254 |
print("DEBUG: Generating embedding...")
|
| 255 |
+
query_vec = get_embedding(query, model_name=EMBEDDING_MODEL)
|
| 256 |
print("DEBUG: Embedding generated.")
|
| 257 |
|
| 258 |
# Router Prediction
|