justmotes commited on
Commit
178d05b
·
1 Parent(s): bd7d6a3

Fix: Use MiniLM-L6-v2 to match Qdrant vector dimension (384)

Browse files
Files changed (1) hide show
  1. app.py +2 -1
app.py CHANGED
@@ -11,6 +11,7 @@ from src.data_pipeline import get_embedding
11
  COLLECTION_NAME = "dashVector_v1"
12
  VECTOR_SIZE = 384 # MiniLM-L6-v2
13
  NUM_CLUSTERS = 32
 
14
 
15
  # --- Initialize Backend ---
16
  # We initialize once at startup
@@ -251,7 +252,7 @@ def run_benchmark(query):
251
 
252
  # Generate Embedding
253
  print("DEBUG: Generating embedding...")
254
- query_vec = get_embedding(query)
255
  print("DEBUG: Embedding generated.")
256
 
257
  # Router Prediction
 
11
  COLLECTION_NAME = "dashVector_v1"
12
  VECTOR_SIZE = 384 # MiniLM-L6-v2
13
  NUM_CLUSTERS = 32
14
+ EMBEDDING_MODEL = "sentence-transformers/all-MiniLM-L6-v2"
15
 
16
  # --- Initialize Backend ---
17
  # We initialize once at startup
 
252
 
253
  # Generate Embedding
254
  print("DEBUG: Generating embedding...")
255
+ query_vec = get_embedding(query, model_name=EMBEDDING_MODEL)
256
  print("DEBUG: Embedding generated.")
257
 
258
  # Router Prediction