slenk committed on
Commit
e4c5427
·
verified ·
1 Parent(s): bbf1f84

Upload src/codewraith/app/retriever.py with huggingface_hub

Browse files
Files changed (1) hide show
  1. src/codewraith/app/retriever.py +2 -2
src/codewraith/app/retriever.py CHANGED
@@ -68,7 +68,7 @@ class SpecRetriever:
68
 
69
  def build_index(
70
  self,
71
- dataset_path: str = "data/training_pairs_clean.jsonl",
72
  batch_size: int = 50,
73
  ) -> int:
74
  """Build the vector index from training pairs.
@@ -196,7 +196,7 @@ class SpecRetriever:
196
  return "".join(parts)
197
 
198
 
199
- def build_index(dataset_path: str = "data/training_pairs_clean.jsonl") -> None:
200
  """CLI entry point for building the vector index."""
201
  retriever = SpecRetriever()
202
  retriever.build_index(dataset_path)
 
68
 
69
  def build_index(
70
  self,
71
+ dataset_path: str = "data/training_pairs_v7_clean.jsonl",
72
  batch_size: int = 50,
73
  ) -> int:
74
  """Build the vector index from training pairs.
 
196
  return "".join(parts)
197
 
198
 
199
+ def build_index(dataset_path: str = "data/training_pairs_v7_clean.jsonl") -> None:
200
  """CLI entry point for building the vector index."""
201
  retriever = SpecRetriever()
202
  retriever.build_index(dataset_path)