Spaces:
Sleeping
Sleeping
Upload src/codewraith/app/retriever.py with huggingface_hub
Browse files
src/codewraith/app/retriever.py
CHANGED
|
@@ -68,7 +68,7 @@ class SpecRetriever:
|
|
| 68 |
|
| 69 |
def build_index(
|
| 70 |
self,
|
| 71 |
-
dataset_path: str = "data/
|
| 72 |
batch_size: int = 50,
|
| 73 |
) -> int:
|
| 74 |
"""Build the vector index from training pairs.
|
|
@@ -196,7 +196,7 @@ class SpecRetriever:
|
|
| 196 |
return "".join(parts)
|
| 197 |
|
| 198 |
|
| 199 |
-
def build_index(dataset_path: str = "data/
|
| 200 |
"""CLI entry point for building the vector index."""
|
| 201 |
retriever = SpecRetriever()
|
| 202 |
retriever.build_index(dataset_path)
|
|
|
|
| 68 |
|
| 69 |
def build_index(
|
| 70 |
self,
|
| 71 |
+
dataset_path: str = "data/training_pairs_v7_clean.jsonl",
|
| 72 |
batch_size: int = 50,
|
| 73 |
) -> int:
|
| 74 |
"""Build the vector index from training pairs.
|
|
|
|
| 196 |
return "".join(parts)
|
| 197 |
|
| 198 |
|
| 199 |
+
def build_index(dataset_path: str = "data/training_pairs_v7_clean.jsonl") -> None:
|
| 200 |
"""CLI entry point for building the vector index."""
|
| 201 |
retriever = SpecRetriever()
|
| 202 |
retriever.build_index(dataset_path)
|