Change use cache to False
Browse files
So users can regenerate the sample iteratively and see what the full dataset could look like (that's why we were using do_sample too).
src/distilabel_dataset_generator/apps/sft.py
CHANGED
|
@@ -26,7 +26,7 @@ from src.distilabel_dataset_generator.utils import (
|
|
| 26 |
|
| 27 |
def _run_pipeline(result_queue, num_turns, num_rows, system_prompt, is_sample):
|
| 28 |
pipeline = get_pipeline(num_turns, num_rows, system_prompt, is_sample)
|
| 29 |
-
distiset: Distiset = pipeline.run(use_cache=
|
| 30 |
result_queue.put(distiset)
|
| 31 |
|
| 32 |
|
|
|
|
| 26 |
|
| 27 |
def _run_pipeline(result_queue, num_turns, num_rows, system_prompt, is_sample):
|
| 28 |
pipeline = get_pipeline(num_turns, num_rows, system_prompt, is_sample)
|
| 29 |
+
distiset: Distiset = pipeline.run(use_cache=False)
|
| 30 |
result_queue.put(distiset)
|
| 31 |
|
| 32 |
|