Change `use_cache` to False
Browse files
So users can regenerate the sample iteratively and see what the full dataset could look like (that's why we were using do_sample too).
src/distilabel_dataset_generator/apps/sft.py
CHANGED
@@ -26,7 +26,7 @@ from src.distilabel_dataset_generator.utils import (
|
|
26 |
|
27 |
def _run_pipeline(result_queue, num_turns, num_rows, system_prompt, is_sample):
|
28 |
pipeline = get_pipeline(num_turns, num_rows, system_prompt, is_sample)
|
29 |
-
distiset: Distiset = pipeline.run(use_cache=
|
30 |
result_queue.put(distiset)
|
31 |
|
32 |
|
|
|
26 |
|
27 |
def _run_pipeline(result_queue, num_turns, num_rows, system_prompt, is_sample):
|
28 |
pipeline = get_pipeline(num_turns, num_rows, system_prompt, is_sample)
|
29 |
+
distiset: Distiset = pipeline.run(use_cache=False)
|
30 |
result_queue.put(distiset)
|
31 |
|
32 |
|