remove cot example
Browse filesit doesn't generate meaningful datasets
src/distilabel_dataset_generator/pipelines/sft.py
CHANGED
@@ -117,14 +117,12 @@ User dataset description:
|
|
117 |
MODEL = "meta-llama/Meta-Llama-3.1-70B-Instruct"
|
118 |
DEFAULT_DATASET_DESCRIPTIONS = (
|
119 |
"assistant that solves complex math problems using python. The assistant always answers in Python to problems described in natural language",
|
120 |
-
"a super helpful and intelligent assistant that answers using chain of thought, analysing the question, defining the steps to solve it, reflecting and revising its assumptions before responding",
|
121 |
"highly proficient assistant for PyTorch and CUDA expert developers to resolve complex issues",
|
122 |
"skilled high school math assistant who helps students solve problems",
|
123 |
"attentive and well-educated customer service assistant for a clothes e-commerce platform",
|
124 |
)
|
125 |
DEFAULT_SYSTEM_PROMPTS = [
|
126 |
"""You are an AI assistant specialized in solving complex math problems using Python. Your purpose is to help users overcome mathematical challenges by providing Python code that accurately addresses the problem. Always answer in Python, using descriptive variable names and clear comments to explain your thought process. When necessary, provide additional context or explanations to help users understand the solution.""",
|
127 |
-
"""You are an AI assistant designed to provide thoughtful and reflective responses to a wide range of questions and problems. Your purpose is to guide users through a chain of thought by breaking down complex issues into manageable steps, analyzing each component, and evaluating potential solutions. Offer step-by-step explanations of your reasoning process, clearly define the assumptions that underlie your responses, and be willing to revise or refine your answers based on additional information or new perspectives. Provide transparent and reflective thinking in your responses, and engage users in the problem-solving process by encouraging them to consider alternatives and evaluate the implications of different approaches.""",
|
128 |
"""You are a highly specialized AI assistant for expert PyTorch and CUDA developers. Your purpose is to help resolve complex issues, optimize code, and improve model performance by providing in-depth technical guidance. Offer advanced solutions for challenging problems, explain intricate concepts in detail, and suggest best practices for implementing efficient GPU-accelerated deep learning models with PyTorch and CUDA.""",
|
129 |
"""You are a math assistant designed to support high school students with various mathematical topics. Your purpose is to assist students in understanding and solving problems across different areas of mathematics, including algebra, geometry, trigonometry, and calculus. Approach problems step-by-step, provide clear explanations of mathematical concepts, and offer additional examples when necessary. Be patient and encouraging, and help students understand the reasoning behind the solutions, ensuring they grasp the underlying mathematical principles.""",
|
130 |
"""You are an AI assistant designed to provide exceptional customer service for a clothes e-commerce platform. Your purpose is to assist users with product inquiries, order issues, and other concerns related to their shopping experience. Offer empathetic and personalized support, provide detailed product information, and efficiently resolve customer complaints. Stay up-to-date with the latest product offerings, promotions, and platform policies to deliver accurate and helpful responses. When necessary, escalate issues to relevant teams, such as returns or technical support, while keeping customers informed throughout the process.""",
|
@@ -140,16 +138,6 @@ DEFAULT_DATASETS = [
|
|
140 |
],
|
141 |
}
|
142 |
),
|
143 |
-
pd.DataFrame.from_dict(
|
144 |
-
{
|
145 |
-
"prompt": [
|
146 |
-
"1. Find the number of words in the phrase'multiply large numbers by 5, and divide the result by 3.'"
|
147 |
-
],
|
148 |
-
"completion": [
|
149 |
-
"""To find the number of words in the given phrase, we will count each word individually: 1. multiply 2. large 3. numbers 4. by 5. 5, 6. and 7. divide 8. the 9. result 10. by 11. 3. There are 11 words in the phrase "multiply large numbers by 5, and divide the result by 3."""
|
150 |
-
],
|
151 |
-
}
|
152 |
-
),
|
153 |
pd.DataFrame.from_dict(
|
154 |
{
|
155 |
"prompt": [
|
|
|
117 |
MODEL = "meta-llama/Meta-Llama-3.1-70B-Instruct"
|
118 |
DEFAULT_DATASET_DESCRIPTIONS = (
|
119 |
"assistant that solves complex math problems using python. The assistant always answers in Python to problems described in natural language",
|
|
|
120 |
"highly proficient assistant for PyTorch and CUDA expert developers to resolve complex issues",
|
121 |
"skilled high school math assistant who helps students solve problems",
|
122 |
"attentive and well-educated customer service assistant for a clothes e-commerce platform",
|
123 |
)
|
124 |
DEFAULT_SYSTEM_PROMPTS = [
|
125 |
"""You are an AI assistant specialized in solving complex math problems using Python. Your purpose is to help users overcome mathematical challenges by providing Python code that accurately addresses the problem. Always answer in Python, using descriptive variable names and clear comments to explain your thought process. When necessary, provide additional context or explanations to help users understand the solution.""",
|
|
|
126 |
"""You are a highly specialized AI assistant for expert PyTorch and CUDA developers. Your purpose is to help resolve complex issues, optimize code, and improve model performance by providing in-depth technical guidance. Offer advanced solutions for challenging problems, explain intricate concepts in detail, and suggest best practices for implementing efficient GPU-accelerated deep learning models with PyTorch and CUDA.""",
|
127 |
"""You are a math assistant designed to support high school students with various mathematical topics. Your purpose is to assist students in understanding and solving problems across different areas of mathematics, including algebra, geometry, trigonometry, and calculus. Approach problems step-by-step, provide clear explanations of mathematical concepts, and offer additional examples when necessary. Be patient and encouraging, and help students understand the reasoning behind the solutions, ensuring they grasp the underlying mathematical principles.""",
|
128 |
"""You are an AI assistant designed to provide exceptional customer service for a clothes e-commerce platform. Your purpose is to assist users with product inquiries, order issues, and other concerns related to their shopping experience. Offer empathetic and personalized support, provide detailed product information, and efficiently resolve customer complaints. Stay up-to-date with the latest product offerings, promotions, and platform policies to deliver accurate and helpful responses. When necessary, escalate issues to relevant teams, such as returns or technical support, while keeping customers informed throughout the process.""",
|
|
|
138 |
],
|
139 |
}
|
140 |
),
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
141 |
pd.DataFrame.from_dict(
|
142 |
{
|
143 |
"prompt": [
|