Spaces:
Sleeping
Sleeping
Update finetune_flan_t5.py
Browse files- finetune_flan_t5.py +9 -4
finetune_flan_t5.py
CHANGED
@@ -55,14 +55,19 @@ training_args = TrainingArguments(
|
|
55 |
# Define data collator
|
56 |
data_collator = DataCollatorForSeq2Seq(tokenizer, model=model)
|
57 |
|
58 |
-
|
|
|
|
|
59 |
trainer = SFTTrainer(
|
60 |
model=model,
|
61 |
-
args=training_args,
|
62 |
-
train_dataset=tokenized_dataset,
|
63 |
tokenizer=tokenizer,
|
64 |
-
|
|
|
|
|
|
|
|
|
65 |
)
|
66 |
|
|
|
67 |
# Start training
|
68 |
trainer.train()
|
|
|
55 |
# Define data collator
|
56 |
data_collator = DataCollatorForSeq2Seq(tokenizer, model=model)
|
57 |
|
58 |
+
def formatting_func(example):
    """Render dataset rows as two-line "Input: ... / Output: ..." prompt text.

    Handles both call shapes a dataset ``map`` can use:

    * a single row, where ``example['input']`` and ``example['output']`` are
      scalars, and
    * a batch in column layout, where both are lists (or tuples) holding one
      entry per row.

    NOTE(review): whether the trainer calls this per row or per batch depends
    on the installed TRL version -- confirm against the pinned release.

    Args:
        example: Mapping with ``'input'`` and ``'output'`` keys.

    Returns:
        One formatted string for a single row, or a list with one formatted
        string per row for a batch.
    """
    inputs, outputs = example['input'], example['output']
    # Batched call: formatting the columns directly would embed the Python
    # list repr in a single string instead of producing one prompt per row.
    if isinstance(inputs, (list, tuple)):
        return [f"Input: {src}\nOutput: {tgt}" for src, tgt in zip(inputs, outputs)]
    return f"Input: {inputs}\nOutput: {outputs}"
|
60 |
+
|
61 |
# Build the supervised fine-tuning trainer.
# NOTE(review): the dataset passed here is named `tokenized_dataset` while a
# text `formatting_func` is also supplied -- confirm the trainer is meant to
# format/tokenize raw rows rather than consume pre-tokenized features.
trainer = SFTTrainer(
    model=model,
    tokenizer=tokenizer,
    train_dataset=tokenized_dataset,
    args=training_args,
    # Reuse the collator already defined above (built with model=model)
    # instead of constructing a second one inline and leaving it unused.
    data_collator=data_collator,
    formatting_func=formatting_func,
    packing=False,
)

# Start training
trainer.train()
|