# flan-t5-custom-handler / training_config.py
# MjolnirThor's picture
# Create training_config.py
# 167d5e2 verified
# raw
# history blame
# 568 Bytes
import inspect

from transformers import TrainingArguments
# The evaluation-schedule keyword was renamed from `evaluation_strategy` to
# `eval_strategy` in newer transformers releases, and the old spelling is
# rejected with a TypeError once it is removed. Pick whichever keyword the
# installed TrainingArguments actually accepts so this config loads on both
# older and newer versions.
_eval_strategy_kwarg = (
    "eval_strategy"
    if "eval_strategy" in inspect.signature(TrainingArguments).parameters
    else "evaluation_strategy"
)

# Hyperparameters for the fine-tuning run. Evaluation and checkpointing are
# both step-based and share the same 500-step cadence.
training_args = TrainingArguments(
    # Where checkpoints and logs are written.
    output_dir="./results",
    logging_dir="./logs",
    logging_steps=50,
    # Schedule and batch sizes.
    num_train_epochs=3,
    per_device_train_batch_size=8,  # Optimized for T4 GPU
    per_device_eval_batch_size=8,
    # Optimizer settings.
    learning_rate=5e-5,
    warmup_steps=500,
    weight_decay=0.01,
    # Checkpointing / evaluation. `load_best_model_at_end` needs the save and
    # eval strategies to match and `save_steps` to be a multiple of
    # `eval_steps` (see the TrainingArguments docs); keep them in sync when
    # changing either value.
    save_strategy="steps",
    save_steps=500,
    eval_steps=500,
    save_total_limit=3,
    load_best_model_at_end=True,
    # Memory / speed trade-offs.
    # NOTE(review): T5-family checkpoints have been reported to produce
    # NaN/inf losses under fp16 - confirm the loss stays finite for this model.
    fp16=True,  # Using GPU features
    gradient_checkpointing=True,
    **{_eval_strategy_kwarg: "steps"},
)