"""training_config.py: Hugging Face ``TrainingArguments`` for the training run.

Importing this module builds ``training_args`` at module level so that other
code can pass it to a trainer.
"""

from transformers import TrainingArguments

training_args = TrainingArguments(
    # --- Output locations -------------------------------------------------
    output_dir="./results",
    logging_dir="./logs",
    # --- Schedule and optimisation ----------------------------------------
    num_train_epochs=3,
    learning_rate=5e-5,
    warmup_steps=500,
    weight_decay=0.01,
    # --- Batch sizes ------------------------------------------------------
    per_device_train_batch_size=8,  # Optimized for T4 GPU
    per_device_eval_batch_size=8,
    # --- Logging, evaluation and checkpointing ----------------------------
    logging_steps=50,
    # Evaluation and checkpointing use the same strategy and the same
    # 500-step interval; keep them aligned, since `load_best_model_at_end`
    # picks the best model from the saved checkpoints.
    # NOTE(review): newer transformers releases rename `evaluation_strategy`
    # to `eval_strategy` -- confirm against the pinned library version.
    evaluation_strategy="steps",
    eval_steps=500,
    save_strategy="steps",
    save_steps=500,
    save_total_limit=3,
    load_best_model_at_end=True,
    # --- Memory / throughput ----------------------------------------------
    # NOTE(review): fp16 presumably requires a GPU at runtime -- confirm this
    # config is never instantiated on a CPU-only host.
    fp16=True,  # Using GPU features
    gradient_checkpointing=True,
)