Update README.md
Browse files
README.md
CHANGED
@@ -21,6 +21,8 @@ This is a PEFT version of google/flan-t5-large trained using LoRA with the Edinb
|
|
21 |
- NUM_EPOCHS = 8
|
22 |
- LEARNING_RATE = 2e-6
|
23 |
- BATCH_SIZE = 8
|
|
|
|
|
24 |
- GRAD_ACC_STEPS = 8
|
25 |
- WARMUP_STEPS = 100
|
26 |
- RANK = 16
|
|
|
21 |
- NUM_EPOCHS = 8
|
22 |
- LEARNING_RATE = 2e-6
|
23 |
- BATCH_SIZE = 8
|
24 |
+
- OPTIMIZER = AdamW with betas=(0.9, 0.999), eps=1e-8, weight_decay=0.01
|
25 |
+
- SCHEDULER = Cosine
|
26 |
- GRAD_ACC_STEPS = 8
|
27 |
- WARMUP_STEPS = 100
|
28 |
- RANK = 16
|