rvindra committed on
Commit
e5bc9ef
·
verified ·
1 Parent(s): c83f11f

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +2 -0
README.md CHANGED
@@ -21,6 +21,8 @@ This is a PEFT version of google/flan-t5-large trained using LoRA with the Edinb
21
  - NUM_EPOCHS = 8
22
  - LEARNING_RATE = 2e-6
23
  - BATCH_SIZE = 8
 
 
24
  - GRAD_ACC_STEPS = 8
25
  - WARMUP_STEPS = 100
26
  - RANK = 16
 
21
  - NUM_EPOCHS = 8
22
  - LEARNING_RATE = 2e-6
23
  - BATCH_SIZE = 8
24
+ - OPTIMIZER = AdamW w/ betas=(0.9,0.999), eps=1e-8, weight_decay=0.01
25
+ - SCHEDULER = Cosine
26
  - GRAD_ACC_STEPS = 8
27
  - WARMUP_STEPS = 100
28
  - RANK = 16