File size: 325 Bytes
d30087d |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 |
# Run configuration for a fine-tuning job.
# NOTE(review): the consuming script is not visible here; the per-key notes
# below are inferred from key names and should be confirmed against the loader.

# Optimisation settings (presumably passed to the trainer/optimizer — confirm).
epochs: 1
batch_size: 16
lr: 0.0003
weight_decay: 0.1
gradient_accumulation_steps: 1

# Model identifier and RNG seed.
model_id: EleutherAI/pythia-410m
seed: 42

# Absolute, machine-specific paths; adjust when running on another host.
dataset_path: /data/user_data/zhilif/soft_mem/pile_tofu_poly_repeated_2.zst
save_dir: /data/locus/llm_weights/zhilif/soft_mem

# Logging settings are grouped under `wandb`. Keep `project` and `group`
# indented: at column 0 they become unrelated top-level keys and `wandb`
# itself parses as null.
wandb:
  project: soft-mem
  group: continual-finetune

# Presumably the maximum sequence length in tokens — TODO confirm.
max_length: 2048
|