# Arguments for the `lightning.Fabric` object named by `_target_` below.
# `_recursive_: true` is set at this level, so the nested `_target_` nodes
# (logger, strategy, wrap policy) are part of the same instantiation tree.
fabric:
  # TensorBoard logger; event files are rooted at `root_dir`/`name`.
  loggers:
    _target_: lightning.fabric.loggers.TensorBoardLogger
    root_dir: outputs/logs
    name: llama_full_bradly_terry_rm
    version: null
    sub_dir: null
    default_hp_metric: false
  # FSDP strategy with full sharding and no CPU offload.
  strategy:
    _target_: lightning.fabric.strategies.FSDPStrategy
    sharding_strategy: FULL_SHARD
    cpu_offload: false
    # Policy object built by `get_policy` from the listed layer class path.
    auto_wrap_policy:
      _target_: fusion_bench.mixins.lightning_fabric.get_policy
      _args_:
        - transformers.models.llama.modeling_llama.LlamaDecoderLayer
    # Relative interpolation: resolves to the sibling `auto_wrap_policy` node,
    # so both policies share one definition.
    activation_checkpointing_policy: ${.auto_wrap_policy}
  _target_: lightning.Fabric
  _recursive_: true
  devices: auto
  accelerator: auto
  precision: bf16-true
# Training method configuration. `_recursive_: false` is set here, so the
# nested `optimizer` / `lr_scheduler` nodes are not auto-instantiated with
# the method object itself.
method:
  # NOTE(review): spelled "Bradly" here but "bradley" in the dataset loader
  # path under `modelpool.train_datasets` - confirm the exported class name.
  _target_: fusion_bench.method.BradlyTerryRewardModeling
  _recursive_: false
  optimizer:
    _target_: torch.optim.AdamW
    # NOTE(review): lr is 0 here while `lr_scheduler` carries init/max/min
    # rates - presumably the scheduler drives the rate; confirm.
    lr: 0
    weight_decay: 0.001
    fused: null
  lr_scheduler:
    _target_: fusion_bench.optim.lr_scheduler.CosineDecayWithWarmup
    # Placeholder string, not a number - presumably substituted by the
    # training code before instantiation; TODO confirm.
    T_max: _T_max_
    init_lr: 0
    warmup_steps: 100
    max_lr: 5.0e-06
    min_lr: 1.0e-07
  dataloader_kwargs:
    batch_size: 8
    num_workers: 0
    pin_memory: true
  # NOTE(review): the keys below are placed at the `method` level (not under
  # `dataloader_kwargs`) based on their names - confirm against the method's
  # constructor.
  max_epochs: 2
  max_steps: -1
  max_steps_per_epoch: -1
  accumulate_grad_batches: 16
  lr_scheduler_interval: step
  lr_scheduler_frequency: 1
  checkpoint_save_interval: epoch
  checkpoint_save_frequency: 1
  gradient_clip_val: 1
  gradient_clip_algorithm: norm
  save_optimizer_state: false
  save_full_model: true
  save_ckpt_type: lightning
  ckpt_path: null
  max_length: 4096
  fix_token_embedding: true
# Model pool: one pretrained model entry, its tokenizer, and the training
# dataset. The model id is defined once and reused via relative
# interpolation by the nested nodes.
modelpool:
  _target_: fusion_bench.modelpool.CausalLMPool
  pretrained_model_name_or_path: meta-llama/Llama-3.2-1B-Instruct
  models:
    _pretrained_:
      _target_: fusion_bench.modelpool.seq_classification_lm.create_reward_model_from_pretrained
      # Three dots: climbs from `_pretrained_` through `models` up to
      # `modelpool.pretrained_model_name_or_path`.
      pretrained_model_name_or_path: ${...pretrained_model_name_or_path}
      torch_dtype: bfloat16
      use_flash_attention_2: true
  tokenizer:
    _target_: transformers.AutoTokenizer.from_pretrained
    # Two dots: resolves to `modelpool.pretrained_model_name_or_path`.
    pretrained_model_name_or_path: ${..pretrained_model_name_or_path}
    # Quoted because the token text contains `|` and `>`; the string value
    # is unchanged.
    pad_token: '<|end_of_text|>'
  train_datasets:
    preference_700k:
      _target_: fusion_bench.dataset.llama.preference_700k.load_tokenized_preference_700k_for_bradley_terry_rm
      # Three dots: resolves to the `modelpool.tokenizer` node above.
      tokenizer: ${...tokenizer}
      path: hendrydong/preference_700K
      split: train
      cache_path: null
# Task pool: the dummy pool target.
taskpool:
  _target_: fusion_bench.taskpool.DummyTaskPool
  # NOTE(review): placed under `taskpool` because it precedes the top-level
  # `_target_` key - confirm it is an argument of DummyTaskPool.
  model_save_path: null
# Top-level program entry. `_recursive_: false` here means the `fabric`,
# `method`, `modelpool` and `taskpool` sub-configs are not instantiated
# automatically along with the program object.
_target_: fusion_bench.programs.FabricModelFusionProgram
_recursive_: false
fast_dev_run: false
dry_run: false
print_config: true
report_save_path: null
print_function_call: true