# Hugging Face page header captured with the file (not part of the config):
# tanganke's picture
# Upload folder using huggingface_hub
# 32c1ec9 verified
# Lightning Fabric settings. Keys that start and end with an underscore
# (`_target_`, `_recursive_`, `_args_`) follow Hydra's instantiate convention:
# `_target_` names the callable to build, the sibling keys are its arguments.
fabric:
  # Logger attached to the Fabric instance.
  loggers:
    _target_: lightning.fabric.loggers.TensorBoardLogger
    root_dir: outputs/logs
    name: llama_full_bradly_terry_rm
    version: null
    sub_dir: null
    default_hp_metric: false
  # Distributed strategy: FSDP with full sharding, no CPU offload.
  strategy:
    _target_: lightning.fabric.strategies.FSDPStrategy
    sharding_strategy: FULL_SHARD
    cpu_offload: false
    # Wrap policy built by `get_policy` from the listed layer class path.
    auto_wrap_policy:
      _target_: fusion_bench.mixins.lightning_fabric.get_policy
      _args_:
        - transformers.models.llama.modeling_llama.LlamaDecoderLayer
    # Relative interpolation: reuses the sibling `auto_wrap_policy` node, so
    # this key must stay at the same level as `auto_wrap_policy`.
    activation_checkpointing_policy: '${.auto_wrap_policy}'
  _target_: lightning.Fabric
  # Nested `_target_` nodes (loggers, strategy) are instantiated as well.
  _recursive_: true
  devices: auto
  accelerator: auto
  precision: bf16-true
# Training method: Bradley-Terry reward modeling (class name is spelled
# `BradlyTerryRewardModeling` in the target path; keep it as-is).
method:
  _target_: fusion_bench.method.BradlyTerryRewardModeling
  # Nested `_target_` nodes below are passed through as config rather than
  # being instantiated together with the method.
  _recursive_: false
  optimizer:
    _target_: torch.optim.AdamW
    # NOTE(review): lr is 0 here; presumably the scheduler below sets the
    # effective learning rate (init_lr -> max_lr -> min_lr) - confirm.
    lr: 0
    weight_decay: 0.001
    fused: null
  lr_scheduler:
    _target_: fusion_bench.optim.lr_scheduler.CosineDecayWithWarmup
    # NOTE(review): `_T_max_` is a literal placeholder string; presumably
    # replaced with the total step count by the training code - confirm.
    T_max: _T_max_
    init_lr: 0
    warmup_steps: 100
    max_lr: 5.0e-06
    min_lr: 1.0e-07
  dataloader_kwargs:
    batch_size: 8
    num_workers: 0
    pin_memory: true
  max_epochs: 2
  # NOTE(review): -1 presumably means "no limit" for both step caps - confirm.
  max_steps: -1
  max_steps_per_epoch: -1
  accumulate_grad_batches: 16
  lr_scheduler_interval: step
  lr_scheduler_frequency: 1
  checkpoint_save_interval: epoch
  checkpoint_save_frequency: 1
  gradient_clip_val: 1
  gradient_clip_algorithm: norm
  save_optimizer_state: false
  save_full_model: true
  save_ckpt_type: lightning
  ckpt_path: null
  max_length: 4096
  fix_token_embedding: true
# Model pool: base checkpoint, tokenizer and training data. The relative
# interpolations below depend on the exact nesting depth of each key, so do
# not move keys between levels without updating the leading dots.
modelpool:
  _target_: fusion_bench.modelpool.CausalLMPool
  pretrained_model_name_or_path: meta-llama/Llama-3.2-1B-Instruct
  models:
    _pretrained_:
      _target_: fusion_bench.modelpool.seq_classification_lm.create_reward_model_from_pretrained
      # Resolves to `modelpool.pretrained_model_name_or_path` (two levels up).
      pretrained_model_name_or_path: '${...pretrained_model_name_or_path}'
      torch_dtype: bfloat16
      use_flash_attention_2: true
  tokenizer:
    _target_: transformers.AutoTokenizer.from_pretrained
    # Resolves to `modelpool.pretrained_model_name_or_path` (one level up).
    pretrained_model_name_or_path: '${..pretrained_model_name_or_path}'
    # Quoted so the angle brackets and pipes are always read as a plain string.
    pad_token: '<|end_of_text|>'
  train_datasets:
    preference_700k:
      _target_: fusion_bench.dataset.llama.preference_700k.load_tokenized_preference_700k_for_bradley_terry_rm
      # Resolves to the `modelpool.tokenizer` node (two levels up).
      tokenizer: '${...tokenizer}'
      path: hendrydong/preference_700K
      split: train
      cache_path: null
# Task pool: a dummy pool is configured, with no model save path set.
# NOTE(review): `model_save_path` is placed under `taskpool` because it sits
# between the taskpool `_target_` and the top-level `_target_` - confirm.
taskpool:
  _target_: fusion_bench.taskpool.DummyTaskPool
  model_save_path: null
# Top-level program settings. `_target_` names the program class that consumes
# the `fabric`, `method`, `modelpool` and `taskpool` sections of this file.
_target_: fusion_bench.programs.FabricModelFusionProgram
# Hydra: do not instantiate nested `_target_` nodes together with the program.
_recursive_: false
# Run-mode and reporting flags; all debugging shortcuts are disabled here.
fast_dev_run: false
dry_run: false
print_config: true
# No report file path is set.
report_save_path: null
print_function_call: true