| wandb_project: joy-caption-1 | |
| device_batch_size: 2 | |
| batch_size: 256 | |
| learning_rate: 0.0002 | |
| warmup_samples: 18000 | |
| max_samples: 600000 | |
| save_every: 50000 | |
| test_every: 50000 | |
| use_amp: true | |
| grad_scaler: true | |
| lr_scheduler_type: cosine | |
| min_lr_ratio: 0.0 | |
| allow_tf32: true | |
| seed: 69 | |
| num_workers: 8 | |
| optimizer_type: adamw | |
| adam_beta1: 0.9 | |
| adam_beta2: 0.999 | |
| adam_eps: 1.0e-08 | |
| adam_weight_decay: 0.0 | |
| clip_grad_norm: 1.0 | |
| dataset: fancyfeast/joy-captioning-20240924a | |
| clip_model: google/siglip-so400m-patch14-384 | |
| text_model: ../lora-train/lora_model_vwbzycxh | |
| resume: null | |
| gradient_checkpointing: false | |
| test_size: 2048 | |
| grad_scaler_init: 65536.0 | |
| max_caption_length: 257 | |
| num_image_tokens: 32 | |
| adapter_type: mlp | |
| text_model_dtype: bfloat16 | |
| pre_test: false | |
| train_image_model: true | |
| image_model_lr: null | |
| train_lora: true | |
| lora_r: 64 | |
| lora_alpha: 16 | |
| lora_dropout: 0.1 | |
