{
  "model": "vitamin_large",
  "exp_name": "unitok_large_causal",
  "output_dir": "local_output",
  "resume_from": "",
  "lpips_path": "",
  "dino_path": "",
  "fid_eval_src": "",
  "fid_eval_dst": "",
  "vis_img_dir": "asset/vis_imgs/",
  "fid_feature_extractor": "",
  "clip_pretrain_path": "",
  "fp16": false,
  "bf16": true,
  "tf32": true,
  "compile_model": false,
  "ddp_static": false,
  "grad_ckpt": true,
  "grad_accu": 1,
  "train_data": "",
  "val_data": null,
  "dataset_type": "webdataset",
  "imagenet_val": "",
  "imagenet_v2": null,
  "subset_ratio": 1.0,
  "img_size": 256,
  "resize_ratio": 1.125,
  "hflip": false,
  "workers": 16,
  "train_num_samples": 1280000000,
  "train_data_upsampling_factors": null,
  "dataset_resampled": false,
  "use_aug": false,
  "vocab_size": 32768,
  "vocab_width": 64,
  "vocab_norm": true,
  "vq_beta": 0.25,
  "num_codebooks": 8,
  "quant_proj": "attn",
  "embed_dim": 768,
  "num_query": 0,
  "use_clip_pretrain": false,
  "patch_size": 16,
  "drop_path": 0.1,
  "text_width": 768,
  "text_heads": 12,
  "text_layers": 12,
  "text_vocab_size": 49408,
  "text_context_length": 77,
  "local_loss": true,
  "gather_with_grad": true,
  "pretrained_clip": null,
  "pretrained_clip_text": null,
  "lock_text": false,
  "lock_text_unlocked_layers": 0,
  "lock_text_freeze_layer_norm": false,
  "force_custom_text": false,
  "force_custom_vision": false,
  "zeroshot_eval_freq": 1,
  "dino_depth": 12,
  "dino_kernel_size": 9,
  "disc_norm": "gn",
  "disc_aug_prob": 1.0,
  "disc_specnorm": false,
  "step_disc_every": 1,
  "vae_init": -0.5,
  "vocab_init": -1,
  "disc_init": -0.5,
  "epoch": 1,
  "local_bs": 56,
  "vae_local_bs": 56,
  "global_bs": 16384,
  "lr": 0.0005,
  "wd": 0.02,
  "disc_lr": 2e-05,
  "disc_wd": 0.2,
  "grad_clip": 10,
  "ema": 0.9999,
  "warmup_iter": null,
  "warmup_ep": 0.01,
  "disc_start_ep": 0.375,
  "disc_warmup_ep": 0.03,
  "schedule": "cos",
  "lr_start_ratio": 0.0,
  "lr_end_ratio": 0.1,
  "disc_lr_end_ratio": 0.1,
  "custom_lr_multiplier": null,
  "optimizer": "adamw",
  "optim_eps": 1e-06,
  "fuse_opt": false,
  "optim_beta": "0.9_0.95",
  "disc_optim_beta": "0.5_0.9",
  "l1": 0.2,
  "l2": 1.0,
  "lp": 1.0,
  "lpr": 48,
  "ld": 0.4,
  "le": 0.0,
  "lq": 1.0,
  "lc": 1.0,
  "e_temp": 0.01,
  "gada": 1,
  "bcr": 4.0,
  "bcr_cut": 0.2,
  "dcrit": "hg",
  "report_wandb": true,
  "wandb_notes": null,
  "run_id": null,
  "eval_per_epoch": 8,
  "dbg_unused_param": false,
  "dbg_nan": false,
  "seed": null,
  "deterministic": false,
  "same_seed_for_all_ranks": 0
}