htlou committed
Commit ae6fda4 · verified · 1 Parent(s): 09fae75

Upload folder using huggingface_hub
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+wandb/run-20241011_202729-hvajn2pl/run-hvajn2pl.wandb filter=lfs diff=lfs merge=lfs -text
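The added pattern routes the new wandb run file through Git LFS, alongside the existing archive and tfevents rules. As a rough sketch of what these patterns select (hypothetical helper; Python's fnmatch only approximates git's wildmatch semantics, e.g. around "*" crossing directory separators):

```python
from fnmatch import fnmatch

# Patterns from the .gitattributes hunk above (approximated with fnmatch).
LFS_PATTERNS = [
    "*.zip",
    "*.zst",
    "*tfevents*",
    "wandb/run-20241011_202729-hvajn2pl/run-hvajn2pl.wandb",
]

def stored_as_lfs_pointer(path: str) -> bool:
    """Return True if the path matches any LFS-tracked pattern."""
    return any(fnmatch(path, pattern) for pattern in LFS_PATTERNS)

print(stored_as_lfs_pointer("wandb/run-20241011_202729-hvajn2pl/run-hvajn2pl.wandb"))  # True
print(stored_as_lfs_pointer("arguments.yaml"))  # False
```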
arguments.yaml ADDED
@@ -0,0 +1,49 @@
+data_cfgs:
+  eval_data_files: null
+  eval_datasets: null
+  eval_optional_args: []
+  eval_size: null
+  eval_split: null
+  eval_subset: null
+  eval_template: null
+  train_data_files: llf_ti2ti_27k_tokenized.pt
+  train_datasets: /data/align-anything/hantao/align-anything/projects/text_image_to_text_image/outputs
+  train_optional_args: []
+  train_size: null
+  train_split: train
+  train_subset: null
+  train_template: AA_textfeedback
+logger_cfgs:
+  cache_dir: null
+  log_project: align-anything
+  log_run_name: sft
+  log_type: wandb
+  output_dir: ../outputs/sft_tf_cham_1011_27k_ti2ti
+  save_interval: 400.0
+model_cfgs:
+  model_max_length: 4096
+  model_name_or_path: /data/align-anything/hantao/models/0916_ti_to_ti_sft/
+  trust_remote_code: true
+special_tokens: null
+train_cfgs:
+  adam_betas:
+  - 0.9
+  - 0.95
+  adam_epsilon: 1.0e-08
+  bf16: true
+  ds_cfgs: ds_z3_config.json
+  epochs: 3.0
+  eval_interval: 1000
+  eval_strategy: steps
+  fp16: false
+  freeze_language_model: false
+  gradient_accumulation_steps: 2.0
+  gradient_checkpointing: true
+  learning_rate: 1.0e-06
+  lr_scheduler_type: cosine
+  lr_warmup_ratio: 0.03
+  max_grad_norm: 1.0
+  per_device_eval_batch_size: 4.0
+  per_device_train_batch_size: 4.0
+  seed: 42
+  weight_decay: 0.0
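A minimal sketch of consuming a config like this, assuming PyYAML and a local copy of the file; it also works out the effective global batch size implied by the values above together with the 8-GPU world size recorded in environ.txt below:

```python
import yaml  # PyYAML; assumes the file is plain YAML as shown above

with open("arguments.yaml") as f:  # hypothetical local copy of the file above
    cfg = yaml.safe_load(f)

train = cfg["train_cfgs"]
world_size = 8  # WORLD_SIZE from environ.txt below
global_batch = (int(train["per_device_train_batch_size"])    # 4
                * int(train["gradient_accumulation_steps"])  # 2
                * world_size)                                # 8
print(global_batch)  # 64 samples per optimizer step
print(train["learning_rate"], cfg["model_cfgs"]["model_max_length"])  # 1e-06 4096
```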
config.json ADDED
The diff for this file is too large to render. See raw diff
 
environ.txt ADDED
@@ -0,0 +1,56 @@
+CONDA_DEFAULT_ENV=hantao_stable
+CONDA_EXE=/data/align-anything/miniconda3/bin/conda
+CONDA_PREFIX=/data/align-anything/miniconda3/envs/hantao_stable
+CONDA_PREFIX_1=/data/align-anything/miniconda3
+CONDA_PROMPT_MODIFIER=(hantao_stable)
+CONDA_PYTHON_EXE=/data/align-anything/miniconda3/bin/python
+CONDA_SHLVL=2
+CRASHDIR=/etc/ShellCrash
+CROSS_RANK=0
+CROSS_SIZE=1
+CUDA_MODULE_LOADING=LAZY
+CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7
+DBUS_SESSION_BUS_ADDRESS=unix:path=/run/user/2000/bus
+HOME=/home/align-anything
+LANG=en_US.UTF-8
+LD_LIBRARY_PATH=/data/align-anything/miniconda3/envs/hantao_stable/lib/python3.11/site-packages/cv2/../../lib64:
+LESSCLOSE=/usr/bin/lesspipe %s %s
+LESSOPEN=| /usr/bin/lesspipe %s
+LOCAL_RANK=0
+LOCAL_SIZE=8
+LOGLEVEL=WARNING
+LOGNAME=align-anything
+LS_COLORS=rs=0:di=01;34:ln=01;36:mh=00:pi=40;33:so=01;35:do=01;35:bd=40;33;01:cd=40;33;01:or=40;31;01:mi=00:su=37;41:sg=30;43:ca=30;41:tw=30;42:ow=34;42:st=37;44:ex=01;32:*.tar=01;31:*.tgz=01;31:*.arc=01;31:*.arj=01;31:*.taz=01;31:*.lha=01;31:*.lz4=01;31:*.lzh=01;31:*.lzma=01;31:*.tlz=01;31:*.txz=01;31:*.tzo=01;31:*.t7z=01;31:*.zip=01;31:*.z=01;31:*.dz=01;31:*.gz=01;31:*.lrz=01;31:*.lz=01;31:*.lzo=01;31:*.xz=01;31:*.zst=01;31:*.tzst=01;31:*.bz2=01;31:*.bz=01;31:*.tbz=01;31:*.tbz2=01;31:*.tz=01;31:*.deb=01;31:*.rpm=01;31:*.jar=01;31:*.war=01;31:*.ear=01;31:*.sar=01;31:*.rar=01;31:*.alz=01;31:*.ace=01;31:*.zoo=01;31:*.cpio=01;31:*.7z=01;31:*.rz=01;31:*.cab=01;31:*.wim=01;31:*.swm=01;31:*.dwm=01;31:*.esd=01;31:*.jpg=01;35:*.jpeg=01;35:*.mjpg=01;35:*.mjpeg=01;35:*.gif=01;35:*.bmp=01;35:*.pbm=01;35:*.pgm=01;35:*.ppm=01;35:*.tga=01;35:*.xbm=01;35:*.xpm=01;35:*.tif=01;35:*.tiff=01;35:*.png=01;35:*.svg=01;35:*.svgz=01;35:*.mng=01;35:*.pcx=01;35:*.mov=01;35:*.mpg=01;35:*.mpeg=01;35:*.m2v=01;35:*.mkv=01;35:*.webm=01;35:*.ogm=01;35:*.mp4=01;35:*.m4v=01;35:*.mp4v=01;35:*.vob=01;35:*.qt=01;35:*.nuv=01;35:*.wmv=01;35:*.asf=01;35:*.rm=01;35:*.rmvb=01;35:*.flc=01;35:*.avi=01;35:*.fli=01;35:*.flv=01;35:*.gl=01;35:*.dl=01;35:*.xcf=01;35:*.xwd=01;35:*.yuv=01;35:*.cgm=01;35:*.emf=01;35:*.ogv=01;35:*.ogx=01;35:*.aac=00;36:*.au=00;36:*.flac=00;36:*.m4a=00;36:*.mid=00;36:*.midi=00;36:*.mka=00;36:*.mp3=00;36:*.mpc=00;36:*.ogg=00;36:*.ra=00;36:*.wav=00;36:*.oga=00;36:*.opus=00;36:*.spx=00;36:*.xspf=00;36:
+MASTER_ADDR=127.0.0.1
+MASTER_PORT=58896
+MOTD_SHOWN=pam
+OLDPWD=/data/align-anything/hantao/align-anything/projects/text_image_to_text_image
+PATH=/data/align-anything/miniconda3/envs/hantao_stable/bin:/data/align-anything/miniconda3/condabin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/usr/local/games:/snap/bin
+PWD=/data/align-anything/hantao/align-anything/scripts
+PYGAME_HIDE_SUPPORT_PROMPT=1
+PYTHONHASHSEED=42
+PYTHONPATH=/data/align-anything/hantao/align-anything
+QT_QPA_FONTDIR=/data/align-anything/miniconda3/envs/hantao_stable/lib/python3.11/site-packages/cv2/qt/fonts
+QT_QPA_PLATFORM_PLUGIN_PATH=/data/align-anything/miniconda3/envs/hantao_stable/lib/python3.11/site-packages/cv2/qt/plugins
+RANK=0
+SHELL=/bin/bash
+SHLVL=3
+SSH_CLIENT=111.205.233.209 27514 30600
+SSH_CONNECTION=111.205.233.209 27514 10.10.212.196 30600
+SSH_TTY=/dev/pts/0
+TERM=screen
+TMUX=/tmp/tmux-2000/default,262430,0
+TMUX_PANE=%0
+TRITON_CACHE_DIR=/home/align-anything/cache/triton
+USER=align-anything
+WANDB_API_KEY=7e2dcc0c310ebcb7cdcafd5e9320d6be55cf1a33
+WANDB_SERVICE=2-320740-tcp-localhost-44893
+WORLD_SIZE=8
+XDG_DATA_DIRS=/usr/local/share:/usr/share:/var/lib/snapd/desktop
+XDG_RUNTIME_DIR=/run/user/2000
+XDG_SESSION_CLASS=user
+XDG_SESSION_ID=73
+XDG_SESSION_TYPE=tty
+_=/data/align-anything/miniconda3/envs/hantao_stable/bin/deepspeed
+_CE_CONDA=
+_CE_M=
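The MASTER_ADDR/MASTER_PORT/RANK/WORLD_SIZE/LOCAL_RANK variables above are the standard rendezvous inputs that a deepspeed launcher exports for each worker. A minimal sketch of how they are consumed (this is PyTorch's documented env:// initialization, not the repository's own launch code):

```python
import os
import torch
import torch.distributed as dist

# With init_method="env://", PyTorch reads MASTER_ADDR, MASTER_PORT,
# RANK, and WORLD_SIZE from the environment -- exactly the variables
# recorded in environ.txt above.
dist.init_process_group(backend="nccl", init_method="env://")

rank = dist.get_rank()               # RANK=0 in this log
world_size = dist.get_world_size()   # WORLD_SIZE=8
local_rank = int(os.environ.get("LOCAL_RANK", "0"))
torch.cuda.set_device(local_rank)    # pin this worker to its GPU
```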
generation_config.json ADDED
@@ -0,0 +1,7 @@
+{
+  "_from_model_config": true,
+  "bos_token_id": 0,
+  "eos_token_id": 2,
+  "pad_token_id": 1,
+  "transformers_version": "4.44.0.dev0"
+}
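These decoding defaults can be loaded back with transformers' GenerationConfig; a small sketch, assuming the file sits in a local checkpoint directory (the directory name here is hypothetical, taken from the output_dir above):

```python
from transformers import GenerationConfig

# from_pretrained reads generation_config.json from the given directory.
gen_cfg = GenerationConfig.from_pretrained("../outputs/sft_tf_cham_1011_27k_ti2ti")
assert gen_cfg.bos_token_id == 0
assert gen_cfg.eos_token_id == 2
assert gen_cfg.pad_token_id == 1
```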
model-00001-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f6df1755613d66ee8a869dfb39698e9efba19900c85e149b0fe9c18a63874e7d
+size 4941356064

model-00002-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7587ca600b9ca68701e951a18a3f0cf4ebd9c46949d66706efb0f19ad94411f2
+size 4857602760

model-00003-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7415d76de1a6519baa413256b3511eac318a9c1d5ee5db94fa73a6232971f22d
+size 4857602816

model-00004-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:05a3f4e7c44c16d0bdcf2fd429736d24230356410916d088cb441be00dbd2b15
+size 4857602816

model-00005-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:de720f40153a1533b903c0f6c59b71c8c50229ab81eec5b7e2eefa8eb6c5f483
+size 4857602816

model-00006-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:509ab97d07fc7d60b1ddb674c4d8793c95c5943207f77252d914a5ae110f4468
+size 3957857092
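Each shard above is stored as a Git LFS pointer: a version line, a sha256 oid, and a byte size. A self-contained sketch (standard library only) of checking a downloaded shard against its pointer:

```python
import hashlib

def verify_lfs_object(path: str, expected_oid: str, expected_size: int) -> bool:
    """Stream the file and compare it to the LFS pointer's sha256 and size."""
    digest = hashlib.sha256()
    size = 0
    with open(path, "rb") as f:
        for chunk in iter(lambda: f.read(1 << 20), b""):  # 1 MiB chunks
            digest.update(chunk)
            size += len(chunk)
    return size == expected_size and digest.hexdigest() == expected_oid

# Values from the model-00001 pointer above.
ok = verify_lfs_object(
    "model-00001-of-00006.safetensors",
    "f6df1755613d66ee8a869dfb39698e9efba19900c85e149b0fe9c18a63874e7d",
    4941356064,
)
print(ok)
```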
model.safetensors.index.json ADDED
@@ -0,0 +1,719 @@
+{
+  "metadata": {
+    "total_size": 28329541132
+  },
+  "weight_map": {
+    "lm_head.weight": "model-00006-of-00006.safetensors",
+    "model.embed_tokens.weight": "model-00001-of-00006.safetensors",
+    "model.layers.0.input_layernorm.weight": "model-00001-of-00006.safetensors",
+    "model.layers.0.mlp.down_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.0.mlp.up_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.0.post_attention_layernorm.weight": "model-00001-of-00006.safetensors",
+    "model.layers.0.self_attn.k_norm.bias": "model-00001-of-00006.safetensors",
+    "model.layers.0.self_attn.k_norm.weight": "model-00001-of-00006.safetensors",
+    "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.0.self_attn.o_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.0.self_attn.q_norm.bias": "model-00001-of-00006.safetensors",
+    "model.layers.0.self_attn.q_norm.weight": "model-00001-of-00006.safetensors",
+    "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.1.input_layernorm.weight": "model-00001-of-00006.safetensors",
+    "model.layers.1.mlp.down_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.1.mlp.gate_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.1.mlp.up_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.1.post_attention_layernorm.weight": "model-00001-of-00006.safetensors",
+    "model.layers.1.self_attn.k_norm.bias": "model-00001-of-00006.safetensors",
+    "model.layers.1.self_attn.k_norm.weight": "model-00001-of-00006.safetensors",
+    "model.layers.1.self_attn.k_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.1.self_attn.o_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.1.self_attn.q_norm.bias": "model-00001-of-00006.safetensors",
+    "model.layers.1.self_attn.q_norm.weight": "model-00001-of-00006.safetensors",
+    "model.layers.1.self_attn.q_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.1.self_attn.v_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.10.input_layernorm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.10.mlp.down_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.10.mlp.gate_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.10.mlp.up_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.10.post_attention_layernorm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.10.self_attn.k_norm.bias": "model-00002-of-00006.safetensors",
+    "model.layers.10.self_attn.k_norm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.10.self_attn.k_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.10.self_attn.o_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.10.self_attn.q_norm.bias": "model-00002-of-00006.safetensors",
+    "model.layers.10.self_attn.q_norm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.10.self_attn.q_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.10.self_attn.v_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.11.input_layernorm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.11.mlp.down_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.11.mlp.gate_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.11.mlp.up_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.11.post_attention_layernorm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.11.self_attn.k_norm.bias": "model-00003-of-00006.safetensors",
+    "model.layers.11.self_attn.k_norm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.11.self_attn.k_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.11.self_attn.o_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.11.self_attn.q_norm.bias": "model-00003-of-00006.safetensors",
+    "model.layers.11.self_attn.q_norm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.11.self_attn.q_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.11.self_attn.v_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.12.input_layernorm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.12.mlp.down_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.12.mlp.gate_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.12.mlp.up_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.12.post_attention_layernorm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.12.self_attn.k_norm.bias": "model-00003-of-00006.safetensors",
+    "model.layers.12.self_attn.k_norm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.12.self_attn.k_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.12.self_attn.o_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.12.self_attn.q_norm.bias": "model-00003-of-00006.safetensors",
+    "model.layers.12.self_attn.q_norm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.12.self_attn.q_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.12.self_attn.v_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.13.input_layernorm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.13.mlp.down_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.13.mlp.gate_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.13.mlp.up_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.13.post_attention_layernorm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.13.self_attn.k_norm.bias": "model-00003-of-00006.safetensors",
+    "model.layers.13.self_attn.k_norm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.13.self_attn.k_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.13.self_attn.o_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.13.self_attn.q_norm.bias": "model-00003-of-00006.safetensors",
+    "model.layers.13.self_attn.q_norm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.13.self_attn.q_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.13.self_attn.v_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.14.input_layernorm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.14.mlp.down_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.14.mlp.gate_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.14.mlp.up_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.14.post_attention_layernorm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.14.self_attn.k_norm.bias": "model-00003-of-00006.safetensors",
+    "model.layers.14.self_attn.k_norm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.14.self_attn.k_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.14.self_attn.o_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.14.self_attn.q_norm.bias": "model-00003-of-00006.safetensors",
+    "model.layers.14.self_attn.q_norm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.14.self_attn.q_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.14.self_attn.v_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.15.input_layernorm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.15.mlp.down_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.15.mlp.gate_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.15.mlp.up_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.15.post_attention_layernorm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.15.self_attn.k_norm.bias": "model-00003-of-00006.safetensors",
+    "model.layers.15.self_attn.k_norm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.15.self_attn.k_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.15.self_attn.o_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.15.self_attn.q_norm.bias": "model-00003-of-00006.safetensors",
+    "model.layers.15.self_attn.q_norm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.15.self_attn.q_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.15.self_attn.v_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.16.input_layernorm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.16.mlp.down_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.16.mlp.gate_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.16.mlp.up_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.16.post_attention_layernorm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.16.self_attn.k_norm.bias": "model-00003-of-00006.safetensors",
+    "model.layers.16.self_attn.k_norm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.16.self_attn.k_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.16.self_attn.o_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.16.self_attn.q_norm.bias": "model-00003-of-00006.safetensors",
+    "model.layers.16.self_attn.q_norm.weight": "model-00003-of-00006.safetensors",
+    "model.layers.16.self_attn.q_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.16.self_attn.v_proj.weight": "model-00003-of-00006.safetensors",
+    "model.layers.17.input_layernorm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.17.mlp.down_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.17.mlp.gate_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.17.mlp.up_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.17.post_attention_layernorm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.17.self_attn.k_norm.bias": "model-00004-of-00006.safetensors",
+    "model.layers.17.self_attn.k_norm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.17.self_attn.k_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.17.self_attn.o_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.17.self_attn.q_norm.bias": "model-00004-of-00006.safetensors",
+    "model.layers.17.self_attn.q_norm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.17.self_attn.q_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.17.self_attn.v_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.18.input_layernorm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.18.mlp.down_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.18.mlp.gate_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.18.mlp.up_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.18.post_attention_layernorm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.18.self_attn.k_norm.bias": "model-00004-of-00006.safetensors",
+    "model.layers.18.self_attn.k_norm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.18.self_attn.k_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.18.self_attn.o_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.18.self_attn.q_norm.bias": "model-00004-of-00006.safetensors",
+    "model.layers.18.self_attn.q_norm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.18.self_attn.q_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.18.self_attn.v_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.19.input_layernorm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.19.mlp.down_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.19.mlp.gate_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.19.mlp.up_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.19.post_attention_layernorm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.19.self_attn.k_norm.bias": "model-00004-of-00006.safetensors",
+    "model.layers.19.self_attn.k_norm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.19.self_attn.k_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.19.self_attn.o_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.19.self_attn.q_norm.bias": "model-00004-of-00006.safetensors",
+    "model.layers.19.self_attn.q_norm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.19.self_attn.q_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.19.self_attn.v_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.2.input_layernorm.weight": "model-00001-of-00006.safetensors",
+    "model.layers.2.mlp.down_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.2.mlp.gate_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.2.mlp.up_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.2.post_attention_layernorm.weight": "model-00001-of-00006.safetensors",
+    "model.layers.2.self_attn.k_norm.bias": "model-00001-of-00006.safetensors",
+    "model.layers.2.self_attn.k_norm.weight": "model-00001-of-00006.safetensors",
+    "model.layers.2.self_attn.k_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.2.self_attn.o_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.2.self_attn.q_norm.bias": "model-00001-of-00006.safetensors",
+    "model.layers.2.self_attn.q_norm.weight": "model-00001-of-00006.safetensors",
+    "model.layers.2.self_attn.q_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.2.self_attn.v_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.20.input_layernorm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.20.mlp.down_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.20.mlp.gate_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.20.mlp.up_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.20.post_attention_layernorm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.20.self_attn.k_norm.bias": "model-00004-of-00006.safetensors",
+    "model.layers.20.self_attn.k_norm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.20.self_attn.k_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.20.self_attn.o_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.20.self_attn.q_norm.bias": "model-00004-of-00006.safetensors",
+    "model.layers.20.self_attn.q_norm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.20.self_attn.q_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.20.self_attn.v_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.21.input_layernorm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.21.mlp.down_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.21.mlp.gate_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.21.mlp.up_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.21.post_attention_layernorm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.21.self_attn.k_norm.bias": "model-00004-of-00006.safetensors",
+    "model.layers.21.self_attn.k_norm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.21.self_attn.k_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.21.self_attn.o_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.21.self_attn.q_norm.bias": "model-00004-of-00006.safetensors",
+    "model.layers.21.self_attn.q_norm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.21.self_attn.q_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.21.self_attn.v_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.22.input_layernorm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.22.mlp.down_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.22.mlp.gate_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.22.mlp.up_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.22.post_attention_layernorm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.22.self_attn.k_norm.bias": "model-00004-of-00006.safetensors",
+    "model.layers.22.self_attn.k_norm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.22.self_attn.k_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.22.self_attn.o_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.22.self_attn.q_norm.bias": "model-00004-of-00006.safetensors",
+    "model.layers.22.self_attn.q_norm.weight": "model-00004-of-00006.safetensors",
+    "model.layers.22.self_attn.q_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.22.self_attn.v_proj.weight": "model-00004-of-00006.safetensors",
+    "model.layers.23.input_layernorm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.23.mlp.down_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.23.mlp.gate_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.23.mlp.up_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.23.post_attention_layernorm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.23.self_attn.k_norm.bias": "model-00005-of-00006.safetensors",
+    "model.layers.23.self_attn.k_norm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.23.self_attn.k_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.23.self_attn.o_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.23.self_attn.q_norm.bias": "model-00005-of-00006.safetensors",
+    "model.layers.23.self_attn.q_norm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.23.self_attn.q_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.23.self_attn.v_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.24.input_layernorm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.24.mlp.down_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.24.mlp.gate_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.24.mlp.up_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.24.post_attention_layernorm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.24.self_attn.k_norm.bias": "model-00005-of-00006.safetensors",
+    "model.layers.24.self_attn.k_norm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.24.self_attn.k_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.24.self_attn.o_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.24.self_attn.q_norm.bias": "model-00005-of-00006.safetensors",
+    "model.layers.24.self_attn.q_norm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.24.self_attn.q_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.24.self_attn.v_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.25.input_layernorm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.25.mlp.down_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.25.mlp.gate_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.25.mlp.up_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.25.post_attention_layernorm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.25.self_attn.k_norm.bias": "model-00005-of-00006.safetensors",
+    "model.layers.25.self_attn.k_norm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.25.self_attn.k_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.25.self_attn.o_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.25.self_attn.q_norm.bias": "model-00005-of-00006.safetensors",
+    "model.layers.25.self_attn.q_norm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.25.self_attn.q_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.25.self_attn.v_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.26.input_layernorm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.26.mlp.down_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.26.mlp.gate_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.26.mlp.up_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.26.post_attention_layernorm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.26.self_attn.k_norm.bias": "model-00005-of-00006.safetensors",
+    "model.layers.26.self_attn.k_norm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.26.self_attn.k_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.26.self_attn.o_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.26.self_attn.q_norm.bias": "model-00005-of-00006.safetensors",
+    "model.layers.26.self_attn.q_norm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.26.self_attn.q_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.26.self_attn.v_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.27.input_layernorm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.27.mlp.down_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.27.mlp.gate_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.27.mlp.up_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.27.post_attention_layernorm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.27.self_attn.k_norm.bias": "model-00005-of-00006.safetensors",
+    "model.layers.27.self_attn.k_norm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.27.self_attn.k_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.27.self_attn.o_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.27.self_attn.q_norm.bias": "model-00005-of-00006.safetensors",
+    "model.layers.27.self_attn.q_norm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.27.self_attn.q_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.27.self_attn.v_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.28.input_layernorm.weight": "model-00006-of-00006.safetensors",
+    "model.layers.28.mlp.down_proj.weight": "model-00006-of-00006.safetensors",
+    "model.layers.28.mlp.gate_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.28.mlp.up_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.28.post_attention_layernorm.weight": "model-00006-of-00006.safetensors",
+    "model.layers.28.self_attn.k_norm.bias": "model-00005-of-00006.safetensors",
+    "model.layers.28.self_attn.k_norm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.28.self_attn.k_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.28.self_attn.o_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.28.self_attn.q_norm.bias": "model-00005-of-00006.safetensors",
+    "model.layers.28.self_attn.q_norm.weight": "model-00005-of-00006.safetensors",
+    "model.layers.28.self_attn.q_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.28.self_attn.v_proj.weight": "model-00005-of-00006.safetensors",
+    "model.layers.29.input_layernorm.weight": "model-00006-of-00006.safetensors",
+    "model.layers.29.mlp.down_proj.weight": "model-00006-of-00006.safetensors",
+    "model.layers.29.mlp.gate_proj.weight": "model-00006-of-00006.safetensors",
+    "model.layers.29.mlp.up_proj.weight": "model-00006-of-00006.safetensors",
+    "model.layers.29.post_attention_layernorm.weight": "model-00006-of-00006.safetensors",
+    "model.layers.29.self_attn.k_norm.bias": "model-00006-of-00006.safetensors",
+    "model.layers.29.self_attn.k_norm.weight": "model-00006-of-00006.safetensors",
+    "model.layers.29.self_attn.k_proj.weight": "model-00006-of-00006.safetensors",
+    "model.layers.29.self_attn.o_proj.weight": "model-00006-of-00006.safetensors",
+    "model.layers.29.self_attn.q_norm.bias": "model-00006-of-00006.safetensors",
+    "model.layers.29.self_attn.q_norm.weight": "model-00006-of-00006.safetensors",
+    "model.layers.29.self_attn.q_proj.weight": "model-00006-of-00006.safetensors",
+    "model.layers.29.self_attn.v_proj.weight": "model-00006-of-00006.safetensors",
+    "model.layers.3.input_layernorm.weight": "model-00001-of-00006.safetensors",
+    "model.layers.3.mlp.down_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.3.mlp.gate_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.3.mlp.up_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.3.post_attention_layernorm.weight": "model-00001-of-00006.safetensors",
+    "model.layers.3.self_attn.k_norm.bias": "model-00001-of-00006.safetensors",
+    "model.layers.3.self_attn.k_norm.weight": "model-00001-of-00006.safetensors",
+    "model.layers.3.self_attn.k_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.3.self_attn.o_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.3.self_attn.q_norm.bias": "model-00001-of-00006.safetensors",
+    "model.layers.3.self_attn.q_norm.weight": "model-00001-of-00006.safetensors",
+    "model.layers.3.self_attn.q_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.3.self_attn.v_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.30.input_layernorm.weight": "model-00006-of-00006.safetensors",
+    "model.layers.30.mlp.down_proj.weight": "model-00006-of-00006.safetensors",
+    "model.layers.30.mlp.gate_proj.weight": "model-00006-of-00006.safetensors",
+    "model.layers.30.mlp.up_proj.weight": "model-00006-of-00006.safetensors",
+    "model.layers.30.post_attention_layernorm.weight": "model-00006-of-00006.safetensors",
+    "model.layers.30.self_attn.k_norm.bias": "model-00006-of-00006.safetensors",
+    "model.layers.30.self_attn.k_norm.weight": "model-00006-of-00006.safetensors",
+    "model.layers.30.self_attn.k_proj.weight": "model-00006-of-00006.safetensors",
+    "model.layers.30.self_attn.o_proj.weight": "model-00006-of-00006.safetensors",
+    "model.layers.30.self_attn.q_norm.bias": "model-00006-of-00006.safetensors",
+    "model.layers.30.self_attn.q_norm.weight": "model-00006-of-00006.safetensors",
+    "model.layers.30.self_attn.q_proj.weight": "model-00006-of-00006.safetensors",
+    "model.layers.30.self_attn.v_proj.weight": "model-00006-of-00006.safetensors",
+    "model.layers.31.input_layernorm.weight": "model-00006-of-00006.safetensors",
+    "model.layers.31.mlp.down_proj.weight": "model-00006-of-00006.safetensors",
+    "model.layers.31.mlp.gate_proj.weight": "model-00006-of-00006.safetensors",
+    "model.layers.31.mlp.up_proj.weight": "model-00006-of-00006.safetensors",
+    "model.layers.31.post_attention_layernorm.weight": "model-00006-of-00006.safetensors",
+    "model.layers.31.self_attn.k_norm.bias": "model-00006-of-00006.safetensors",
+    "model.layers.31.self_attn.k_norm.weight": "model-00006-of-00006.safetensors",
+    "model.layers.31.self_attn.k_proj.weight": "model-00006-of-00006.safetensors",
+    "model.layers.31.self_attn.o_proj.weight": "model-00006-of-00006.safetensors",
+    "model.layers.31.self_attn.q_norm.bias": "model-00006-of-00006.safetensors",
+    "model.layers.31.self_attn.q_norm.weight": "model-00006-of-00006.safetensors",
+    "model.layers.31.self_attn.q_proj.weight": "model-00006-of-00006.safetensors",
+    "model.layers.31.self_attn.v_proj.weight": "model-00006-of-00006.safetensors",
+    "model.layers.4.input_layernorm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.4.mlp.down_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.4.mlp.gate_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.4.mlp.up_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.4.post_attention_layernorm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.4.self_attn.k_norm.bias": "model-00001-of-00006.safetensors",
+    "model.layers.4.self_attn.k_norm.weight": "model-00001-of-00006.safetensors",
+    "model.layers.4.self_attn.k_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.4.self_attn.o_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.4.self_attn.q_norm.bias": "model-00001-of-00006.safetensors",
+    "model.layers.4.self_attn.q_norm.weight": "model-00001-of-00006.safetensors",
+    "model.layers.4.self_attn.q_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.4.self_attn.v_proj.weight": "model-00001-of-00006.safetensors",
+    "model.layers.5.input_layernorm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.5.mlp.down_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.5.mlp.gate_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.5.mlp.up_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.5.post_attention_layernorm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.5.self_attn.k_norm.bias": "model-00002-of-00006.safetensors",
+    "model.layers.5.self_attn.k_norm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.5.self_attn.k_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.5.self_attn.o_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.5.self_attn.q_norm.bias": "model-00002-of-00006.safetensors",
+    "model.layers.5.self_attn.q_norm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.5.self_attn.q_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.5.self_attn.v_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.6.input_layernorm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.6.mlp.down_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.6.mlp.gate_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.6.mlp.up_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.6.post_attention_layernorm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.6.self_attn.k_norm.bias": "model-00002-of-00006.safetensors",
+    "model.layers.6.self_attn.k_norm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.6.self_attn.k_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.6.self_attn.o_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.6.self_attn.q_norm.bias": "model-00002-of-00006.safetensors",
+    "model.layers.6.self_attn.q_norm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.6.self_attn.q_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.6.self_attn.v_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.7.input_layernorm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.7.mlp.down_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.7.mlp.gate_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.7.mlp.up_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.7.post_attention_layernorm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.7.self_attn.k_norm.bias": "model-00002-of-00006.safetensors",
+    "model.layers.7.self_attn.k_norm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.7.self_attn.k_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.7.self_attn.o_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.7.self_attn.q_norm.bias": "model-00002-of-00006.safetensors",
+    "model.layers.7.self_attn.q_norm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.7.self_attn.q_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.7.self_attn.v_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.8.input_layernorm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.8.mlp.down_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.8.mlp.gate_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.8.mlp.up_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.8.post_attention_layernorm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.8.self_attn.k_norm.bias": "model-00002-of-00006.safetensors",
+    "model.layers.8.self_attn.k_norm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.8.self_attn.k_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.8.self_attn.o_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.8.self_attn.q_norm.bias": "model-00002-of-00006.safetensors",
+    "model.layers.8.self_attn.q_norm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.8.self_attn.q_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.8.self_attn.v_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.9.input_layernorm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.9.mlp.down_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.9.mlp.gate_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.9.mlp.up_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.9.post_attention_layernorm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.9.self_attn.k_norm.bias": "model-00002-of-00006.safetensors",
+    "model.layers.9.self_attn.k_norm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.9.self_attn.k_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.9.self_attn.o_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.9.self_attn.q_norm.bias": "model-00002-of-00006.safetensors",
+    "model.layers.9.self_attn.q_norm.weight": "model-00002-of-00006.safetensors",
+    "model.layers.9.self_attn.q_proj.weight": "model-00002-of-00006.safetensors",
+    "model.layers.9.self_attn.v_proj.weight": "model-00002-of-00006.safetensors",
+    "model.norm.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.conv_in.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.conv_in.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.conv_out.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.conv_out.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.attn_1.k.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.attn_1.k.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.attn_1.norm.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.attn_1.norm.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.attn_1.proj_out.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.attn_1.proj_out.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.attn_1.q.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.attn_1.q.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.attn_1.v.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.attn_1.v.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.block_1.conv1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.block_1.conv1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.block_1.conv2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.block_1.conv2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.block_1.norm1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.block_1.norm1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.block_1.norm2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.block_1.norm2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.block_2.conv1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.block_2.conv1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.block_2.conv2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.block_2.conv2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.block_2.norm1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.block_2.norm1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.block_2.norm2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.mid.block_2.norm2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.norm_out.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.norm_out.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.0.conv1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.0.conv1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.0.conv2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.0.conv2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.0.norm1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.0.norm1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.0.norm2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.0.norm2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.1.conv1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.1.conv1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.1.conv2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.1.conv2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.1.norm1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.1.norm1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.1.norm2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.1.norm2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.2.conv1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.2.conv1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.2.conv2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.2.conv2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.2.norm1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.2.norm1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.2.norm2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.0.block.2.norm2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.0.conv1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.0.conv1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.0.conv2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.0.conv2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.0.nin_shortcut.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.0.nin_shortcut.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.0.norm1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.0.norm1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.0.norm2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.0.norm2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.1.conv1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.1.conv1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.1.conv2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.1.conv2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.1.norm1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.1.norm1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.1.norm2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.1.norm2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.2.conv1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.2.conv1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.2.conv2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.2.conv2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.2.norm1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.2.norm1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.2.norm2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.block.2.norm2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.upsample.conv.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.1.upsample.conv.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.0.conv1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.0.conv1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.0.conv2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.0.conv2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.0.norm1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.0.norm1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.0.norm2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.0.norm2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.1.conv1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.1.conv1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.1.conv2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.1.conv2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.1.norm1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.1.norm1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.1.norm2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.1.norm2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.2.conv1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.2.conv1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.2.conv2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.2.conv2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.2.norm1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.2.norm1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.2.norm2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.block.2.norm2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.upsample.conv.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.2.upsample.conv.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.0.conv1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.0.conv1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.0.conv2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.0.conv2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.0.nin_shortcut.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.0.nin_shortcut.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.0.norm1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.0.norm1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.0.norm2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.0.norm2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.1.conv1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.1.conv1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.1.conv2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.1.conv2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.1.norm1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.1.norm1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.1.norm2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.1.norm2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.2.conv1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.2.conv1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.2.conv2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.2.conv2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.2.norm1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.2.norm1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.2.norm2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.block.2.norm2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.upsample.conv.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.3.upsample.conv.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.0.conv1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.0.conv1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.0.conv2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.0.conv2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.0.norm1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.0.norm1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.0.norm2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.0.norm2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.1.conv1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.1.conv1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.1.conv2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.1.conv2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.1.norm1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.1.norm1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.1.norm2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.1.norm2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.2.conv1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.2.conv1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.2.conv2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.2.conv2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.2.norm1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.2.norm1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.2.norm2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.block.2.norm2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.upsample.conv.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.decoder.up.4.upsample.conv.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.encoder.conv_in.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.encoder.conv_in.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.encoder.conv_out.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.encoder.conv_out.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.encoder.down.0.block.0.conv1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.encoder.down.0.block.0.conv1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.encoder.down.0.block.0.conv2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.encoder.down.0.block.0.conv2.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.encoder.down.0.block.0.norm1.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.encoder.down.0.block.0.norm1.weight": "model-00006-of-00006.safetensors",
+    "model.vqmodel.encoder.down.0.block.0.norm2.bias": "model-00006-of-00006.safetensors",
+    "model.vqmodel.encoder.down.0.block.0.norm2.weight": "model-00006-of-00006.safetensors"
601
+ "model.vqmodel.encoder.down.0.block.1.conv1.bias": "model-00006-of-00006.safetensors",
602
+ "model.vqmodel.encoder.down.0.block.1.conv1.weight": "model-00006-of-00006.safetensors",
603
+ "model.vqmodel.encoder.down.0.block.1.conv2.bias": "model-00006-of-00006.safetensors",
604
+ "model.vqmodel.encoder.down.0.block.1.conv2.weight": "model-00006-of-00006.safetensors",
605
+ "model.vqmodel.encoder.down.0.block.1.norm1.bias": "model-00006-of-00006.safetensors",
606
+ "model.vqmodel.encoder.down.0.block.1.norm1.weight": "model-00006-of-00006.safetensors",
607
+ "model.vqmodel.encoder.down.0.block.1.norm2.bias": "model-00006-of-00006.safetensors",
608
+ "model.vqmodel.encoder.down.0.block.1.norm2.weight": "model-00006-of-00006.safetensors",
609
+ "model.vqmodel.encoder.down.0.downsample.conv.bias": "model-00006-of-00006.safetensors",
610
+ "model.vqmodel.encoder.down.0.downsample.conv.weight": "model-00006-of-00006.safetensors",
611
+ "model.vqmodel.encoder.down.1.block.0.conv1.bias": "model-00006-of-00006.safetensors",
612
+ "model.vqmodel.encoder.down.1.block.0.conv1.weight": "model-00006-of-00006.safetensors",
613
+ "model.vqmodel.encoder.down.1.block.0.conv2.bias": "model-00006-of-00006.safetensors",
614
+ "model.vqmodel.encoder.down.1.block.0.conv2.weight": "model-00006-of-00006.safetensors",
615
+ "model.vqmodel.encoder.down.1.block.0.norm1.bias": "model-00006-of-00006.safetensors",
616
+ "model.vqmodel.encoder.down.1.block.0.norm1.weight": "model-00006-of-00006.safetensors",
617
+ "model.vqmodel.encoder.down.1.block.0.norm2.bias": "model-00006-of-00006.safetensors",
618
+ "model.vqmodel.encoder.down.1.block.0.norm2.weight": "model-00006-of-00006.safetensors",
619
+ "model.vqmodel.encoder.down.1.block.1.conv1.bias": "model-00006-of-00006.safetensors",
620
+ "model.vqmodel.encoder.down.1.block.1.conv1.weight": "model-00006-of-00006.safetensors",
621
+ "model.vqmodel.encoder.down.1.block.1.conv2.bias": "model-00006-of-00006.safetensors",
622
+ "model.vqmodel.encoder.down.1.block.1.conv2.weight": "model-00006-of-00006.safetensors",
623
+ "model.vqmodel.encoder.down.1.block.1.norm1.bias": "model-00006-of-00006.safetensors",
624
+ "model.vqmodel.encoder.down.1.block.1.norm1.weight": "model-00006-of-00006.safetensors",
625
+ "model.vqmodel.encoder.down.1.block.1.norm2.bias": "model-00006-of-00006.safetensors",
626
+ "model.vqmodel.encoder.down.1.block.1.norm2.weight": "model-00006-of-00006.safetensors",
627
+ "model.vqmodel.encoder.down.1.downsample.conv.bias": "model-00006-of-00006.safetensors",
628
+ "model.vqmodel.encoder.down.1.downsample.conv.weight": "model-00006-of-00006.safetensors",
629
+ "model.vqmodel.encoder.down.2.block.0.conv1.bias": "model-00006-of-00006.safetensors",
630
+ "model.vqmodel.encoder.down.2.block.0.conv1.weight": "model-00006-of-00006.safetensors",
631
+ "model.vqmodel.encoder.down.2.block.0.conv2.bias": "model-00006-of-00006.safetensors",
632
+ "model.vqmodel.encoder.down.2.block.0.conv2.weight": "model-00006-of-00006.safetensors",
633
+ "model.vqmodel.encoder.down.2.block.0.nin_shortcut.bias": "model-00006-of-00006.safetensors",
634
+ "model.vqmodel.encoder.down.2.block.0.nin_shortcut.weight": "model-00006-of-00006.safetensors",
635
+ "model.vqmodel.encoder.down.2.block.0.norm1.bias": "model-00006-of-00006.safetensors",
636
+ "model.vqmodel.encoder.down.2.block.0.norm1.weight": "model-00006-of-00006.safetensors",
637
+ "model.vqmodel.encoder.down.2.block.0.norm2.bias": "model-00006-of-00006.safetensors",
638
+ "model.vqmodel.encoder.down.2.block.0.norm2.weight": "model-00006-of-00006.safetensors",
639
+ "model.vqmodel.encoder.down.2.block.1.conv1.bias": "model-00006-of-00006.safetensors",
640
+ "model.vqmodel.encoder.down.2.block.1.conv1.weight": "model-00006-of-00006.safetensors",
641
+ "model.vqmodel.encoder.down.2.block.1.conv2.bias": "model-00006-of-00006.safetensors",
642
+ "model.vqmodel.encoder.down.2.block.1.conv2.weight": "model-00006-of-00006.safetensors",
643
+ "model.vqmodel.encoder.down.2.block.1.norm1.bias": "model-00006-of-00006.safetensors",
644
+ "model.vqmodel.encoder.down.2.block.1.norm1.weight": "model-00006-of-00006.safetensors",
645
+ "model.vqmodel.encoder.down.2.block.1.norm2.bias": "model-00006-of-00006.safetensors",
646
+ "model.vqmodel.encoder.down.2.block.1.norm2.weight": "model-00006-of-00006.safetensors",
647
+ "model.vqmodel.encoder.down.2.downsample.conv.bias": "model-00006-of-00006.safetensors",
648
+ "model.vqmodel.encoder.down.2.downsample.conv.weight": "model-00006-of-00006.safetensors",
649
+ "model.vqmodel.encoder.down.3.block.0.conv1.bias": "model-00006-of-00006.safetensors",
650
+ "model.vqmodel.encoder.down.3.block.0.conv1.weight": "model-00006-of-00006.safetensors",
651
+ "model.vqmodel.encoder.down.3.block.0.conv2.bias": "model-00006-of-00006.safetensors",
652
+ "model.vqmodel.encoder.down.3.block.0.conv2.weight": "model-00006-of-00006.safetensors",
653
+ "model.vqmodel.encoder.down.3.block.0.norm1.bias": "model-00006-of-00006.safetensors",
654
+ "model.vqmodel.encoder.down.3.block.0.norm1.weight": "model-00006-of-00006.safetensors",
655
+ "model.vqmodel.encoder.down.3.block.0.norm2.bias": "model-00006-of-00006.safetensors",
656
+ "model.vqmodel.encoder.down.3.block.0.norm2.weight": "model-00006-of-00006.safetensors",
657
+ "model.vqmodel.encoder.down.3.block.1.conv1.bias": "model-00006-of-00006.safetensors",
658
+ "model.vqmodel.encoder.down.3.block.1.conv1.weight": "model-00006-of-00006.safetensors",
659
+ "model.vqmodel.encoder.down.3.block.1.conv2.bias": "model-00006-of-00006.safetensors",
660
+ "model.vqmodel.encoder.down.3.block.1.conv2.weight": "model-00006-of-00006.safetensors",
661
+ "model.vqmodel.encoder.down.3.block.1.norm1.bias": "model-00006-of-00006.safetensors",
662
+ "model.vqmodel.encoder.down.3.block.1.norm1.weight": "model-00006-of-00006.safetensors",
663
+ "model.vqmodel.encoder.down.3.block.1.norm2.bias": "model-00006-of-00006.safetensors",
664
+ "model.vqmodel.encoder.down.3.block.1.norm2.weight": "model-00006-of-00006.safetensors",
665
+ "model.vqmodel.encoder.down.3.downsample.conv.bias": "model-00006-of-00006.safetensors",
666
+ "model.vqmodel.encoder.down.3.downsample.conv.weight": "model-00006-of-00006.safetensors",
667
+ "model.vqmodel.encoder.down.4.block.0.conv1.bias": "model-00006-of-00006.safetensors",
668
+ "model.vqmodel.encoder.down.4.block.0.conv1.weight": "model-00006-of-00006.safetensors",
669
+ "model.vqmodel.encoder.down.4.block.0.conv2.bias": "model-00006-of-00006.safetensors",
670
+ "model.vqmodel.encoder.down.4.block.0.conv2.weight": "model-00006-of-00006.safetensors",
671
+ "model.vqmodel.encoder.down.4.block.0.nin_shortcut.bias": "model-00006-of-00006.safetensors",
672
+ "model.vqmodel.encoder.down.4.block.0.nin_shortcut.weight": "model-00006-of-00006.safetensors",
673
+ "model.vqmodel.encoder.down.4.block.0.norm1.bias": "model-00006-of-00006.safetensors",
674
+ "model.vqmodel.encoder.down.4.block.0.norm1.weight": "model-00006-of-00006.safetensors",
675
+ "model.vqmodel.encoder.down.4.block.0.norm2.bias": "model-00006-of-00006.safetensors",
676
+ "model.vqmodel.encoder.down.4.block.0.norm2.weight": "model-00006-of-00006.safetensors",
677
+ "model.vqmodel.encoder.down.4.block.1.conv1.bias": "model-00006-of-00006.safetensors",
678
+ "model.vqmodel.encoder.down.4.block.1.conv1.weight": "model-00006-of-00006.safetensors",
679
+ "model.vqmodel.encoder.down.4.block.1.conv2.bias": "model-00006-of-00006.safetensors",
680
+ "model.vqmodel.encoder.down.4.block.1.conv2.weight": "model-00006-of-00006.safetensors",
681
+ "model.vqmodel.encoder.down.4.block.1.norm1.bias": "model-00006-of-00006.safetensors",
682
+ "model.vqmodel.encoder.down.4.block.1.norm1.weight": "model-00006-of-00006.safetensors",
683
+ "model.vqmodel.encoder.down.4.block.1.norm2.bias": "model-00006-of-00006.safetensors",
684
+ "model.vqmodel.encoder.down.4.block.1.norm2.weight": "model-00006-of-00006.safetensors",
685
+ "model.vqmodel.encoder.mid.attn_1.k.bias": "model-00006-of-00006.safetensors",
686
+ "model.vqmodel.encoder.mid.attn_1.k.weight": "model-00006-of-00006.safetensors",
687
+ "model.vqmodel.encoder.mid.attn_1.norm.bias": "model-00006-of-00006.safetensors",
688
+ "model.vqmodel.encoder.mid.attn_1.norm.weight": "model-00006-of-00006.safetensors",
689
+ "model.vqmodel.encoder.mid.attn_1.proj_out.bias": "model-00006-of-00006.safetensors",
690
+ "model.vqmodel.encoder.mid.attn_1.proj_out.weight": "model-00006-of-00006.safetensors",
691
+ "model.vqmodel.encoder.mid.attn_1.q.bias": "model-00006-of-00006.safetensors",
692
+ "model.vqmodel.encoder.mid.attn_1.q.weight": "model-00006-of-00006.safetensors",
693
+ "model.vqmodel.encoder.mid.attn_1.v.bias": "model-00006-of-00006.safetensors",
694
+ "model.vqmodel.encoder.mid.attn_1.v.weight": "model-00006-of-00006.safetensors",
695
+ "model.vqmodel.encoder.mid.block_1.conv1.bias": "model-00006-of-00006.safetensors",
696
+ "model.vqmodel.encoder.mid.block_1.conv1.weight": "model-00006-of-00006.safetensors",
697
+ "model.vqmodel.encoder.mid.block_1.conv2.bias": "model-00006-of-00006.safetensors",
698
+ "model.vqmodel.encoder.mid.block_1.conv2.weight": "model-00006-of-00006.safetensors",
699
+ "model.vqmodel.encoder.mid.block_1.norm1.bias": "model-00006-of-00006.safetensors",
700
+ "model.vqmodel.encoder.mid.block_1.norm1.weight": "model-00006-of-00006.safetensors",
701
+ "model.vqmodel.encoder.mid.block_1.norm2.bias": "model-00006-of-00006.safetensors",
702
+ "model.vqmodel.encoder.mid.block_1.norm2.weight": "model-00006-of-00006.safetensors",
703
+ "model.vqmodel.encoder.mid.block_2.conv1.bias": "model-00006-of-00006.safetensors",
704
+ "model.vqmodel.encoder.mid.block_2.conv1.weight": "model-00006-of-00006.safetensors",
705
+ "model.vqmodel.encoder.mid.block_2.conv2.bias": "model-00006-of-00006.safetensors",
706
+ "model.vqmodel.encoder.mid.block_2.conv2.weight": "model-00006-of-00006.safetensors",
707
+ "model.vqmodel.encoder.mid.block_2.norm1.bias": "model-00006-of-00006.safetensors",
708
+ "model.vqmodel.encoder.mid.block_2.norm1.weight": "model-00006-of-00006.safetensors",
709
+ "model.vqmodel.encoder.mid.block_2.norm2.bias": "model-00006-of-00006.safetensors",
710
+ "model.vqmodel.encoder.mid.block_2.norm2.weight": "model-00006-of-00006.safetensors",
711
+ "model.vqmodel.encoder.norm_out.bias": "model-00006-of-00006.safetensors",
712
+ "model.vqmodel.encoder.norm_out.weight": "model-00006-of-00006.safetensors",
713
+ "model.vqmodel.post_quant_conv.bias": "model-00006-of-00006.safetensors",
714
+ "model.vqmodel.post_quant_conv.weight": "model-00006-of-00006.safetensors",
715
+ "model.vqmodel.quant_conv.bias": "model-00006-of-00006.safetensors",
716
+ "model.vqmodel.quant_conv.weight": "model-00006-of-00006.safetensors",
717
+ "model.vqmodel.quantize.embedding.weight": "model-00006-of-00006.safetensors"
718
+ }
719
+ }
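A note on the index above: it is the tail of a sharded safetensors weight map, and every `model.vqmodel.*` tensor (the Chameleon VQ encoder/decoder) lands in the final shard, `model-00006-of-00006.safetensors`. Below is a minimal sketch of how such an index is consumed, assuming the `safetensors` package and a working directory containing the index and shard files:

```python
import json
from collections import Counter
from safetensors import safe_open

# Group parameter names by the shard file that stores them.
with open("model.safetensors.index.json") as f:
    index = json.load(f)

weight_map = index["weight_map"]     # {"param.name": "model-0000X-of-00006.safetensors", ...}
print(Counter(weight_map.values()))  # all model.vqmodel.* tensors sit in shard 6

# Load a single tensor by opening only the shard that holds it.
key = "model.vqmodel.quantize.embedding.weight"
with safe_open(weight_map[key], framework="pt") as shard:
    tensor = shard.get_tensor(key)
```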
preprocessor_config.json ADDED
@@ -0,0 +1,28 @@
+ {
+ "crop_size": {
+ "height": 512,
+ "width": 512
+ },
+ "do_center_crop": true,
+ "do_convert_rgb": true,
+ "do_normalize": true,
+ "do_rescale": true,
+ "do_resize": true,
+ "image_mean": [
+ 1.0,
+ 1.0,
+ 1.0
+ ],
+ "image_processor_type": "ChameleonImageProcessor",
+ "image_std": [
+ 1.0,
+ 1.0,
+ 1.0
+ ],
+ "processor_class": "ChameleonProcessor",
+ "resample": 1,
+ "rescale_factor": 0.0078,
+ "size": {
+ "shortest_edge": 512
+ }
+ }
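Two values in this config are worth flagging: `rescale_factor` is 0.0078 (about 1/128, not the usual 1/255), and `image_mean`/`image_std` are all 1.0. Rescaling then normalizing therefore maps a pixel value p to p * 0.0078 - 1.0, sending [0, 255] onto roughly [-1.0, 0.99]. A small NumPy sketch of that arithmetic (standing in for what `ChameleonImageProcessor` does internally):

```python
import numpy as np

def preprocess(pixels: np.ndarray) -> np.ndarray:
    rescaled = pixels * 0.0078     # do_rescale with rescale_factor=0.0078
    return (rescaled - 1.0) / 1.0  # do_normalize with mean=1.0, std=1.0

print(preprocess(np.array([0, 128, 255])))  # [-1.0, -0.0016, 0.989]
```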
processor_config.json ADDED
@@ -0,0 +1,5 @@
+ {
+ "image_seq_length": 1024,
+ "image_token": "<image>",
+ "processor_class": "ChameleonProcessor"
+ }
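`image_seq_length: 1024` is the number of token positions each `<image>` placeholder occupies in the sequence; with the 512x512 crops above, this is consistent with a 32x32 grid of VQ codes (32 * 32 = 1024), though the exact grid shape is an assumption here, not something this file states. A toy sketch of the placeholder expansion the processor performs:

```python
IMAGE_SEQ_LENGTH = 1024  # from processor_config.json
IMAGE_TOKEN = "<image>"

prompt = f"Describe this picture: {IMAGE_TOKEN}"
expanded = prompt.replace(IMAGE_TOKEN, IMAGE_TOKEN * IMAGE_SEQ_LENGTH)
print(expanded.count(IMAGE_TOKEN))  # 1024 image-token slots for the model to fill
```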
script.sh ADDED
@@ -0,0 +1,48 @@
+ #!/usr/bin/env bash
+ #
+ # Copyright 2024 PKU-Alignment Team. All Rights Reserved.
+ #
+ # Licensed under the Apache License, Version 2.0 (the "License");
+ # you may not use this file except in compliance with the License.
+ # You may obtain a copy of the License at
+ #
+ # http://www.apache.org/licenses/LICENSE-2.0
+ #
+ # Unless required by applicable law or agreed to in writing, software
+ # distributed under the License is distributed on an "AS IS" BASIS,
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ # See the License for the specific language governing permissions and
+ # limitations under the License.
+ # ==============================================================================
+
+ export TRITON_CACHE_DIR="/home/align-anything/cache/triton"
+ # You can replace it with a local model path
+ MODEL_NAME_OR_PATH="/data/align-anything/hantao/models/0916_ti_to_ti_sft/"
+ # You can replace it with a local dataset path
+ TRAIN_DATASETS="/data/align-anything/hantao/align-anything/projects/text_image_to_text_image/outputs"
+ TRAIN_DATA_FILES="llf_ti2ti_27k_tokenized.pt"
+ # You can replace it with a new path
+ OUTPUT_DIR="../outputs/sft_tf_cham_1011_27k_ti2ti"
+ # For wandb online logging
+ export WANDB_API_KEY="7e2dcc0c310ebcb7cdcafd5e9320d6be55cf1a33"
+ # Source the setup script
+ source ./setup.sh
+
+ # sleep 30m
+ # Execute deepspeed command
+ deepspeed \
+ --master_port ${MASTER_PORT} \
+ --module align_anything.trainers.text_image_to_text_image.sft \
+ --model_name_or_path ${MODEL_NAME_OR_PATH} \
+ --train_datasets ${TRAIN_DATASETS} \
+ --train_data_files ${TRAIN_DATA_FILES} \
+ --output_dir ${OUTPUT_DIR} \
+ --train_template AA_textfeedback \
+ --train_split train \
+ --per_device_train_batch_size 4 \
+ --per_device_eval_batch_size 4 \
+ --gradient_accumulation_steps 2 \
+ --save_interval 400 \
+ --learning_rate 1e-6 \
+ --epochs 3 \
+ --lr_scheduler_type cosine
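Combined with the `gpu_count: 8` recorded later in wandb-metadata.json, these launch flags imply an effective global batch size of 64 samples per optimizer step; a quick sanity check:

```python
per_device_train_batch_size = 4  # --per_device_train_batch_size
gradient_accumulation_steps = 2  # --gradient_accumulation_steps
num_gpus = 8                     # gpu_count from wandb-metadata.json

print(per_device_train_batch_size * gradient_accumulation_steps * num_gpus)  # 64
```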
special_tokens_map.json ADDED
@@ -0,0 +1,37 @@
+ {
+ "bos_token": {
+ "content": "<s>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "eos_token": {
+ "content": "</s>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "pad_token": {
+ "content": "<pad>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "sep_token": {
+ "content": "<reserved08706>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "unk_token": {
+ "content": "<unk>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ }
+ }
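A quick way to verify these mappings after downloading the repo — a sketch assuming a local clone as the working directory and the `transformers` package:

```python
from transformers import AutoTokenizer

tok = AutoTokenizer.from_pretrained(".")  # local clone of this repo
print(tok.bos_token, tok.eos_token, tok.pad_token, tok.unk_token)  # <s> </s> <pad> <unk>
print(tok.sep_token)                      # <reserved08706>
```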
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
The diff for this file is too large to render. See raw diff
 
wandb/debug-internal.log ADDED
@@ -0,0 +1,25 @@
+ {"time":"2024-10-11T20:27:29.314392342Z","level":"INFO","msg":"using version","core version":"0.18.3"}
+ {"time":"2024-10-11T20:27:29.314422946Z","level":"INFO","msg":"created symlink","path":"../outputs/sft_tf_cham_1011_27k_ti2ti/wandb/run-20241011_202729-hvajn2pl/logs/debug-core.log"}
+ {"time":"2024-10-11T20:27:31.315941153Z","level":"ERROR","msg":"dialing: google: could not find default credentials. See https://cloud.google.com/docs/authentication/external/set-up-adc for more information"}
+ {"time":"2024-10-11T20:27:31.343923384Z","level":"INFO","msg":"created new stream","id":"hvajn2pl"}
+ {"time":"2024-10-11T20:27:31.344015309Z","level":"INFO","msg":"stream: started","id":"hvajn2pl"}
+ {"time":"2024-10-11T20:27:31.344030708Z","level":"INFO","msg":"writer: Do: started","stream_id":{"value":"hvajn2pl"}}
+ {"time":"2024-10-11T20:27:31.3440543Z","level":"INFO","msg":"handler: started","stream_id":{"value":"hvajn2pl"}}
+ {"time":"2024-10-11T20:27:31.344075012Z","level":"INFO","msg":"sender: started","stream_id":{"value":"hvajn2pl"}}
+ {"time":"2024-10-11T20:27:32.111921422Z","level":"INFO","msg":"wandb-core","!BADKEY":null}
+ {"time":"2024-10-11T20:27:32.115787579Z","level":"INFO","msg":"Starting system monitor"}
+ {"time":"2024-10-11T20:37:17.77464423Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded"}
+ {"time":"2024-10-11T21:02:18.014643124Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
+ {"time":"2024-10-11T21:48:05.805217442Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/htlou/align-anything/hvajn2pl/file_stream"}
+ {"time":"2024-10-11T22:52:56.823831464Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/htlou/align-anything/hvajn2pl/file_stream"}
+ {"time":"2024-10-12T04:14:39.094813754Z","level":"INFO","msg":"Stopping system monitor"}
+ {"time":"2024-10-12T04:14:39.115766983Z","level":"INFO","msg":"Stopped system monitor"}
+ {"time":"2024-10-12T04:14:39.625373664Z","level":"WARN","msg":"No program path found, not creating job artifact. See https://docs.wandb.ai/guides/launch/create-job"}
+ {"time":"2024-10-12T04:14:39.625411287Z","level":"INFO","msg":"sender: sendDefer: no job artifact to save"}
+ {"time":"2024-10-12T04:14:44.099325031Z","level":"ERROR","msg":"monitor: gpu: timeout waiting for process to exit"}
+ {"time":"2024-10-12T04:15:06.376494069Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
+ {"time":"2024-10-12T04:15:08.082335235Z","level":"INFO","msg":"stream: closing","id":"hvajn2pl"}
+ {"time":"2024-10-12T04:15:08.082392093Z","level":"INFO","msg":"handler: closed","stream_id":{"value":"hvajn2pl"}}
+ {"time":"2024-10-12T04:15:08.082456448Z","level":"INFO","msg":"writer: Close: closed","stream_id":{"value":"hvajn2pl"}}
+ {"time":"2024-10-12T04:15:08.082510885Z","level":"INFO","msg":"sender: closed","stream_id":{"value":"hvajn2pl"}}
+ {"time":"2024-10-12T04:15:08.084798858Z","level":"INFO","msg":"stream: closed","id":"hvajn2pl"}
wandb/debug.log ADDED
@@ -0,0 +1,33 @@
+ 2024-10-11 20:27:29,297 INFO MainThread:320740 [wandb_setup.py:_flush():79] Current SDK version is 0.18.3
+ 2024-10-11 20:27:29,297 INFO MainThread:320740 [wandb_setup.py:_flush():79] Configure stats pid to 320740
+ 2024-10-11 20:27:29,297 INFO MainThread:320740 [wandb_setup.py:_flush():79] Loading settings from /home/align-anything/.config/wandb/settings
+ 2024-10-11 20:27:29,297 INFO MainThread:320740 [wandb_setup.py:_flush():79] Loading settings from /data/align-anything/hantao/align-anything/scripts/wandb/settings
+ 2024-10-11 20:27:29,297 INFO MainThread:320740 [wandb_setup.py:_flush():79] Loading settings from environment variables: {'api_key': '***REDACTED***'}
+ 2024-10-11 20:27:29,297 INFO MainThread:320740 [wandb_setup.py:_flush():79] Applying setup settings: {'mode': None, '_disable_service': None}
+ 2024-10-11 20:27:29,297 WARNING MainThread:320740 [wandb_setup.py:_flush():79] Could not find program at -m align_anything.trainers.text_image_to_text_image.sft
+ 2024-10-11 20:27:29,297 INFO MainThread:320740 [wandb_setup.py:_flush():79] Inferring run settings from compute environment: {'program_relpath': None, 'program': '-m align_anything.trainers.text_image_to_text_image.sft'}
+ 2024-10-11 20:27:29,297 INFO MainThread:320740 [wandb_setup.py:_flush():79] Applying login settings: {}
+ 2024-10-11 20:27:29,298 INFO MainThread:320740 [wandb_init.py:_log_setup():532] Logging user logs to ../outputs/sft_tf_cham_1011_27k_ti2ti/wandb/run-20241011_202729-hvajn2pl/logs/debug.log
+ 2024-10-11 20:27:29,298 INFO MainThread:320740 [wandb_init.py:_log_setup():533] Logging internal logs to ../outputs/sft_tf_cham_1011_27k_ti2ti/wandb/run-20241011_202729-hvajn2pl/logs/debug-internal.log
+ 2024-10-11 20:27:29,298 INFO MainThread:320740 [wandb_init.py:init():617] calling init triggers
+ 2024-10-11 20:27:29,298 INFO MainThread:320740 [wandb_init.py:init():624] wandb.init called with sweep_config: {}
+ config: {'train_cfgs': {'ds_cfgs': 'ds_z3_config.json', 'epochs': 3.0, 'seed': 42, 'per_device_train_batch_size': 4.0, 'per_device_eval_batch_size': 4.0, 'gradient_accumulation_steps': 2.0, 'gradient_checkpointing': True, 'learning_rate': 1e-06, 'lr_scheduler_type': 'cosine', 'lr_warmup_ratio': 0.03, 'weight_decay': 0.0, 'adam_betas': [0.9, 0.95], 'adam_epsilon': 1e-08, 'bf16': True, 'fp16': False, 'eval_strategy': 'steps', 'eval_interval': 1000, 'freeze_language_model': False, 'max_grad_norm': 1.0}, 'data_cfgs': {'train_datasets': '/data/align-anything/hantao/align-anything/projects/text_image_to_text_image/outputs', 'train_template': 'AA_textfeedback', 'train_size': None, 'train_split': 'train', 'train_subset': None, 'train_data_files': 'llf_ti2ti_27k_tokenized.pt', 'train_optional_args': [], 'eval_datasets': None, 'eval_template': None, 'eval_size': None, 'eval_split': None, 'eval_subset': None, 'eval_data_files': None, 'eval_optional_args': []}, 'logger_cfgs': {'log_type': 'wandb', 'log_project': 'align-anything', 'log_run_name': 'sft', 'output_dir': '../outputs/sft_tf_cham_1011_27k_ti2ti', 'cache_dir': None, 'save_interval': 400.0}, 'model_cfgs': {'model_name_or_path': '/data/align-anything/hantao/models/0916_ti_to_ti_sft/', 'trust_remote_code': True, 'model_max_length': 4096}, 'special_tokens': None}
+ 2024-10-11 20:27:29,298 INFO MainThread:320740 [wandb_init.py:init():667] starting backend
+ 2024-10-11 20:27:29,298 INFO MainThread:320740 [wandb_init.py:init():671] sending inform_init request
+ 2024-10-11 20:27:29,308 INFO MainThread:320740 [backend.py:_multiprocessing_setup():104] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
+ 2024-10-11 20:27:29,308 INFO MainThread:320740 [wandb_init.py:init():684] backend started and connected
+ 2024-10-11 20:27:29,318 INFO MainThread:320740 [wandb_init.py:init():779] updated telemetry
+ 2024-10-11 20:27:29,397 INFO MainThread:320740 [wandb_init.py:init():812] communicating run to backend with 90.0 second timeout
+ 2024-10-11 20:27:32,099 INFO MainThread:320740 [wandb_init.py:init():863] starting run threads in backend
+ 2024-10-11 20:27:32,709 INFO MainThread:320740 [wandb_run.py:_console_start():2465] atexit reg
+ 2024-10-11 20:27:32,710 INFO MainThread:320740 [wandb_run.py:_redirect():2313] redirect: wrap_raw
+ 2024-10-11 20:27:32,710 INFO MainThread:320740 [wandb_run.py:_redirect():2378] Wrapping output streams.
+ 2024-10-11 20:27:32,710 INFO MainThread:320740 [wandb_run.py:_redirect():2403] Redirects installed.
+ 2024-10-11 20:27:32,722 INFO MainThread:320740 [wandb_init.py:init():907] run started, returning control to user process
+ 2024-10-12 04:14:39,088 INFO MainThread:320740 [wandb_run.py:_finish():2164] finishing run htlou/align-anything/hvajn2pl
+ 2024-10-12 04:14:39,090 INFO MainThread:320740 [wandb_run.py:_atexit_cleanup():2428] got exitcode: 0
+ 2024-10-12 04:14:39,093 INFO MainThread:320740 [wandb_run.py:_restore():2410] restore
+ 2024-10-12 04:14:39,093 INFO MainThread:320740 [wandb_run.py:_restore():2416] restore done
+ 2024-10-12 04:15:08,063 INFO MainThread:320740 [wandb_run.py:_footer_history_summary_info():4049] rendering history
+ 2024-10-12 04:15:08,065 INFO MainThread:320740 [wandb_run.py:_footer_history_summary_info():4081] rendering summary
+ 2024-10-12 04:15:08,077 INFO MainThread:320740 [wandb_run.py:_footer_sync_info():4008] logging synced files
wandb/run-20241011_202729-hvajn2pl/files/config.yaml ADDED
@@ -0,0 +1,96 @@
+ _wandb:
+ value:
+ cli_version: 0.18.3
+ m: []
+ python_version: 3.11.0
+ t:
+ "1":
+ - 1
+ - 11
+ - 41
+ - 49
+ - 51
+ - 55
+ - 71
+ - 83
+ - 98
+ - 105
+ "2":
+ - 1
+ - 11
+ - 41
+ - 49
+ - 51
+ - 55
+ - 71
+ - 83
+ - 98
+ - 105
+ "3":
+ - 2
+ - 13
+ - 16
+ - 23
+ - 55
+ - 61
+ "4": 3.11.0
+ "5": 0.18.3
+ "6": 4.46.0.dev0
+ "8":
+ - 5
+ "12": 0.18.3
+ "13": linux-x86_64
+ data_cfgs:
+ value:
+ eval_data_files: null
+ eval_datasets: null
+ eval_optional_args: []
+ eval_size: null
+ eval_split: null
+ eval_subset: null
+ eval_template: null
+ train_data_files: llf_ti2ti_27k_tokenized.pt
+ train_datasets: /data/align-anything/hantao/align-anything/projects/text_image_to_text_image/outputs
+ train_optional_args: []
+ train_size: null
+ train_split: train
+ train_subset: null
+ train_template: AA_textfeedback
+ logger_cfgs:
+ value:
+ cache_dir: null
+ log_project: align-anything
+ log_run_name: sft
+ log_type: wandb
+ output_dir: ../outputs/sft_tf_cham_1011_27k_ti2ti
+ save_interval: 400
+ model_cfgs:
+ value:
+ model_max_length: 4096
+ model_name_or_path: /data/align-anything/hantao/models/0916_ti_to_ti_sft/
+ trust_remote_code: true
+ special_tokens:
+ value: null
+ train_cfgs:
+ value:
+ adam_betas:
+ - 0.9
+ - 0.95
+ adam_epsilon: 1e-08
+ bf16: true
+ ds_cfgs: ds_z3_config.json
+ epochs: 3
+ eval_interval: 1000
+ eval_strategy: steps
+ fp16: false
+ freeze_language_model: false
+ gradient_accumulation_steps: 2
+ gradient_checkpointing: true
+ learning_rate: 1e-06
+ lr_scheduler_type: cosine
+ lr_warmup_ratio: 0.03
+ max_grad_norm: 1
+ per_device_eval_batch_size: 4
+ per_device_train_batch_size: 4
+ seed: 42
+ weight_decay: 0
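wandb nests every captured config section under a `value` key, so reading this file back takes one extra level of indirection. A sketch using PyYAML (pinned in requirements.txt below):

```python
import yaml

with open("wandb/run-20241011_202729-hvajn2pl/files/config.yaml") as f:
    cfg = yaml.safe_load(f)

# Note the extra "value" level that wandb inserts around each section.
print(cfg["train_cfgs"]["value"]["lr_scheduler_type"])  # cosine
print(cfg["data_cfgs"]["value"]["train_template"])      # AA_textfeedback
```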
wandb/run-20241011_202729-hvajn2pl/files/output.log ADDED
The diff for this file is too large to render. See raw diff
 
wandb/run-20241011_202729-hvajn2pl/files/requirements.txt ADDED
@@ -0,0 +1,234 @@
+ align-anything==0.0.1.dev0
+ pluggy==1.5.0
+ yt-dlp==2024.8.6
+ referencing==0.35.1
+ nvitop==1.3.2
+ shellingham==1.5.4
+ pydantic==2.9.2
+ grpcio==1.66.2
+ packaging==24.1
+ fastapi==0.115.0
+ matplotlib==3.9.2
+ typing_extensions==4.12.2
+ pycountry==24.6.1
+ rpds-py==0.20.0
+ prometheus_client==0.21.0
+ vllm==0.6.2
+ pycryptodomex==3.21.0
+ MarkupSafe==2.1.5
+ prometheus-fastapi-instrumentator==7.0.0
+ peft==0.13.1
+ Brotli==1.1.0
+ audioread==3.0.1
+ numpy==1.26.4
+ nest-asyncio==1.6.0
+ nvidia-nvtx-cu12==12.1.105
+ kiwisolver==1.4.7
+ librosa==0.10.2.post1
+ msgspec==0.18.6
+ lark==1.2.2
+ aiosignal==1.3.1
+ args==0.1.0
+ attrs==24.2.0
+ regex==2024.9.11
+ typer==0.12.5
+ nvidia-ml-py==12.535.161
+ httptools==0.6.1
+ wheel==0.44.0
+ pyairports==2.1.1
+ threadpoolctl==3.5.0
+ nvidia-curand-cu12==10.3.2.106
+ yarl==1.14.0
+ rich==13.9.2
+ nvidia-nccl-cu12==2.20.5
+ click==8.1.7
+ importlib_metadata==8.5.0
+ fsspec==2024.6.1
+ outlines_core==0.1.0
+ h11==0.14.0
+ uvloop==0.20.0
+ deepspeed==0.15.2
+ absl-py==2.1.0
+ setproctitle==1.3.3
+ Werkzeug==3.0.4
+ nvidia-cuda-cupti-cu12==12.1.105
+ fairscale==0.4.13
+ wandb==0.18.3
+ protobuf==3.20.3
+ pytz==2024.2
+ sentry-sdk==2.16.0
+ opencv-python==4.6.0.66
+ cfgv==3.4.0
+ diskcache==5.6.3
+ psutil==6.0.0
+ frechet-audio-distance==0.1.2
+ zipp==3.20.2
+ pytorch-fid==0.3.0
+ nodeenv==1.9.1
+ align-anything==0.0.1.dev0
+ joblib==1.4.2
+ jiter==0.6.1
+ interegular==0.3.3
+ jsonschema==4.23.0
+ numba==0.60.0
+ nvidia-cufft-cu12==11.0.2.54
+ idna==3.10
+ sympy==1.13.3
+ proglog==0.1.10
+ httpx==0.27.2
+ gradio==5.0.1
+ lazy_loader==0.4
+ pip==24.2
+ aiohappyeyeballs==2.4.3
+ aiofiles==23.2.1
+ contourpy==1.3.0
+ mutagen==1.47.0
+ watchfiles==0.24.0
+ imageio-ffmpeg==0.5.1
+ termcolor==2.5.0
+ mmsg==0.1.dev20+g585c63a
+ imageio==2.35.1
+ gguf==0.10.0
+ hpsv2==1.2.0
+ pydantic_core==2.23.4
+ ruff==0.6.9
+ markdown-it-py==3.0.0
+ torchlibrosa==0.1.0
+ cycler==0.12.1
+ tzdata==2024.2
+ httpcore==1.0.6
+ Markdown==3.7
+ platformdirs==4.3.6
+ term-image==0.7.2
+ transformers==4.46.0.dev0
+ GitPython==3.1.43
+ outlines==0.1.1.dev4+ga2fd35c
+ virtualenv==20.26.6
+ propcache==0.2.0
+ nvidia-cusparse-cu12==12.1.0.106
+ identify==2.6.1
+ webdataset==0.2.100
+ datasets==3.0.1
+ accelerate==1.0.0
+ multiprocess==0.70.16
+ wcwidth==0.2.13
+ pre_commit==4.0.1
+ tomlkit==0.12.0
+ torchvision==0.19.0
+ websockets==12.0
+ pytest==7.2.0
+ timm==0.6.13
+ six==1.16.0
+ aiohttp==3.10.9
+ tiktoken==0.7.0
+ ffmpy==0.4.0
+ urllib3==2.2.3
+ torchaudio==2.4.0
+ tensorboard==2.18.0
+ scikit-learn==1.5.2
+ frozenlist==1.4.1
+ multidict==6.1.0
+ PyYAML==6.0.2
+ xxhash==3.5.0
+ torch==2.4.0
+ sniffio==1.3.1
+ soundfile==0.12.1
+ mdurl==0.1.2
+ python-multipart==0.0.12
+ tensorboard-data-server==0.7.2
+ airportsdata==20241001
+ nvidia-cudnn-cu12==9.1.0.70
+ setuptools-scm==8.1.0
+ orjson==3.10.7
+ tqdm==4.66.5
+ ninja==1.11.1.1
+ image-reward==1.5
+ clint==0.5.1
+ setuptools==75.1.0
+ shortuuid==1.0.13
+ cffi==1.17.1
+ docker-pycreds==0.4.0
+ distro==1.9.0
+ msgpack==1.1.0
+ sentencepiece==0.2.0
+ jsonschema-specifications==2024.10.1
+ anyio==4.6.0
+ optree==0.13.0
+ xformers==0.0.27.post2
+ pooch==1.8.2
+ pyzmq==26.2.0
+ Pygments==2.18.0
+ partial-json-parser==0.2.1.1.post4
+ einops==0.8.0
+ nvidia-cublas-cu12==12.1.3.1
+ gitdb==4.0.11
+ cachetools==5.5.0
+ decorator==4.4.2
+ uvicorn==0.31.1
+ clip==0.2.0
+ ftfy==6.2.3
+ mistral_common==1.4.4
+ safetensors==0.4.5
+ charset-normalizer==3.4.0
+ soxr==0.5.0.post1
+ requests==2.32.3
+ pyparsing==3.1.4
+ smmap==5.0.1
+ annotated-types==0.7.0
+ nvidia-cuda-nvrtc-cu12==12.1.105
+ cloudpickle==3.0.0
+ openai==1.51.2
+ ray==2.37.0
+ nvidia-nvjitlink-cu12==12.6.77
+ resampy==0.4.3
+ triton==3.0.0
+ huggingface-hub==0.25.2
+ pydub==0.25.1
+ semantic-version==2.10.0
+ distlib==0.3.9
+ networkx==3.3
+ pandas==2.2.3
+ fonttools==4.54.1
+ lm-format-enforcer==0.10.6
+ python-dotenv==1.0.1
+ Jinja2==3.1.4
+ nvidia-cuda-runtime-cu12==12.1.105
+ iniconfig==2.0.0
+ moviepy==1.0.3
+ pyarrow==17.0.0
+ filelock==3.16.1
+ py-cpuinfo==9.0.0
+ python-dateutil==2.9.0.post0
+ certifi==2024.8.30
+ braceexpand==0.1.7
+ dill==0.3.8
+ bitsandbytes==0.44.1
+ starlette==0.38.6
+ diffusers==0.30.3
+ pillow==10.4.0
+ scipy==1.14.1
+ pytest-split==0.8.0
+ nvidia-cusolver-cu12==11.4.5.107
+ llvmlite==0.43.0
+ gradio_client==1.4.0
+ mpmath==1.3.0
+ pycparser==2.22
+ hjson==3.1.0
+ tokenizers==0.20.1
+ jaraco.context==5.3.0
+ typeguard==4.3.0
+ inflect==7.3.1
+ importlib_metadata==8.0.0
+ jaraco.collections==5.1.0
+ backports.tarfile==1.2.0
+ platformdirs==4.2.2
+ jaraco.functools==4.0.1
+ zipp==3.19.2
+ autocommand==2.2.2
+ typing_extensions==4.12.2
+ jaraco.text==3.12.1
+ importlib_resources==6.4.0
+ more-itertools==10.3.0
+ wheel==0.43.0
+ packaging==24.1
+ tomli==2.0.1
wandb/run-20241011_202729-hvajn2pl/files/wandb-metadata.json ADDED
@@ -0,0 +1,112 @@
+ {
+ "os": "Linux-5.4.0-144-generic-x86_64-with-glibc2.31",
+ "python": "3.11.0",
+ "startedAt": "2024-10-11T20:27:29.308691Z",
+ "args": [
+ "--local_rank=0",
+ "--model_name_or_path",
+ "/data/align-anything/hantao/models/0916_ti_to_ti_sft/",
+ "--train_datasets",
+ "/data/align-anything/hantao/align-anything/projects/text_image_to_text_image/outputs",
+ "--train_data_files",
+ "llf_ti2ti_27k_tokenized.pt",
+ "--output_dir",
+ "../outputs/sft_tf_cham_1011_27k_ti2ti",
+ "--train_template",
+ "AA_textfeedback",
+ "--train_split",
+ "train",
+ "--per_device_train_batch_size",
+ "4",
+ "--per_device_eval_batch_size",
+ "4",
+ "--gradient_accumulation_steps",
+ "2",
+ "--save_interval",
+ "400",
+ "--learning_rate",
+ "1e-6",
+ "--epochs",
+ "3",
+ "--lr_scheduler_type",
+ "cosine"
+ ],
+ "program": "-m align_anything.trainers.text_image_to_text_image.sft",
+ "git": {
+ "remote": "https://github.com/PKU-Alignment/align-anything.git",
+ "commit": "6fde660afc9985323f147930eedf188a5699adc7"
+ },
+ "email": "[email protected]",
+ "root": "../outputs/sft_tf_cham_1011_27k_ti2ti",
+ "host": "lyg0196",
+ "username": "align-anything",
+ "executable": "/data/align-anything/miniconda3/envs/hantao_stable/bin/python",
+ "cpu_count": 64,
+ "cpu_count_logical": 128,
+ "gpu": "[NVIDIA A100-SXM4-80GB, NVIDIA A100-SXM4-80GB, NVIDIA A100-SXM4-80GB, NVIDIA A100-SXM4-80GB, NVIDIA A100-SXM4-80GB, NVIDIA A100-SXM4-80GB, NVIDIA A100-SXM4-80GB, NVIDIA A100-SXM4-80GB]",
+ "gpu_count": 8,
+ "disk": {
+ "/": {
+ "total": "940744544256",
+ "used": "49302532096"
+ }
+ },
+ "memory": {
+ "total": "540660944896"
+ },
+ "cpu": {
+ "count": 64,
+ "countLogical": 128
+ },
+ "gpu_nvidia": [
+ {
+ "name": "NVIDIA A100-SXM4-80GB",
+ "memoryTotal": "85899345920",
+ "cudaCores": 6912,
+ "architecture": "Ampere"
+ },
+ {
+ "name": "NVIDIA A100-SXM4-80GB",
+ "memoryTotal": "85899345920",
+ "cudaCores": 6912,
+ "architecture": "Ampere"
+ },
+ {
+ "name": "NVIDIA A100-SXM4-80GB",
+ "memoryTotal": "85899345920",
+ "cudaCores": 6912,
+ "architecture": "Ampere"
+ },
+ {
+ "name": "NVIDIA A100-SXM4-80GB",
+ "memoryTotal": "85899345920",
+ "cudaCores": 6912,
+ "architecture": "Ampere"
+ },
+ {
+ "name": "NVIDIA A100-SXM4-80GB",
+ "memoryTotal": "85899345920",
+ "cudaCores": 6912,
+ "architecture": "Ampere"
+ },
+ {
+ "name": "NVIDIA A100-SXM4-80GB",
+ "memoryTotal": "85899345920",
+ "cudaCores": 6912,
+ "architecture": "Ampere"
+ },
+ {
+ "name": "NVIDIA A100-SXM4-80GB",
+ "memoryTotal": "85899345920",
+ "cudaCores": 6912,
+ "architecture": "Ampere"
+ },
+ {
+ "name": "NVIDIA A100-SXM4-80GB",
+ "memoryTotal": "85899345920",
+ "cudaCores": 6912,
+ "architecture": "Ampere"
+ }
+ ],
+ "cudaVersion": "12.4"
+ }
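The `memoryTotal` strings above are bytes; converting them confirms the 80 GB in the device name:

```python
memory_total_bytes = 85_899_345_920
print(memory_total_bytes / 2**30)  # 80.0 GiB per NVIDIA A100-SXM4-80GB
```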
wandb/run-20241011_202729-hvajn2pl/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
+ {"_wandb":{"runtime":28029},"train/step":4983,"train/loss":0.3495679199695587,"train/lr":1.6866608503751657e-12,"train/epoch":3,"_timestamp":1.728706315447278e+09,"_runtime":28029.786090375,"_step":4983}
wandb/run-20241011_202729-hvajn2pl/logs/debug-internal.log ADDED
@@ -0,0 +1,25 @@
+ {"time":"2024-10-11T20:27:29.314392342Z","level":"INFO","msg":"using version","core version":"0.18.3"}
+ {"time":"2024-10-11T20:27:29.314422946Z","level":"INFO","msg":"created symlink","path":"../outputs/sft_tf_cham_1011_27k_ti2ti/wandb/run-20241011_202729-hvajn2pl/logs/debug-core.log"}
+ {"time":"2024-10-11T20:27:31.315941153Z","level":"ERROR","msg":"dialing: google: could not find default credentials. See https://cloud.google.com/docs/authentication/external/set-up-adc for more information"}
+ {"time":"2024-10-11T20:27:31.343923384Z","level":"INFO","msg":"created new stream","id":"hvajn2pl"}
+ {"time":"2024-10-11T20:27:31.344015309Z","level":"INFO","msg":"stream: started","id":"hvajn2pl"}
+ {"time":"2024-10-11T20:27:31.344030708Z","level":"INFO","msg":"writer: Do: started","stream_id":{"value":"hvajn2pl"}}
+ {"time":"2024-10-11T20:27:31.3440543Z","level":"INFO","msg":"handler: started","stream_id":{"value":"hvajn2pl"}}
+ {"time":"2024-10-11T20:27:31.344075012Z","level":"INFO","msg":"sender: started","stream_id":{"value":"hvajn2pl"}}
+ {"time":"2024-10-11T20:27:32.111921422Z","level":"INFO","msg":"wandb-core","!BADKEY":null}
+ {"time":"2024-10-11T20:27:32.115787579Z","level":"INFO","msg":"Starting system monitor"}
+ {"time":"2024-10-11T20:37:17.77464423Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded"}
+ {"time":"2024-10-11T21:02:18.014643124Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
+ {"time":"2024-10-11T21:48:05.805217442Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/htlou/align-anything/hvajn2pl/file_stream"}
+ {"time":"2024-10-11T22:52:56.823831464Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/htlou/align-anything/hvajn2pl/file_stream"}
+ {"time":"2024-10-12T04:14:39.094813754Z","level":"INFO","msg":"Stopping system monitor"}
+ {"time":"2024-10-12T04:14:39.115766983Z","level":"INFO","msg":"Stopped system monitor"}
+ {"time":"2024-10-12T04:14:39.625373664Z","level":"WARN","msg":"No program path found, not creating job artifact. See https://docs.wandb.ai/guides/launch/create-job"}
+ {"time":"2024-10-12T04:14:39.625411287Z","level":"INFO","msg":"sender: sendDefer: no job artifact to save"}
+ {"time":"2024-10-12T04:14:44.099325031Z","level":"ERROR","msg":"monitor: gpu: timeout waiting for process to exit"}
+ {"time":"2024-10-12T04:15:06.376494069Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
+ {"time":"2024-10-12T04:15:08.082335235Z","level":"INFO","msg":"stream: closing","id":"hvajn2pl"}
+ {"time":"2024-10-12T04:15:08.082392093Z","level":"INFO","msg":"handler: closed","stream_id":{"value":"hvajn2pl"}}
+ {"time":"2024-10-12T04:15:08.082456448Z","level":"INFO","msg":"writer: Close: closed","stream_id":{"value":"hvajn2pl"}}
+ {"time":"2024-10-12T04:15:08.082510885Z","level":"INFO","msg":"sender: closed","stream_id":{"value":"hvajn2pl"}}
+ {"time":"2024-10-12T04:15:08.084798858Z","level":"INFO","msg":"stream: closed","id":"hvajn2pl"}
wandb/run-20241011_202729-hvajn2pl/logs/debug.log ADDED
@@ -0,0 +1,33 @@
+ 2024-10-11 20:27:29,297 INFO MainThread:320740 [wandb_setup.py:_flush():79] Current SDK version is 0.18.3
+ 2024-10-11 20:27:29,297 INFO MainThread:320740 [wandb_setup.py:_flush():79] Configure stats pid to 320740
+ 2024-10-11 20:27:29,297 INFO MainThread:320740 [wandb_setup.py:_flush():79] Loading settings from /home/align-anything/.config/wandb/settings
+ 2024-10-11 20:27:29,297 INFO MainThread:320740 [wandb_setup.py:_flush():79] Loading settings from /data/align-anything/hantao/align-anything/scripts/wandb/settings
+ 2024-10-11 20:27:29,297 INFO MainThread:320740 [wandb_setup.py:_flush():79] Loading settings from environment variables: {'api_key': '***REDACTED***'}
+ 2024-10-11 20:27:29,297 INFO MainThread:320740 [wandb_setup.py:_flush():79] Applying setup settings: {'mode': None, '_disable_service': None}
+ 2024-10-11 20:27:29,297 WARNING MainThread:320740 [wandb_setup.py:_flush():79] Could not find program at -m align_anything.trainers.text_image_to_text_image.sft
+ 2024-10-11 20:27:29,297 INFO MainThread:320740 [wandb_setup.py:_flush():79] Inferring run settings from compute environment: {'program_relpath': None, 'program': '-m align_anything.trainers.text_image_to_text_image.sft'}
+ 2024-10-11 20:27:29,297 INFO MainThread:320740 [wandb_setup.py:_flush():79] Applying login settings: {}
+ 2024-10-11 20:27:29,298 INFO MainThread:320740 [wandb_init.py:_log_setup():532] Logging user logs to ../outputs/sft_tf_cham_1011_27k_ti2ti/wandb/run-20241011_202729-hvajn2pl/logs/debug.log
+ 2024-10-11 20:27:29,298 INFO MainThread:320740 [wandb_init.py:_log_setup():533] Logging internal logs to ../outputs/sft_tf_cham_1011_27k_ti2ti/wandb/run-20241011_202729-hvajn2pl/logs/debug-internal.log
+ 2024-10-11 20:27:29,298 INFO MainThread:320740 [wandb_init.py:init():617] calling init triggers
+ 2024-10-11 20:27:29,298 INFO MainThread:320740 [wandb_init.py:init():624] wandb.init called with sweep_config: {}
+ config: {'train_cfgs': {'ds_cfgs': 'ds_z3_config.json', 'epochs': 3.0, 'seed': 42, 'per_device_train_batch_size': 4.0, 'per_device_eval_batch_size': 4.0, 'gradient_accumulation_steps': 2.0, 'gradient_checkpointing': True, 'learning_rate': 1e-06, 'lr_scheduler_type': 'cosine', 'lr_warmup_ratio': 0.03, 'weight_decay': 0.0, 'adam_betas': [0.9, 0.95], 'adam_epsilon': 1e-08, 'bf16': True, 'fp16': False, 'eval_strategy': 'steps', 'eval_interval': 1000, 'freeze_language_model': False, 'max_grad_norm': 1.0}, 'data_cfgs': {'train_datasets': '/data/align-anything/hantao/align-anything/projects/text_image_to_text_image/outputs', 'train_template': 'AA_textfeedback', 'train_size': None, 'train_split': 'train', 'train_subset': None, 'train_data_files': 'llf_ti2ti_27k_tokenized.pt', 'train_optional_args': [], 'eval_datasets': None, 'eval_template': None, 'eval_size': None, 'eval_split': None, 'eval_subset': None, 'eval_data_files': None, 'eval_optional_args': []}, 'logger_cfgs': {'log_type': 'wandb', 'log_project': 'align-anything', 'log_run_name': 'sft', 'output_dir': '../outputs/sft_tf_cham_1011_27k_ti2ti', 'cache_dir': None, 'save_interval': 400.0}, 'model_cfgs': {'model_name_or_path': '/data/align-anything/hantao/models/0916_ti_to_ti_sft/', 'trust_remote_code': True, 'model_max_length': 4096}, 'special_tokens': None}
+ 2024-10-11 20:27:29,298 INFO MainThread:320740 [wandb_init.py:init():667] starting backend
+ 2024-10-11 20:27:29,298 INFO MainThread:320740 [wandb_init.py:init():671] sending inform_init request
+ 2024-10-11 20:27:29,308 INFO MainThread:320740 [backend.py:_multiprocessing_setup():104] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
+ 2024-10-11 20:27:29,308 INFO MainThread:320740 [wandb_init.py:init():684] backend started and connected
+ 2024-10-11 20:27:29,318 INFO MainThread:320740 [wandb_init.py:init():779] updated telemetry
+ 2024-10-11 20:27:29,397 INFO MainThread:320740 [wandb_init.py:init():812] communicating run to backend with 90.0 second timeout
+ 2024-10-11 20:27:32,099 INFO MainThread:320740 [wandb_init.py:init():863] starting run threads in backend
+ 2024-10-11 20:27:32,709 INFO MainThread:320740 [wandb_run.py:_console_start():2465] atexit reg
+ 2024-10-11 20:27:32,710 INFO MainThread:320740 [wandb_run.py:_redirect():2313] redirect: wrap_raw
+ 2024-10-11 20:27:32,710 INFO MainThread:320740 [wandb_run.py:_redirect():2378] Wrapping output streams.
+ 2024-10-11 20:27:32,710 INFO MainThread:320740 [wandb_run.py:_redirect():2403] Redirects installed.
+ 2024-10-11 20:27:32,722 INFO MainThread:320740 [wandb_init.py:init():907] run started, returning control to user process
+ 2024-10-12 04:14:39,088 INFO MainThread:320740 [wandb_run.py:_finish():2164] finishing run htlou/align-anything/hvajn2pl
+ 2024-10-12 04:14:39,090 INFO MainThread:320740 [wandb_run.py:_atexit_cleanup():2428] got exitcode: 0
+ 2024-10-12 04:14:39,093 INFO MainThread:320740 [wandb_run.py:_restore():2410] restore
+ 2024-10-12 04:14:39,093 INFO MainThread:320740 [wandb_run.py:_restore():2416] restore done
+ 2024-10-12 04:15:08,063 INFO MainThread:320740 [wandb_run.py:_footer_history_summary_info():4049] rendering history
+ 2024-10-12 04:15:08,065 INFO MainThread:320740 [wandb_run.py:_footer_history_summary_info():4081] rendering summary
+ 2024-10-12 04:15:08,077 INFO MainThread:320740 [wandb_run.py:_footer_sync_info():4008] logging synced files
wandb/run-20241011_202729-hvajn2pl/run-hvajn2pl.wandb ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:9158a2c0d338475b6a5747499dd2f57d32151d5602d5f0f12161f9c7374c574a
+ size 30879748