Add files using upload-large-folder tool

Browse files

Files changed (11) hide show

README.md +4 -18
chat_template.jinja +7 -0
config.json +82 -39
generation_config.json +2 -2
model-00001-of-00005.safetensors +2 -2
model-00002-of-00005.safetensors +2 -2
model-00003-of-00005.safetensors +2 -2
model-00004-of-00005.safetensors +2 -2
model-00005-of-00005.safetensors +2 -2
model.safetensors.index.json +448 -483
tokenizer_config.json +4 -4

README.md CHANGED Viewed

@@ -1,29 +1,15 @@
 ---
-base_model: Qwen/Qwen2.5-VL-32B-Instruct
 license: apache-2.0
 language:
 - en
 pipeline_tag: image-text-to-text
 tags:
 - multimodal
 library_name: transformers
 ---
-<div>
-  <p style="margin-bottom: 0; margin-top: 0;">
-   <strong>See <a href="https://huggingface.co/collections/unsloth/qwen25-vl-all-versions-679ca6c784fad5bd976a05a1">our collection</a> for versions of Qwen2.5-VL including 4-bit & dynamic formats.</strong>
-  </p>
-  <div style="display: flex; gap: 5px; align-items: center; ">
-    <a href="https://github.com/unslothai/unsloth/">
-      <img src="https://github.com/unslothai/unsloth/raw/main/images/unsloth%20new%20logo.png" width="133">
-    </a>
-    <a href="https://discord.gg/unsloth">
-      <img src="https://github.com/unslothai/unsloth/raw/main/images/Discord%20button.png" width="173">
-    </a>
-    <a href="https://docs.unsloth.ai/">
-      <img src="https://raw.githubusercontent.com/unslothai/unsloth/refs/heads/main/images/documentation%20green%20button.png" width="143">
-    </a>
-  </div>
-</div>
 # Qwen2.5-VL-32B-Instruct
 <a href="https://chat.qwenlm.ai/" target="_blank" style="margin: 2px;">
@@ -66,7 +52,7 @@ We extend dynamic resolution to the temporal dimension by adopting dynamic FPS s
 We enhance both training and inference speeds by strategically implementing window attention into the ViT. The ViT architecture is further optimized with SwiGLU and RMSNorm, aligning it with the structure of the Qwen2.5 LLM.
-We have three models with 3, 7 and 72 billion parameters. This repo contains the instruction-tuned 32B Qwen2.5-VL model. For more information, visit our [Blog](https://qwenlm.github.io/blog/qwen2.5-vl/) and [GitHub](https://github.com/QwenLM/Qwen2.5-VL).

 ---
+base_model:
+- Qwen/Qwen2.5-VL-32B-Instruct
 license: apache-2.0
 language:
 - en
 pipeline_tag: image-text-to-text
 tags:
 - multimodal
+- unsloth
 library_name: transformers
 ---
 # Qwen2.5-VL-32B-Instruct
 <a href="https://chat.qwenlm.ai/" target="_blank" style="margin: 2px;">
 We enhance both training and inference speeds by strategically implementing window attention into the ViT. The ViT architecture is further optimized with SwiGLU and RMSNorm, aligning it with the structure of the Qwen2.5 LLM.
+We have four models with 3, 7, 32 and 72 billion parameters. This repo contains the instruction-tuned 32B Qwen2.5-VL model. For more information, visit our [Blog](https://qwenlm.github.io/blog/qwen2.5-vl/) and [GitHub](https://github.com/QwenLM/Qwen2.5-VL).

chat_template.jinja ADDED Viewed

	@@ -0,0 +1,7 @@

+{% set image_count = namespace(value=0) %}{% set video_count = namespace(value=0) %}{% for message in messages %}{% if loop.first and message['role'] != 'system' %}<|im_start|>system
+You are a helpful assistant.<|im_end|>
+{% endif %}<|im_start|>{{ message['role'] }}
+{% if message['content'] is string %}{{ message['content'] }}<|im_end|>
+{% else %}{% for content in message['content'] %}{% if content['type'] == 'image' or 'image' in content or 'image_url' in content %}{% set image_count.value = image_count.value + 1 %}{% if add_vision_id %}Picture {{ image_count.value }}: {% endif %}<|vision_start|><|image_pad|><|vision_end|>{% elif content['type'] == 'video' or 'video' in content %}{% set video_count.value = video_count.value + 1 %}{% if add_vision_id %}Video {{ video_count.value }}: {% endif %}<|vision_start|><|video_pad|><|vision_end|>{% elif 'text' in content %}{{ content['text'] }}{% endif %}{% endfor %}<|im_end|>
+{% endif %}{% endfor %}{% if add_generation_prompt %}<|im_start|>assistant
+{% endif %}

config.json CHANGED Viewed

@@ -9,7 +9,7 @@
   "image_token_id": 151655,
   "initializer_range": 0.02,
   "intermediate_size": 27648,
-  "max_position_embeddings": 32768,
   "max_window_layers": 64,
   "model_type": "qwen2_5_vl",
   "num_attention_heads": 40,
@@ -31,75 +31,78 @@
       "merger",
       "modality_projection",
       "model.layers.10.mlp",
-      "model.layers.7.mlp",
-      "model.layers.22.mlp",
       "model.layers.15.mlp",
-      "visual.blocks.31.mlp",
       "visual.blocks.27.attn",
       "visual.blocks.28.attn",
       "visual.blocks.31.attn",
       "visual.merger.mlp",
       "visual.blocks.30.mlp",
-      "visual.blocks.29.attn",
-      "visual.blocks.26.attn",
       "visual.blocks.24.attn",
       "visual.blocks.30.attn",
-      "visual.blocks.21.attn",
-      "visual.blocks.25.attn",
       "visual.blocks.22.attn",
-      "visual.blocks.29.mlp",
-      "visual.blocks.19.attn",
       "visual.blocks.20.attn",
       "model.layers.6.mlp",
-      "visual.blocks.18.attn",
       "visual.blocks.26.mlp",
       "visual.blocks.27.mlp",
-      "visual.blocks.20.mlp",
-      "visual.blocks.18.mlp",
       "visual.blocks.19.mlp",
-      "visual.blocks.28.mlp",
       "visual.blocks.23.mlp",
-      "visual.blocks.25.mlp",
       "visual.blocks.23.attn",
       "visual.blocks.22.mlp",
-      "visual.blocks.17.attn",
-      "visual.blocks.12.attn",
-      "visual.blocks.11.attn",
-      "visual.blocks.9.attn",
-      "visual.blocks.21.mlp",
-      "visual.blocks.16.attn",
       "visual.blocks.14.attn",
       "visual.blocks.10.mlp",
-      "visual.blocks.10.attn",
       "visual.blocks.13.attn",
-      "visual.blocks.24.mlp",
-      "visual.blocks.11.mlp",
-      "visual.blocks.9.mlp",
-      "visual.blocks.6.attn",
-      "visual.blocks.5.mlp",
-      "visual.blocks.12.mlp",
       "visual.blocks.4.mlp",
-      "visual.blocks.16.mlp",
       "visual.blocks.8.mlp",
-      "visual.blocks.6.mlp",
       "visual.blocks.2.attn",
-      "visual.blocks.1.mlp",
-      "visual.blocks.7.mlp",
       "visual.blocks.8.attn",
       "visual.blocks.13.mlp",
-      "visual.blocks.3.mlp",
       "visual.blocks.15.mlp",
-      "visual.blocks.2.mlp",
       "visual.blocks.1.attn",
-      "visual.blocks.5.attn",
-      "visual.blocks.0.attn",
       "visual.blocks.15.attn",
-      "visual.blocks.4.attn",
       "visual.blocks.7.attn",
       "visual.blocks.3.attn",
       "visual.blocks.14.mlp",
       "visual.blocks.0.mlp",
-      "visual.blocks.17.mlp"
     ],
     "llm_int8_threshold": 6.0,
     "load_in_4bit": true,
@@ -118,9 +121,48 @@
   },
   "rope_theta": 1000000.0,
   "sliding_window": 32768,
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
-  "transformers_version": "4.50.1",
   "unsloth_fixed": true,
   "use_cache": true,
   "use_sliding_window": false,
@@ -137,6 +179,7 @@
     "hidden_size": 1280,
     "in_channels": 3,
     "in_chans": 3,
     "intermediate_size": 3456,
     "model_type": "qwen2_5_vl",
     "num_heads": 16,

   "image_token_id": 151655,
   "initializer_range": 0.02,
   "intermediate_size": 27648,
+  "max_position_embeddings": 128000,
   "max_window_layers": 64,
   "model_type": "qwen2_5_vl",
   "num_attention_heads": 40,
       "merger",
       "modality_projection",
       "model.layers.10.mlp",
+      "model.layers.16.mlp",
       "model.layers.15.mlp",
+      "model.layers.5.mlp",
+      "model.layers.5.self_attn",
+      "model.layers.8.mlp",
       "visual.blocks.27.attn",
+      "visual.blocks.31.mlp",
       "visual.blocks.28.attn",
+      "visual.blocks.21.attn",
       "visual.blocks.31.attn",
+      "visual.blocks.26.attn",
+      "visual.blocks.29.attn",
       "visual.merger.mlp",
       "visual.blocks.30.mlp",
       "visual.blocks.24.attn",
       "visual.blocks.30.attn",
       "visual.blocks.22.attn",
+      "visual.blocks.25.attn",
       "visual.blocks.20.attn",
+      "visual.blocks.29.mlp",
       "model.layers.6.mlp",
       "visual.blocks.26.mlp",
+      "visual.blocks.25.mlp",
       "visual.blocks.27.mlp",
+      "visual.blocks.18.attn",
       "visual.blocks.19.mlp",
+      "visual.blocks.19.attn",
       "visual.blocks.23.mlp",
+      "visual.blocks.17.attn",
       "visual.blocks.23.attn",
+      "visual.blocks.20.mlp",
       "visual.blocks.22.mlp",
+      "visual.blocks.9.mlp",
       "visual.blocks.14.attn",
+      "visual.blocks.18.mlp",
+      "visual.blocks.28.mlp",
+      "visual.blocks.24.mlp",
+      "visual.blocks.11.attn",
       "visual.blocks.10.mlp",
+      "visual.blocks.6.mlp",
+      "visual.blocks.16.attn",
+      "visual.blocks.21.mlp",
       "visual.blocks.13.attn",
+      "visual.blocks.12.attn",
       "visual.blocks.4.mlp",
+      "visual.blocks.10.attn",
+      "visual.blocks.11.mlp",
+      "visual.blocks.9.attn",
       "visual.blocks.8.mlp",
+      "visual.blocks.16.mlp",
       "visual.blocks.2.attn",
+      "visual.blocks.5.mlp",
+      "visual.blocks.2.mlp",
       "visual.blocks.8.attn",
+      "visual.blocks.6.attn",
       "visual.blocks.13.mlp",
+      "visual.blocks.7.mlp",
+      "visual.blocks.1.mlp",
       "visual.blocks.15.mlp",
       "visual.blocks.1.attn",
+      "visual.blocks.3.mlp",
       "visual.blocks.15.attn",
       "visual.blocks.7.attn",
+      "visual.blocks.12.mlp",
+      "visual.blocks.5.attn",
+      "visual.blocks.4.attn",
       "visual.blocks.3.attn",
+      "visual.blocks.0.attn",
       "visual.blocks.14.mlp",
+      "visual.blocks.17.mlp",
       "visual.blocks.0.mlp",
+      "visual.blocks.31.mlp.down_proj"
     ],
     "llm_int8_threshold": 6.0,
     "load_in_4bit": true,
   },
   "rope_theta": 1000000.0,
   "sliding_window": 32768,
+  "text_config": {
+    "architectures": [
+      "Qwen2_5_VLForConditionalGeneration"
+    ],
+    "attention_dropout": 0.0,
+    "eos_token_id": 151645,
+    "hidden_act": "silu",
+    "hidden_size": 5120,
+    "image_token_id": null,
+    "initializer_range": 0.02,
+    "intermediate_size": 27648,
+    "max_position_embeddings": 128000,
+    "max_window_layers": 64,
+    "model_type": "qwen2_5_vl_text",
+    "num_attention_heads": 40,
+    "num_hidden_layers": 64,
+    "num_key_value_heads": 8,
+    "pad_token_id": 151643,
+    "rms_norm_eps": 1e-06,
+    "rope_scaling": {
+      "mrope_section": [
+        16,
+        24,
+        24
+      ],
+      "rope_type": "default",
+      "type": "default"
+    },
+    "rope_theta": 1000000.0,
+    "sliding_window": 32768,
+    "torch_dtype": "bfloat16",
+    "use_cache": true,
+    "use_sliding_window": false,
+    "video_token_id": null,
+    "vision_end_token_id": 151653,
+    "vision_start_token_id": 151652,
+    "vision_token_id": 151654,
+    "vocab_size": 152064
+  },
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
+  "transformers_version": "4.52.0.dev0",
   "unsloth_fixed": true,
   "use_cache": true,
   "use_sliding_window": false,
     "hidden_size": 1280,
     "in_channels": 3,
     "in_chans": 3,
+    "initializer_range": 0.02,
     "intermediate_size": 3456,
     "model_type": "qwen2_5_vl",
     "num_heads": 16,

generation_config.json CHANGED Viewed

@@ -5,9 +5,9 @@
     151645,
     151643
   ],
-  "max_length": 32768,
   "pad_token_id": 151654,
   "repetition_penalty": 1.05,
   "temperature": 1e-06,
-  "transformers_version": "4.50.1"
 }

     151645,
     151643
   ],
+  "max_length": 128000,
   "pad_token_id": 151654,
   "repetition_penalty": 1.05,
   "temperature": 1e-06,
+  "transformers_version": "4.52.0.dev0"
 }

model-00001-of-00005.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b73548a3ed8963202b0558db433b2cf3e37f29485443badcff32ea55a645f5a5
-size 4759939934

 version https://git-lfs.github.com/spec/v1
+oid sha256:75e8b15c927cc3ae1737f61bc7b238d5e008a73b5e8052ee8f75189b710a70c1
+size 4884840863

model-00002-of-00005.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:64f31c761976fdd3dba7117d1d8dddbda583cba145359980b73b04eb785c0170
-size 4991807831

 version https://git-lfs.github.com/spec/v1
+oid sha256:614eb314745898b39031deafa6486b022a5272920cf7a2ffddd4e3d35293268d
+size 4753752247

model-00003-of-00005.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bbaa6846f566db7ad67a1caff12f4f8eab7b1cd9ce496d6a7a3b6214426079c2
-size 4993690414

 version https://git-lfs.github.com/spec/v1
+oid sha256:9822c75f53a00867e05736b063a57010714a63d2302c3bf66ba407bbdbd29cae
+size 4989181706

model-00004-of-00005.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7f1fd7b300eb6bd4b34e7f78c83faad6baaae561852651cb8ac70318af128fc5
-size 4958587451

 version https://git-lfs.github.com/spec/v1
+oid sha256:36c7b46219878dff2dcf373aa56347da55958df1d9f9d5e0ae94c4b25e87eab0
+size 4939613635

model-00005-of-00005.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e4469c46443a245744089c31dfd38d43e7417a514799b62e72424d2037d9f0d3
-size 4040475063

 version https://git-lfs.github.com/spec/v1
+oid sha256:98cdc0eb48e4279e454248b2aa1937209041cf6a91007d8dbab5494742270310
+size 4900743706

model.safetensors.index.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "metadata": {
-    "total_size": 23744109829
   },
   "weight_map": {
     "lm_head.weight": "model-00005-of-00005.safetensors",
@@ -319,11 +319,11 @@
     "model.layers.14.self_attn.v_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
     "model.layers.14.self_attn.v_proj.weight.quant_map": "model-00002-of-00005.safetensors",
     "model.layers.14.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
-    "model.layers.15.input_layernorm.weight": "model-00002-of-00005.safetensors",
-    "model.layers.15.mlp.down_proj.weight": "model-00002-of-00005.safetensors",
     "model.layers.15.mlp.gate_proj.weight": "model-00002-of-00005.safetensors",
-    "model.layers.15.mlp.up_proj.weight": "model-00002-of-00005.safetensors",
-    "model.layers.15.post_attention_layernorm.weight": "model-00002-of-00005.safetensors",
     "model.layers.15.self_attn.k_proj.bias": "model-00002-of-00005.safetensors",
     "model.layers.15.self_attn.k_proj.weight": "model-00002-of-00005.safetensors",
     "model.layers.15.self_attn.k_proj.weight.absmax": "model-00002-of-00005.safetensors",
@@ -351,53 +351,38 @@
     "model.layers.15.self_attn.v_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
     "model.layers.15.self_attn.v_proj.weight.quant_map": "model-00002-of-00005.safetensors",
     "model.layers.15.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
-    "model.layers.16.input_layernorm.weight": "model-00002-of-00005.safetensors",
-    "model.layers.16.mlp.down_proj.weight": "model-00002-of-00005.safetensors",
-    "model.layers.16.mlp.down_proj.weight.absmax": "model-00002-of-00005.safetensors",
-    "model.layers.16.mlp.down_proj.weight.nested_absmax": "model-00002-of-00005.safetensors",
-    "model.layers.16.mlp.down_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.16.mlp.down_proj.weight.quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.16.mlp.down_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
-    "model.layers.16.mlp.gate_proj.weight": "model-00002-of-00005.safetensors",
-    "model.layers.16.mlp.gate_proj.weight.absmax": "model-00002-of-00005.safetensors",
-    "model.layers.16.mlp.gate_proj.weight.nested_absmax": "model-00002-of-00005.safetensors",
-    "model.layers.16.mlp.gate_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.16.mlp.gate_proj.weight.quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.16.mlp.gate_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
-    "model.layers.16.mlp.up_proj.weight": "model-00002-of-00005.safetensors",
-    "model.layers.16.mlp.up_proj.weight.absmax": "model-00002-of-00005.safetensors",
-    "model.layers.16.mlp.up_proj.weight.nested_absmax": "model-00002-of-00005.safetensors",
-    "model.layers.16.mlp.up_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.16.mlp.up_proj.weight.quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.16.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
-    "model.layers.16.post_attention_layernorm.weight": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.k_proj.bias": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.k_proj.weight": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.k_proj.weight.absmax": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.k_proj.weight.nested_absmax": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.k_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.k_proj.weight.quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.k_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.o_proj.weight": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.o_proj.weight.absmax": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.o_proj.weight.nested_absmax": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.o_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.o_proj.weight.quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.o_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.q_proj.bias": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.q_proj.weight": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.q_proj.weight.absmax": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.q_proj.weight.nested_absmax": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.q_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.q_proj.weight.quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.q_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.v_proj.bias": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.v_proj.weight": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.v_proj.weight.absmax": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.v_proj.weight.nested_absmax": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.v_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.v_proj.weight.quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.16.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
     "model.layers.17.input_layernorm.weight": "model-00003-of-00005.safetensors",
     "model.layers.17.mlp.down_proj.weight": "model-00003-of-00005.safetensors",
     "model.layers.17.mlp.down_proj.weight.absmax": "model-00003-of-00005.safetensors",
@@ -418,33 +403,33 @@
     "model.layers.17.mlp.up_proj.weight.quant_map": "model-00003-of-00005.safetensors",
     "model.layers.17.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
     "model.layers.17.post_attention_layernorm.weight": "model-00003-of-00005.safetensors",
-    "model.layers.17.self_attn.k_proj.bias": "model-00002-of-00005.safetensors",
-    "model.layers.17.self_attn.k_proj.weight": "model-00002-of-00005.safetensors",
-    "model.layers.17.self_attn.k_proj.weight.absmax": "model-00002-of-00005.safetensors",
-    "model.layers.17.self_attn.k_proj.weight.nested_absmax": "model-00002-of-00005.safetensors",
-    "model.layers.17.self_attn.k_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.17.self_attn.k_proj.weight.quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.17.self_attn.k_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
     "model.layers.17.self_attn.o_proj.weight": "model-00003-of-00005.safetensors",
     "model.layers.17.self_attn.o_proj.weight.absmax": "model-00003-of-00005.safetensors",
     "model.layers.17.self_attn.o_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
     "model.layers.17.self_attn.o_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
     "model.layers.17.self_attn.o_proj.weight.quant_map": "model-00003-of-00005.safetensors",
     "model.layers.17.self_attn.o_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
-    "model.layers.17.self_attn.q_proj.bias": "model-00002-of-00005.safetensors",
-    "model.layers.17.self_attn.q_proj.weight": "model-00002-of-00005.safetensors",
-    "model.layers.17.self_attn.q_proj.weight.absmax": "model-00002-of-00005.safetensors",
-    "model.layers.17.self_attn.q_proj.weight.nested_absmax": "model-00002-of-00005.safetensors",
-    "model.layers.17.self_attn.q_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.17.self_attn.q_proj.weight.quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.17.self_attn.q_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
-    "model.layers.17.self_attn.v_proj.bias": "model-00002-of-00005.safetensors",
-    "model.layers.17.self_attn.v_proj.weight": "model-00002-of-00005.safetensors",
-    "model.layers.17.self_attn.v_proj.weight.absmax": "model-00002-of-00005.safetensors",
-    "model.layers.17.self_attn.v_proj.weight.nested_absmax": "model-00002-of-00005.safetensors",
-    "model.layers.17.self_attn.v_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.17.self_attn.v_proj.weight.quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.17.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
     "model.layers.18.input_layernorm.weight": "model-00003-of-00005.safetensors",
     "model.layers.18.mlp.down_proj.weight": "model-00003-of-00005.safetensors",
     "model.layers.18.mlp.down_proj.weight.absmax": "model-00003-of-00005.safetensors",
@@ -682,8 +667,23 @@
     "model.layers.21.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
     "model.layers.22.input_layernorm.weight": "model-00003-of-00005.safetensors",
     "model.layers.22.mlp.down_proj.weight": "model-00003-of-00005.safetensors",
     "model.layers.22.mlp.gate_proj.weight": "model-00003-of-00005.safetensors",
     "model.layers.22.mlp.up_proj.weight": "model-00003-of-00005.safetensors",
     "model.layers.22.post_attention_layernorm.weight": "model-00003-of-00005.safetensors",
     "model.layers.22.self_attn.k_proj.bias": "model-00003-of-00005.safetensors",
     "model.layers.22.self_attn.k_proj.weight": "model-00003-of-00005.safetensors",
@@ -1135,26 +1135,26 @@
     "model.layers.30.self_attn.v_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
     "model.layers.30.self_attn.v_proj.weight.quant_map": "model-00003-of-00005.safetensors",
     "model.layers.30.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
-    "model.layers.31.input_layernorm.weight": "model-00003-of-00005.safetensors",
-    "model.layers.31.mlp.down_proj.weight": "model-00003-of-00005.safetensors",
-    "model.layers.31.mlp.down_proj.weight.absmax": "model-00003-of-00005.safetensors",
-    "model.layers.31.mlp.down_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
-    "model.layers.31.mlp.down_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.31.mlp.down_proj.weight.quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.31.mlp.down_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
-    "model.layers.31.mlp.gate_proj.weight": "model-00003-of-00005.safetensors",
-    "model.layers.31.mlp.gate_proj.weight.absmax": "model-00003-of-00005.safetensors",
-    "model.layers.31.mlp.gate_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
-    "model.layers.31.mlp.gate_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.31.mlp.gate_proj.weight.quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.31.mlp.gate_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
-    "model.layers.31.mlp.up_proj.weight": "model-00003-of-00005.safetensors",
-    "model.layers.31.mlp.up_proj.weight.absmax": "model-00003-of-00005.safetensors",
-    "model.layers.31.mlp.up_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
-    "model.layers.31.mlp.up_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.31.mlp.up_proj.weight.quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.31.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
-    "model.layers.31.post_attention_layernorm.weight": "model-00003-of-00005.safetensors",
     "model.layers.31.self_attn.k_proj.bias": "model-00003-of-00005.safetensors",
     "model.layers.31.self_attn.k_proj.weight": "model-00003-of-00005.safetensors",
     "model.layers.31.self_attn.k_proj.weight.absmax": "model-00003-of-00005.safetensors",
@@ -1162,12 +1162,12 @@
     "model.layers.31.self_attn.k_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
     "model.layers.31.self_attn.k_proj.weight.quant_map": "model-00003-of-00005.safetensors",
     "model.layers.31.self_attn.k_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
-    "model.layers.31.self_attn.o_proj.weight": "model-00003-of-00005.safetensors",
-    "model.layers.31.self_attn.o_proj.weight.absmax": "model-00003-of-00005.safetensors",
-    "model.layers.31.self_attn.o_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
-    "model.layers.31.self_attn.o_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.31.self_attn.o_proj.weight.quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.31.self_attn.o_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
     "model.layers.31.self_attn.q_proj.bias": "model-00003-of-00005.safetensors",
     "model.layers.31.self_attn.q_proj.weight": "model-00003-of-00005.safetensors",
     "model.layers.31.self_attn.q_proj.weight.absmax": "model-00003-of-00005.safetensors",
@@ -1182,100 +1182,100 @@
     "model.layers.31.self_attn.v_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
     "model.layers.31.self_attn.v_proj.weight.quant_map": "model-00003-of-00005.safetensors",
     "model.layers.31.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
-    "model.layers.32.input_layernorm.weight": "model-00003-of-00005.safetensors",
-    "model.layers.32.mlp.down_proj.weight": "model-00003-of-00005.safetensors",
-    "model.layers.32.mlp.down_proj.weight.absmax": "model-00003-of-00005.safetensors",
-    "model.layers.32.mlp.down_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
-    "model.layers.32.mlp.down_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.32.mlp.down_proj.weight.quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.32.mlp.down_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
-    "model.layers.32.mlp.gate_proj.weight": "model-00003-of-00005.safetensors",
-    "model.layers.32.mlp.gate_proj.weight.absmax": "model-00003-of-00005.safetensors",
-    "model.layers.32.mlp.gate_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
-    "model.layers.32.mlp.gate_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.32.mlp.gate_proj.weight.quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.32.mlp.gate_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
-    "model.layers.32.mlp.up_proj.weight": "model-00003-of-00005.safetensors",
-    "model.layers.32.mlp.up_proj.weight.absmax": "model-00003-of-00005.safetensors",
-    "model.layers.32.mlp.up_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
-    "model.layers.32.mlp.up_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.32.mlp.up_proj.weight.quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.32.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
-    "model.layers.32.post_attention_layernorm.weight": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.k_proj.bias": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.k_proj.weight": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.k_proj.weight.absmax": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.k_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.k_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.k_proj.weight.quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.k_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.o_proj.weight": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.o_proj.weight.absmax": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.o_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.o_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.o_proj.weight.quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.o_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.q_proj.bias": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.q_proj.weight": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.q_proj.weight.absmax": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.q_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.q_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.q_proj.weight.quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.q_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.v_proj.bias": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.v_proj.weight": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.v_proj.weight.absmax": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.v_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.v_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.v_proj.weight.quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.32.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
-    "model.layers.33.input_layernorm.weight": "model-00003-of-00005.safetensors",
-    "model.layers.33.mlp.down_proj.weight": "model-00003-of-00005.safetensors",
-    "model.layers.33.mlp.down_proj.weight.absmax": "model-00003-of-00005.safetensors",
-    "model.layers.33.mlp.down_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
-    "model.layers.33.mlp.down_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.33.mlp.down_proj.weight.quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.33.mlp.down_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
-    "model.layers.33.mlp.gate_proj.weight": "model-00003-of-00005.safetensors",
-    "model.layers.33.mlp.gate_proj.weight.absmax": "model-00003-of-00005.safetensors",
-    "model.layers.33.mlp.gate_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
-    "model.layers.33.mlp.gate_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.33.mlp.gate_proj.weight.quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.33.mlp.gate_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
-    "model.layers.33.mlp.up_proj.weight": "model-00003-of-00005.safetensors",
-    "model.layers.33.mlp.up_proj.weight.absmax": "model-00003-of-00005.safetensors",
-    "model.layers.33.mlp.up_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
-    "model.layers.33.mlp.up_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.33.mlp.up_proj.weight.quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.33.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
-    "model.layers.33.post_attention_layernorm.weight": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.k_proj.bias": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.k_proj.weight": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.k_proj.weight.absmax": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.k_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.k_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.k_proj.weight.quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.k_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.o_proj.weight": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.o_proj.weight.absmax": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.o_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.o_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.o_proj.weight.quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.o_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.q_proj.bias": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.q_proj.weight": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.q_proj.weight.absmax": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.q_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.q_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.q_proj.weight.quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.q_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.v_proj.bias": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.v_proj.weight": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.v_proj.weight.absmax": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.v_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.v_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.v_proj.weight.quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.33.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
     "model.layers.34.input_layernorm.weight": "model-00004-of-00005.safetensors",
     "model.layers.34.mlp.down_proj.weight": "model-00004-of-00005.safetensors",
     "model.layers.34.mlp.down_proj.weight.absmax": "model-00004-of-00005.safetensors",
@@ -1283,12 +1283,12 @@
     "model.layers.34.mlp.down_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
     "model.layers.34.mlp.down_proj.weight.quant_map": "model-00004-of-00005.safetensors",
     "model.layers.34.mlp.down_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.34.mlp.gate_proj.weight": "model-00003-of-00005.safetensors",
-    "model.layers.34.mlp.gate_proj.weight.absmax": "model-00003-of-00005.safetensors",
-    "model.layers.34.mlp.gate_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
-    "model.layers.34.mlp.gate_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.34.mlp.gate_proj.weight.quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.34.mlp.gate_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
     "model.layers.34.mlp.up_proj.weight": "model-00004-of-00005.safetensors",
     "model.layers.34.mlp.up_proj.weight.absmax": "model-00004-of-00005.safetensors",
     "model.layers.34.mlp.up_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
@@ -1296,33 +1296,33 @@
     "model.layers.34.mlp.up_proj.weight.quant_map": "model-00004-of-00005.safetensors",
     "model.layers.34.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
     "model.layers.34.post_attention_layernorm.weight": "model-00004-of-00005.safetensors",
-    "model.layers.34.self_attn.k_proj.bias": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.k_proj.weight": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.k_proj.weight.absmax": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.k_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.k_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.k_proj.weight.quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.k_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.o_proj.weight": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.o_proj.weight.absmax": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.o_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.o_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.o_proj.weight.quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.o_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.q_proj.bias": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.q_proj.weight": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.q_proj.weight.absmax": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.q_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.q_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.q_proj.weight.quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.q_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.v_proj.bias": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.v_proj.weight": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.v_proj.weight.absmax": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.v_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.v_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.v_proj.weight.quant_map": "model-00003-of-00005.safetensors",
-    "model.layers.34.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
     "model.layers.35.input_layernorm.weight": "model-00004-of-00005.safetensors",
     "model.layers.35.mlp.down_proj.weight": "model-00004-of-00005.safetensors",
     "model.layers.35.mlp.down_proj.weight.absmax": "model-00004-of-00005.safetensors",
@@ -2075,60 +2075,25 @@
     "model.layers.49.self_attn.v_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
     "model.layers.49.self_attn.v_proj.weight.quant_map": "model-00004-of-00005.safetensors",
     "model.layers.49.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.5.input_layernorm.weight": "model-00001-of-00005.safetensors",
-    "model.layers.5.mlp.down_proj.weight": "model-00001-of-00005.safetensors",
-    "model.layers.5.mlp.down_proj.weight.absmax": "model-00001-of-00005.safetensors",
-    "model.layers.5.mlp.down_proj.weight.nested_absmax": "model-00001-of-00005.safetensors",
-    "model.layers.5.mlp.down_proj.weight.nested_quant_map": "model-00001-of-00005.safetensors",
-    "model.layers.5.mlp.down_proj.weight.quant_map": "model-00001-of-00005.safetensors",
-    "model.layers.5.mlp.down_proj.weight.quant_state.bitsandbytes__nf4": "model-00001-of-00005.safetensors",
     "model.layers.5.mlp.gate_proj.weight": "model-00001-of-00005.safetensors",
-    "model.layers.5.mlp.gate_proj.weight.absmax": "model-00001-of-00005.safetensors",
-    "model.layers.5.mlp.gate_proj.weight.nested_absmax": "model-00001-of-00005.safetensors",
-    "model.layers.5.mlp.gate_proj.weight.nested_quant_map": "model-00001-of-00005.safetensors",
-    "model.layers.5.mlp.gate_proj.weight.quant_map": "model-00001-of-00005.safetensors",
-    "model.layers.5.mlp.gate_proj.weight.quant_state.bitsandbytes__nf4": "model-00001-of-00005.safetensors",
     "model.layers.5.mlp.up_proj.weight": "model-00001-of-00005.safetensors",
-    "model.layers.5.mlp.up_proj.weight.absmax": "model-00001-of-00005.safetensors",
-    "model.layers.5.mlp.up_proj.weight.nested_absmax": "model-00001-of-00005.safetensors",
-    "model.layers.5.mlp.up_proj.weight.nested_quant_map": "model-00001-of-00005.safetensors",
-    "model.layers.5.mlp.up_proj.weight.quant_map": "model-00001-of-00005.safetensors",
-    "model.layers.5.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00001-of-00005.safetensors",
-    "model.layers.5.post_attention_layernorm.weight": "model-00001-of-00005.safetensors",
     "model.layers.5.self_attn.k_proj.bias": "model-00001-of-00005.safetensors",
     "model.layers.5.self_attn.k_proj.weight": "model-00001-of-00005.safetensors",
-    "model.layers.5.self_attn.k_proj.weight.absmax": "model-00001-of-00005.safetensors",
-    "model.layers.5.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00005.safetensors",
-    "model.layers.5.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00005.safetensors",
-    "model.layers.5.self_attn.k_proj.weight.quant_map": "model-00001-of-00005.safetensors",
-    "model.layers.5.self_attn.k_proj.weight.quant_state.bitsandbytes__nf4": "model-00001-of-00005.safetensors",
     "model.layers.5.self_attn.o_proj.weight": "model-00001-of-00005.safetensors",
-    "model.layers.5.self_attn.o_proj.weight.absmax": "model-00001-of-00005.safetensors",
-    "model.layers.5.self_attn.o_proj.weight.nested_absmax": "model-00001-of-00005.safetensors",
-    "model.layers.5.self_attn.o_proj.weight.nested_quant_map": "model-00001-of-00005.safetensors",
-    "model.layers.5.self_attn.o_proj.weight.quant_map": "model-00001-of-00005.safetensors",
-    "model.layers.5.self_attn.o_proj.weight.quant_state.bitsandbytes__nf4": "model-00001-of-00005.safetensors",
     "model.layers.5.self_attn.q_proj.bias": "model-00001-of-00005.safetensors",
     "model.layers.5.self_attn.q_proj.weight": "model-00001-of-00005.safetensors",
-    "model.layers.5.self_attn.q_proj.weight.absmax": "model-00001-of-00005.safetensors",
-    "model.layers.5.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00005.safetensors",
-    "model.layers.5.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00005.safetensors",
-    "model.layers.5.self_attn.q_proj.weight.quant_map": "model-00001-of-00005.safetensors",
-    "model.layers.5.self_attn.q_proj.weight.quant_state.bitsandbytes__nf4": "model-00001-of-00005.safetensors",
     "model.layers.5.self_attn.v_proj.bias": "model-00001-of-00005.safetensors",
     "model.layers.5.self_attn.v_proj.weight": "model-00001-of-00005.safetensors",
-    "model.layers.5.self_attn.v_proj.weight.absmax": "model-00001-of-00005.safetensors",
-    "model.layers.5.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00005.safetensors",
-    "model.layers.5.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00005.safetensors",
-    "model.layers.5.self_attn.v_proj.weight.quant_map": "model-00001-of-00005.safetensors",
-    "model.layers.5.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00001-of-00005.safetensors",
-    "model.layers.50.input_layernorm.weight": "model-00004-of-00005.safetensors",
-    "model.layers.50.mlp.down_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.50.mlp.down_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.50.mlp.down_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.50.mlp.down_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.50.mlp.down_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.50.mlp.down_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
     "model.layers.50.mlp.gate_proj.weight": "model-00004-of-00005.safetensors",
     "model.layers.50.mlp.gate_proj.weight.absmax": "model-00004-of-00005.safetensors",
     "model.layers.50.mlp.gate_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
@@ -2141,7 +2106,7 @@
     "model.layers.50.mlp.up_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
     "model.layers.50.mlp.up_proj.weight.quant_map": "model-00004-of-00005.safetensors",
     "model.layers.50.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.50.post_attention_layernorm.weight": "model-00004-of-00005.safetensors",
     "model.layers.50.self_attn.k_proj.bias": "model-00004-of-00005.safetensors",
     "model.layers.50.self_attn.k_proj.weight": "model-00004-of-00005.safetensors",
     "model.layers.50.self_attn.k_proj.weight.absmax": "model-00004-of-00005.safetensors",
@@ -2169,147 +2134,147 @@
     "model.layers.50.self_attn.v_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
     "model.layers.50.self_attn.v_proj.weight.quant_map": "model-00004-of-00005.safetensors",
     "model.layers.50.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.51.input_layernorm.weight": "model-00004-of-00005.safetensors",
-    "model.layers.51.mlp.down_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.51.mlp.down_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.51.mlp.down_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.51.mlp.down_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.51.mlp.down_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.51.mlp.down_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.51.mlp.gate_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.51.mlp.gate_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.51.mlp.gate_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.51.mlp.gate_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.51.mlp.gate_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.51.mlp.gate_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.51.mlp.up_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.51.mlp.up_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.51.mlp.up_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.51.mlp.up_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.51.mlp.up_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.51.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.51.post_attention_layernorm.weight": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.k_proj.bias": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.k_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.k_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.k_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.k_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.k_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.k_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.o_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.o_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.o_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.o_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.o_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.o_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.q_proj.bias": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.q_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.q_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.q_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.q_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.q_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.q_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.v_proj.bias": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.v_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.v_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.v_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.v_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.v_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.51.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.52.input_layernorm.weight": "model-00004-of-00005.safetensors",
-    "model.layers.52.mlp.down_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.52.mlp.down_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.52.mlp.down_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.52.mlp.down_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.52.mlp.down_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.52.mlp.down_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.52.mlp.gate_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.52.mlp.gate_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.52.mlp.gate_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.52.mlp.gate_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.52.mlp.gate_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.52.mlp.gate_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.52.mlp.up_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.52.mlp.up_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.52.mlp.up_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.52.mlp.up_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.52.mlp.up_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.52.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.52.post_attention_layernorm.weight": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.k_proj.bias": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.k_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.k_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.k_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.k_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.k_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.k_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.o_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.o_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.o_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.o_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.o_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.o_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.q_proj.bias": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.q_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.q_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.q_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.q_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.q_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.q_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.v_proj.bias": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.v_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.v_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.v_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.v_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.v_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.52.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.53.input_layernorm.weight": "model-00004-of-00005.safetensors",
-    "model.layers.53.mlp.down_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.53.mlp.down_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.53.mlp.down_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.53.mlp.down_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.53.mlp.down_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.53.mlp.down_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.53.mlp.gate_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.53.mlp.gate_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.53.mlp.gate_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.53.mlp.gate_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.53.mlp.gate_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.53.mlp.gate_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.53.mlp.up_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.53.mlp.up_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.53.mlp.up_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.53.mlp.up_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.53.mlp.up_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.53.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.53.post_attention_layernorm.weight": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.k_proj.bias": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.k_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.k_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.k_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.k_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.k_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.k_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.o_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.o_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.o_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.o_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.o_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.o_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.q_proj.bias": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.q_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.q_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.q_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.q_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.q_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.q_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.v_proj.bias": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.v_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.v_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.v_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.v_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.v_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.53.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
     "model.layers.54.input_layernorm.weight": "model-00005-of-00005.safetensors",
     "model.layers.54.mlp.down_proj.weight": "model-00005-of-00005.safetensors",
     "model.layers.54.mlp.down_proj.weight.absmax": "model-00005-of-00005.safetensors",
@@ -2330,33 +2295,33 @@
     "model.layers.54.mlp.up_proj.weight.quant_map": "model-00005-of-00005.safetensors",
     "model.layers.54.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
     "model.layers.54.post_attention_layernorm.weight": "model-00005-of-00005.safetensors",
-    "model.layers.54.self_attn.k_proj.bias": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.k_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.k_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.k_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.k_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.k_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.k_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.o_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.o_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.o_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.o_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.o_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.o_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.q_proj.bias": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.q_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.q_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.q_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.q_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.q_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.q_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.v_proj.bias": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.v_proj.weight": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.v_proj.weight.absmax": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.v_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.v_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.v_proj.weight.quant_map": "model-00004-of-00005.safetensors",
-    "model.layers.54.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
     "model.layers.55.input_layernorm.weight": "model-00005-of-00005.safetensors",
     "model.layers.55.mlp.down_proj.weight": "model-00005-of-00005.safetensors",
     "model.layers.55.mlp.down_proj.weight.absmax": "model-00005-of-00005.safetensors",
@@ -2594,36 +2559,36 @@
     "model.layers.59.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
     "model.layers.6.input_layernorm.weight": "model-00002-of-00005.safetensors",
     "model.layers.6.mlp.down_proj.weight": "model-00002-of-00005.safetensors",
-    "model.layers.6.mlp.gate_proj.weight": "model-00001-of-00005.safetensors",
     "model.layers.6.mlp.up_proj.weight": "model-00002-of-00005.safetensors",
     "model.layers.6.post_attention_layernorm.weight": "model-00002-of-00005.safetensors",
-    "model.layers.6.self_attn.k_proj.bias": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.k_proj.weight": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.k_proj.weight.absmax": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.k_proj.weight.nested_absmax": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.k_proj.weight.nested_quant_map": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.k_proj.weight.quant_map": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.k_proj.weight.quant_state.bitsandbytes__nf4": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.o_proj.weight": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.o_proj.weight.absmax": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.o_proj.weight.nested_absmax": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.o_proj.weight.nested_quant_map": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.o_proj.weight.quant_map": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.o_proj.weight.quant_state.bitsandbytes__nf4": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.q_proj.bias": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.q_proj.weight": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.q_proj.weight.absmax": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.q_proj.weight.nested_absmax": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.q_proj.weight.nested_quant_map": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.q_proj.weight.quant_map": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.q_proj.weight.quant_state.bitsandbytes__nf4": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.v_proj.bias": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.v_proj.weight": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.v_proj.weight.absmax": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.v_proj.weight.nested_absmax": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.v_proj.weight.nested_quant_map": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.v_proj.weight.quant_map": "model-00001-of-00005.safetensors",
-    "model.layers.6.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00001-of-00005.safetensors",
     "model.layers.60.input_layernorm.weight": "model-00005-of-00005.safetensors",
     "model.layers.60.mlp.down_proj.weight": "model-00005-of-00005.safetensors",
     "model.layers.60.mlp.down_proj.weight.absmax": "model-00005-of-00005.safetensors",
@@ -2814,8 +2779,23 @@
     "model.layers.63.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
     "model.layers.7.input_layernorm.weight": "model-00002-of-00005.safetensors",
     "model.layers.7.mlp.down_proj.weight": "model-00002-of-00005.safetensors",
     "model.layers.7.mlp.gate_proj.weight": "model-00002-of-00005.safetensors",
     "model.layers.7.mlp.up_proj.weight": "model-00002-of-00005.safetensors",
     "model.layers.7.post_attention_layernorm.weight": "model-00002-of-00005.safetensors",
     "model.layers.7.self_attn.k_proj.bias": "model-00002-of-00005.safetensors",
     "model.layers.7.self_attn.k_proj.weight": "model-00002-of-00005.safetensors",
@@ -2846,23 +2826,8 @@
     "model.layers.7.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
     "model.layers.8.input_layernorm.weight": "model-00002-of-00005.safetensors",
     "model.layers.8.mlp.down_proj.weight": "model-00002-of-00005.safetensors",
-    "model.layers.8.mlp.down_proj.weight.absmax": "model-00002-of-00005.safetensors",
-    "model.layers.8.mlp.down_proj.weight.nested_absmax": "model-00002-of-00005.safetensors",
-    "model.layers.8.mlp.down_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.8.mlp.down_proj.weight.quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.8.mlp.down_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
     "model.layers.8.mlp.gate_proj.weight": "model-00002-of-00005.safetensors",
-    "model.layers.8.mlp.gate_proj.weight.absmax": "model-00002-of-00005.safetensors",
-    "model.layers.8.mlp.gate_proj.weight.nested_absmax": "model-00002-of-00005.safetensors",
-    "model.layers.8.mlp.gate_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.8.mlp.gate_proj.weight.quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.8.mlp.gate_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
     "model.layers.8.mlp.up_proj.weight": "model-00002-of-00005.safetensors",
-    "model.layers.8.mlp.up_proj.weight.absmax": "model-00002-of-00005.safetensors",
-    "model.layers.8.mlp.up_proj.weight.nested_absmax": "model-00002-of-00005.safetensors",
-    "model.layers.8.mlp.up_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.8.mlp.up_proj.weight.quant_map": "model-00002-of-00005.safetensors",
-    "model.layers.8.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
     "model.layers.8.post_attention_layernorm.weight": "model-00002-of-00005.safetensors",
     "model.layers.8.self_attn.k_proj.bias": "model-00002-of-00005.safetensors",
     "model.layers.8.self_attn.k_proj.weight": "model-00002-of-00005.safetensors",

 {
   "metadata": {
+    "total_size": 24467745165
   },
   "weight_map": {
     "lm_head.weight": "model-00005-of-00005.safetensors",
     "model.layers.14.self_attn.v_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
     "model.layers.14.self_attn.v_proj.weight.quant_map": "model-00002-of-00005.safetensors",
     "model.layers.14.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
+    "model.layers.15.input_layernorm.weight": "model-00003-of-00005.safetensors",
+    "model.layers.15.mlp.down_proj.weight": "model-00003-of-00005.safetensors",
     "model.layers.15.mlp.gate_proj.weight": "model-00002-of-00005.safetensors",
+    "model.layers.15.mlp.up_proj.weight": "model-00003-of-00005.safetensors",
+    "model.layers.15.post_attention_layernorm.weight": "model-00003-of-00005.safetensors",
     "model.layers.15.self_attn.k_proj.bias": "model-00002-of-00005.safetensors",
     "model.layers.15.self_attn.k_proj.weight": "model-00002-of-00005.safetensors",
     "model.layers.15.self_attn.k_proj.weight.absmax": "model-00002-of-00005.safetensors",
     "model.layers.15.self_attn.v_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
     "model.layers.15.self_attn.v_proj.weight.quant_map": "model-00002-of-00005.safetensors",
     "model.layers.15.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
+    "model.layers.16.input_layernorm.weight": "model-00003-of-00005.safetensors",
+    "model.layers.16.mlp.down_proj.weight": "model-00003-of-00005.safetensors",
+    "model.layers.16.mlp.gate_proj.weight": "model-00003-of-00005.safetensors",
+    "model.layers.16.mlp.up_proj.weight": "model-00003-of-00005.safetensors",
+    "model.layers.16.post_attention_layernorm.weight": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.k_proj.bias": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.k_proj.weight": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.k_proj.weight.absmax": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.k_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.k_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.k_proj.weight.quant_map": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.k_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.o_proj.weight": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.o_proj.weight.absmax": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.o_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.o_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.o_proj.weight.quant_map": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.o_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.q_proj.bias": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.q_proj.weight": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.q_proj.weight.absmax": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.q_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.q_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.q_proj.weight.quant_map": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.q_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.v_proj.bias": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.v_proj.weight": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.v_proj.weight.absmax": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.v_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.v_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.v_proj.weight.quant_map": "model-00003-of-00005.safetensors",
+    "model.layers.16.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
     "model.layers.17.input_layernorm.weight": "model-00003-of-00005.safetensors",
     "model.layers.17.mlp.down_proj.weight": "model-00003-of-00005.safetensors",
     "model.layers.17.mlp.down_proj.weight.absmax": "model-00003-of-00005.safetensors",
     "model.layers.17.mlp.up_proj.weight.quant_map": "model-00003-of-00005.safetensors",
     "model.layers.17.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
     "model.layers.17.post_attention_layernorm.weight": "model-00003-of-00005.safetensors",
+    "model.layers.17.self_attn.k_proj.bias": "model-00003-of-00005.safetensors",
+    "model.layers.17.self_attn.k_proj.weight": "model-00003-of-00005.safetensors",
+    "model.layers.17.self_attn.k_proj.weight.absmax": "model-00003-of-00005.safetensors",
+    "model.layers.17.self_attn.k_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
+    "model.layers.17.self_attn.k_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
+    "model.layers.17.self_attn.k_proj.weight.quant_map": "model-00003-of-00005.safetensors",
+    "model.layers.17.self_attn.k_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
     "model.layers.17.self_attn.o_proj.weight": "model-00003-of-00005.safetensors",
     "model.layers.17.self_attn.o_proj.weight.absmax": "model-00003-of-00005.safetensors",
     "model.layers.17.self_attn.o_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
     "model.layers.17.self_attn.o_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
     "model.layers.17.self_attn.o_proj.weight.quant_map": "model-00003-of-00005.safetensors",
     "model.layers.17.self_attn.o_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
+    "model.layers.17.self_attn.q_proj.bias": "model-00003-of-00005.safetensors",
+    "model.layers.17.self_attn.q_proj.weight": "model-00003-of-00005.safetensors",
+    "model.layers.17.self_attn.q_proj.weight.absmax": "model-00003-of-00005.safetensors",
+    "model.layers.17.self_attn.q_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
+    "model.layers.17.self_attn.q_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
+    "model.layers.17.self_attn.q_proj.weight.quant_map": "model-00003-of-00005.safetensors",
+    "model.layers.17.self_attn.q_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
+    "model.layers.17.self_attn.v_proj.bias": "model-00003-of-00005.safetensors",
+    "model.layers.17.self_attn.v_proj.weight": "model-00003-of-00005.safetensors",
+    "model.layers.17.self_attn.v_proj.weight.absmax": "model-00003-of-00005.safetensors",
+    "model.layers.17.self_attn.v_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
+    "model.layers.17.self_attn.v_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
+    "model.layers.17.self_attn.v_proj.weight.quant_map": "model-00003-of-00005.safetensors",
+    "model.layers.17.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
     "model.layers.18.input_layernorm.weight": "model-00003-of-00005.safetensors",
     "model.layers.18.mlp.down_proj.weight": "model-00003-of-00005.safetensors",
     "model.layers.18.mlp.down_proj.weight.absmax": "model-00003-of-00005.safetensors",
     "model.layers.21.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
     "model.layers.22.input_layernorm.weight": "model-00003-of-00005.safetensors",
     "model.layers.22.mlp.down_proj.weight": "model-00003-of-00005.safetensors",
+    "model.layers.22.mlp.down_proj.weight.absmax": "model-00003-of-00005.safetensors",
+    "model.layers.22.mlp.down_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
+    "model.layers.22.mlp.down_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
+    "model.layers.22.mlp.down_proj.weight.quant_map": "model-00003-of-00005.safetensors",
+    "model.layers.22.mlp.down_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
     "model.layers.22.mlp.gate_proj.weight": "model-00003-of-00005.safetensors",
+    "model.layers.22.mlp.gate_proj.weight.absmax": "model-00003-of-00005.safetensors",
+    "model.layers.22.mlp.gate_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
+    "model.layers.22.mlp.gate_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
+    "model.layers.22.mlp.gate_proj.weight.quant_map": "model-00003-of-00005.safetensors",
+    "model.layers.22.mlp.gate_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
     "model.layers.22.mlp.up_proj.weight": "model-00003-of-00005.safetensors",
+    "model.layers.22.mlp.up_proj.weight.absmax": "model-00003-of-00005.safetensors",
+    "model.layers.22.mlp.up_proj.weight.nested_absmax": "model-00003-of-00005.safetensors",
+    "model.layers.22.mlp.up_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
+    "model.layers.22.mlp.up_proj.weight.quant_map": "model-00003-of-00005.safetensors",
+    "model.layers.22.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
     "model.layers.22.post_attention_layernorm.weight": "model-00003-of-00005.safetensors",
     "model.layers.22.self_attn.k_proj.bias": "model-00003-of-00005.safetensors",
     "model.layers.22.self_attn.k_proj.weight": "model-00003-of-00005.safetensors",
     "model.layers.30.self_attn.v_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
     "model.layers.30.self_attn.v_proj.weight.quant_map": "model-00003-of-00005.safetensors",
     "model.layers.30.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
+    "model.layers.31.input_layernorm.weight": "model-00004-of-00005.safetensors",
+    "model.layers.31.mlp.down_proj.weight": "model-00004-of-00005.safetensors",
+    "model.layers.31.mlp.down_proj.weight.absmax": "model-00004-of-00005.safetensors",
+    "model.layers.31.mlp.down_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
+    "model.layers.31.mlp.down_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.31.mlp.down_proj.weight.quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.31.mlp.down_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
+    "model.layers.31.mlp.gate_proj.weight": "model-00004-of-00005.safetensors",
+    "model.layers.31.mlp.gate_proj.weight.absmax": "model-00004-of-00005.safetensors",
+    "model.layers.31.mlp.gate_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
+    "model.layers.31.mlp.gate_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.31.mlp.gate_proj.weight.quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.31.mlp.gate_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
+    "model.layers.31.mlp.up_proj.weight": "model-00004-of-00005.safetensors",
+    "model.layers.31.mlp.up_proj.weight.absmax": "model-00004-of-00005.safetensors",
+    "model.layers.31.mlp.up_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
+    "model.layers.31.mlp.up_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.31.mlp.up_proj.weight.quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.31.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
+    "model.layers.31.post_attention_layernorm.weight": "model-00004-of-00005.safetensors",
     "model.layers.31.self_attn.k_proj.bias": "model-00003-of-00005.safetensors",
     "model.layers.31.self_attn.k_proj.weight": "model-00003-of-00005.safetensors",
     "model.layers.31.self_attn.k_proj.weight.absmax": "model-00003-of-00005.safetensors",
     "model.layers.31.self_attn.k_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
     "model.layers.31.self_attn.k_proj.weight.quant_map": "model-00003-of-00005.safetensors",
     "model.layers.31.self_attn.k_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
+    "model.layers.31.self_attn.o_proj.weight": "model-00004-of-00005.safetensors",
+    "model.layers.31.self_attn.o_proj.weight.absmax": "model-00004-of-00005.safetensors",
+    "model.layers.31.self_attn.o_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
+    "model.layers.31.self_attn.o_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.31.self_attn.o_proj.weight.quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.31.self_attn.o_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
     "model.layers.31.self_attn.q_proj.bias": "model-00003-of-00005.safetensors",
     "model.layers.31.self_attn.q_proj.weight": "model-00003-of-00005.safetensors",
     "model.layers.31.self_attn.q_proj.weight.absmax": "model-00003-of-00005.safetensors",
     "model.layers.31.self_attn.v_proj.weight.nested_quant_map": "model-00003-of-00005.safetensors",
     "model.layers.31.self_attn.v_proj.weight.quant_map": "model-00003-of-00005.safetensors",
     "model.layers.31.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00003-of-00005.safetensors",
+    "model.layers.32.input_layernorm.weight": "model-00004-of-00005.safetensors",
+    "model.layers.32.mlp.down_proj.weight": "model-00004-of-00005.safetensors",
+    "model.layers.32.mlp.down_proj.weight.absmax": "model-00004-of-00005.safetensors",
+    "model.layers.32.mlp.down_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
+    "model.layers.32.mlp.down_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.32.mlp.down_proj.weight.quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.32.mlp.down_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
+    "model.layers.32.mlp.gate_proj.weight": "model-00004-of-00005.safetensors",
+    "model.layers.32.mlp.gate_proj.weight.absmax": "model-00004-of-00005.safetensors",
+    "model.layers.32.mlp.gate_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
+    "model.layers.32.mlp.gate_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.32.mlp.gate_proj.weight.quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.32.mlp.gate_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
+    "model.layers.32.mlp.up_proj.weight": "model-00004-of-00005.safetensors",
+    "model.layers.32.mlp.up_proj.weight.absmax": "model-00004-of-00005.safetensors",
+    "model.layers.32.mlp.up_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
+    "model.layers.32.mlp.up_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.32.mlp.up_proj.weight.quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.32.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
+    "model.layers.32.post_attention_layernorm.weight": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.k_proj.bias": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.k_proj.weight": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.k_proj.weight.absmax": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.k_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.k_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.k_proj.weight.quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.k_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.o_proj.weight": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.o_proj.weight.absmax": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.o_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.o_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.o_proj.weight.quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.o_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.q_proj.bias": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.q_proj.weight": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.q_proj.weight.absmax": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.q_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.q_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.q_proj.weight.quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.q_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.v_proj.bias": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.v_proj.weight": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.v_proj.weight.absmax": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.v_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.v_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.v_proj.weight.quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.32.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
+    "model.layers.33.input_layernorm.weight": "model-00004-of-00005.safetensors",
+    "model.layers.33.mlp.down_proj.weight": "model-00004-of-00005.safetensors",
+    "model.layers.33.mlp.down_proj.weight.absmax": "model-00004-of-00005.safetensors",
+    "model.layers.33.mlp.down_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
+    "model.layers.33.mlp.down_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.33.mlp.down_proj.weight.quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.33.mlp.down_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
+    "model.layers.33.mlp.gate_proj.weight": "model-00004-of-00005.safetensors",
+    "model.layers.33.mlp.gate_proj.weight.absmax": "model-00004-of-00005.safetensors",
+    "model.layers.33.mlp.gate_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
+    "model.layers.33.mlp.gate_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.33.mlp.gate_proj.weight.quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.33.mlp.gate_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
+    "model.layers.33.mlp.up_proj.weight": "model-00004-of-00005.safetensors",
+    "model.layers.33.mlp.up_proj.weight.absmax": "model-00004-of-00005.safetensors",
+    "model.layers.33.mlp.up_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
+    "model.layers.33.mlp.up_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.33.mlp.up_proj.weight.quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.33.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
+    "model.layers.33.post_attention_layernorm.weight": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.k_proj.bias": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.k_proj.weight": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.k_proj.weight.absmax": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.k_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.k_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.k_proj.weight.quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.k_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.o_proj.weight": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.o_proj.weight.absmax": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.o_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.o_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.o_proj.weight.quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.o_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.q_proj.bias": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.q_proj.weight": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.q_proj.weight.absmax": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.q_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.q_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.q_proj.weight.quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.q_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.v_proj.bias": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.v_proj.weight": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.v_proj.weight.absmax": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.v_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.v_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.v_proj.weight.quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.33.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
     "model.layers.34.input_layernorm.weight": "model-00004-of-00005.safetensors",
     "model.layers.34.mlp.down_proj.weight": "model-00004-of-00005.safetensors",
     "model.layers.34.mlp.down_proj.weight.absmax": "model-00004-of-00005.safetensors",
     "model.layers.34.mlp.down_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
     "model.layers.34.mlp.down_proj.weight.quant_map": "model-00004-of-00005.safetensors",
     "model.layers.34.mlp.down_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
+    "model.layers.34.mlp.gate_proj.weight": "model-00004-of-00005.safetensors",
+    "model.layers.34.mlp.gate_proj.weight.absmax": "model-00004-of-00005.safetensors",
+    "model.layers.34.mlp.gate_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
+    "model.layers.34.mlp.gate_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.34.mlp.gate_proj.weight.quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.34.mlp.gate_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
     "model.layers.34.mlp.up_proj.weight": "model-00004-of-00005.safetensors",
     "model.layers.34.mlp.up_proj.weight.absmax": "model-00004-of-00005.safetensors",
     "model.layers.34.mlp.up_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
     "model.layers.34.mlp.up_proj.weight.quant_map": "model-00004-of-00005.safetensors",
     "model.layers.34.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
     "model.layers.34.post_attention_layernorm.weight": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.k_proj.bias": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.k_proj.weight": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.k_proj.weight.absmax": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.k_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.k_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.k_proj.weight.quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.k_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.o_proj.weight": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.o_proj.weight.absmax": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.o_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.o_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.o_proj.weight.quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.o_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.q_proj.bias": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.q_proj.weight": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.q_proj.weight.absmax": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.q_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.q_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.q_proj.weight.quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.q_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.v_proj.bias": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.v_proj.weight": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.v_proj.weight.absmax": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.v_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.v_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.v_proj.weight.quant_map": "model-00004-of-00005.safetensors",
+    "model.layers.34.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
     "model.layers.35.input_layernorm.weight": "model-00004-of-00005.safetensors",
     "model.layers.35.mlp.down_proj.weight": "model-00004-of-00005.safetensors",
     "model.layers.35.mlp.down_proj.weight.absmax": "model-00004-of-00005.safetensors",
     "model.layers.49.self_attn.v_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
     "model.layers.49.self_attn.v_proj.weight.quant_map": "model-00004-of-00005.safetensors",
     "model.layers.49.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
+    "model.layers.5.input_layernorm.weight": "model-00002-of-00005.safetensors",
+    "model.layers.5.mlp.down_proj.weight": "model-00002-of-00005.safetensors",
     "model.layers.5.mlp.gate_proj.weight": "model-00001-of-00005.safetensors",
     "model.layers.5.mlp.up_proj.weight": "model-00001-of-00005.safetensors",
+    "model.layers.5.post_attention_layernorm.weight": "model-00002-of-00005.safetensors",
     "model.layers.5.self_attn.k_proj.bias": "model-00001-of-00005.safetensors",
     "model.layers.5.self_attn.k_proj.weight": "model-00001-of-00005.safetensors",
     "model.layers.5.self_attn.o_proj.weight": "model-00001-of-00005.safetensors",
     "model.layers.5.self_attn.q_proj.bias": "model-00001-of-00005.safetensors",
     "model.layers.5.self_attn.q_proj.weight": "model-00001-of-00005.safetensors",
     "model.layers.5.self_attn.v_proj.bias": "model-00001-of-00005.safetensors",
     "model.layers.5.self_attn.v_proj.weight": "model-00001-of-00005.safetensors",
+    "model.layers.50.input_layernorm.weight": "model-00005-of-00005.safetensors",
+    "model.layers.50.mlp.down_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.50.mlp.down_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.50.mlp.down_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.50.mlp.down_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.50.mlp.down_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.50.mlp.down_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
     "model.layers.50.mlp.gate_proj.weight": "model-00004-of-00005.safetensors",
     "model.layers.50.mlp.gate_proj.weight.absmax": "model-00004-of-00005.safetensors",
     "model.layers.50.mlp.gate_proj.weight.nested_absmax": "model-00004-of-00005.safetensors",
     "model.layers.50.mlp.up_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
     "model.layers.50.mlp.up_proj.weight.quant_map": "model-00004-of-00005.safetensors",
     "model.layers.50.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
+    "model.layers.50.post_attention_layernorm.weight": "model-00005-of-00005.safetensors",
     "model.layers.50.self_attn.k_proj.bias": "model-00004-of-00005.safetensors",
     "model.layers.50.self_attn.k_proj.weight": "model-00004-of-00005.safetensors",
     "model.layers.50.self_attn.k_proj.weight.absmax": "model-00004-of-00005.safetensors",
     "model.layers.50.self_attn.v_proj.weight.nested_quant_map": "model-00004-of-00005.safetensors",
     "model.layers.50.self_attn.v_proj.weight.quant_map": "model-00004-of-00005.safetensors",
     "model.layers.50.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00004-of-00005.safetensors",
+    "model.layers.51.input_layernorm.weight": "model-00005-of-00005.safetensors",
+    "model.layers.51.mlp.down_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.51.mlp.down_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.51.mlp.down_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.51.mlp.down_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.51.mlp.down_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.51.mlp.down_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
+    "model.layers.51.mlp.gate_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.51.mlp.gate_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.51.mlp.gate_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.51.mlp.gate_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.51.mlp.gate_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.51.mlp.gate_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
+    "model.layers.51.mlp.up_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.51.mlp.up_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.51.mlp.up_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.51.mlp.up_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.51.mlp.up_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.51.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
+    "model.layers.51.post_attention_layernorm.weight": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.k_proj.bias": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.k_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.k_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.k_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.k_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.k_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.k_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.o_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.o_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.o_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.o_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.o_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.o_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.q_proj.bias": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.q_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.q_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.q_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.q_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.q_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.q_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.v_proj.bias": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.v_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.v_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.v_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.v_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.v_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.51.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
+    "model.layers.52.input_layernorm.weight": "model-00005-of-00005.safetensors",
+    "model.layers.52.mlp.down_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.52.mlp.down_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.52.mlp.down_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.52.mlp.down_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.52.mlp.down_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.52.mlp.down_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
+    "model.layers.52.mlp.gate_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.52.mlp.gate_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.52.mlp.gate_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.52.mlp.gate_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.52.mlp.gate_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.52.mlp.gate_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
+    "model.layers.52.mlp.up_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.52.mlp.up_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.52.mlp.up_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.52.mlp.up_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.52.mlp.up_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.52.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
+    "model.layers.52.post_attention_layernorm.weight": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.k_proj.bias": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.k_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.k_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.k_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.k_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.k_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.k_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.o_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.o_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.o_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.o_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.o_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.o_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.q_proj.bias": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.q_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.q_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.q_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.q_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.q_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.q_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.v_proj.bias": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.v_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.v_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.v_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.v_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.v_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.52.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
+    "model.layers.53.input_layernorm.weight": "model-00005-of-00005.safetensors",
+    "model.layers.53.mlp.down_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.53.mlp.down_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.53.mlp.down_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.53.mlp.down_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.53.mlp.down_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.53.mlp.down_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
+    "model.layers.53.mlp.gate_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.53.mlp.gate_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.53.mlp.gate_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.53.mlp.gate_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.53.mlp.gate_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.53.mlp.gate_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
+    "model.layers.53.mlp.up_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.53.mlp.up_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.53.mlp.up_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.53.mlp.up_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.53.mlp.up_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.53.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
+    "model.layers.53.post_attention_layernorm.weight": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.k_proj.bias": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.k_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.k_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.k_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.k_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.k_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.k_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.o_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.o_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.o_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.o_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.o_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.o_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.q_proj.bias": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.q_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.q_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.q_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.q_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.q_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.q_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.v_proj.bias": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.v_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.v_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.v_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.v_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.v_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.53.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
     "model.layers.54.input_layernorm.weight": "model-00005-of-00005.safetensors",
     "model.layers.54.mlp.down_proj.weight": "model-00005-of-00005.safetensors",
     "model.layers.54.mlp.down_proj.weight.absmax": "model-00005-of-00005.safetensors",
     "model.layers.54.mlp.up_proj.weight.quant_map": "model-00005-of-00005.safetensors",
     "model.layers.54.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
     "model.layers.54.post_attention_layernorm.weight": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.k_proj.bias": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.k_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.k_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.k_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.k_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.k_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.k_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.o_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.o_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.o_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.o_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.o_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.o_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.q_proj.bias": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.q_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.q_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.q_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.q_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.q_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.q_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.v_proj.bias": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.v_proj.weight": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.v_proj.weight.absmax": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.v_proj.weight.nested_absmax": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.v_proj.weight.nested_quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.v_proj.weight.quant_map": "model-00005-of-00005.safetensors",
+    "model.layers.54.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
     "model.layers.55.input_layernorm.weight": "model-00005-of-00005.safetensors",
     "model.layers.55.mlp.down_proj.weight": "model-00005-of-00005.safetensors",
     "model.layers.55.mlp.down_proj.weight.absmax": "model-00005-of-00005.safetensors",
     "model.layers.59.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
     "model.layers.6.input_layernorm.weight": "model-00002-of-00005.safetensors",
     "model.layers.6.mlp.down_proj.weight": "model-00002-of-00005.safetensors",
+    "model.layers.6.mlp.gate_proj.weight": "model-00002-of-00005.safetensors",
     "model.layers.6.mlp.up_proj.weight": "model-00002-of-00005.safetensors",
     "model.layers.6.post_attention_layernorm.weight": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.k_proj.bias": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.k_proj.weight": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.k_proj.weight.absmax": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.k_proj.weight.nested_absmax": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.k_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.k_proj.weight.quant_map": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.k_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.o_proj.weight": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.o_proj.weight.absmax": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.o_proj.weight.nested_absmax": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.o_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.o_proj.weight.quant_map": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.o_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.q_proj.bias": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.q_proj.weight": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.q_proj.weight.absmax": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.q_proj.weight.nested_absmax": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.q_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.q_proj.weight.quant_map": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.q_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.v_proj.bias": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.v_proj.weight": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.v_proj.weight.absmax": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.v_proj.weight.nested_absmax": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.v_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.v_proj.weight.quant_map": "model-00002-of-00005.safetensors",
+    "model.layers.6.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
     "model.layers.60.input_layernorm.weight": "model-00005-of-00005.safetensors",
     "model.layers.60.mlp.down_proj.weight": "model-00005-of-00005.safetensors",
     "model.layers.60.mlp.down_proj.weight.absmax": "model-00005-of-00005.safetensors",
     "model.layers.63.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00005-of-00005.safetensors",
     "model.layers.7.input_layernorm.weight": "model-00002-of-00005.safetensors",
     "model.layers.7.mlp.down_proj.weight": "model-00002-of-00005.safetensors",
+    "model.layers.7.mlp.down_proj.weight.absmax": "model-00002-of-00005.safetensors",
+    "model.layers.7.mlp.down_proj.weight.nested_absmax": "model-00002-of-00005.safetensors",
+    "model.layers.7.mlp.down_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
+    "model.layers.7.mlp.down_proj.weight.quant_map": "model-00002-of-00005.safetensors",
+    "model.layers.7.mlp.down_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
     "model.layers.7.mlp.gate_proj.weight": "model-00002-of-00005.safetensors",
+    "model.layers.7.mlp.gate_proj.weight.absmax": "model-00002-of-00005.safetensors",
+    "model.layers.7.mlp.gate_proj.weight.nested_absmax": "model-00002-of-00005.safetensors",
+    "model.layers.7.mlp.gate_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
+    "model.layers.7.mlp.gate_proj.weight.quant_map": "model-00002-of-00005.safetensors",
+    "model.layers.7.mlp.gate_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
     "model.layers.7.mlp.up_proj.weight": "model-00002-of-00005.safetensors",
+    "model.layers.7.mlp.up_proj.weight.absmax": "model-00002-of-00005.safetensors",
+    "model.layers.7.mlp.up_proj.weight.nested_absmax": "model-00002-of-00005.safetensors",
+    "model.layers.7.mlp.up_proj.weight.nested_quant_map": "model-00002-of-00005.safetensors",
+    "model.layers.7.mlp.up_proj.weight.quant_map": "model-00002-of-00005.safetensors",
+    "model.layers.7.mlp.up_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
     "model.layers.7.post_attention_layernorm.weight": "model-00002-of-00005.safetensors",
     "model.layers.7.self_attn.k_proj.bias": "model-00002-of-00005.safetensors",
     "model.layers.7.self_attn.k_proj.weight": "model-00002-of-00005.safetensors",
     "model.layers.7.self_attn.v_proj.weight.quant_state.bitsandbytes__nf4": "model-00002-of-00005.safetensors",
     "model.layers.8.input_layernorm.weight": "model-00002-of-00005.safetensors",
     "model.layers.8.mlp.down_proj.weight": "model-00002-of-00005.safetensors",
     "model.layers.8.mlp.gate_proj.weight": "model-00002-of-00005.safetensors",
     "model.layers.8.mlp.up_proj.weight": "model-00002-of-00005.safetensors",
     "model.layers.8.post_attention_layernorm.weight": "model-00002-of-00005.safetensors",
     "model.layers.8.self_attn.k_proj.bias": "model-00002-of-00005.safetensors",
     "model.layers.8.self_attn.k_proj.weight": "model-00002-of-00005.safetensors",

tokenizer_config.json CHANGED Viewed

@@ -195,16 +195,16 @@
     "<|video_pad|>"
   ],
   "bos_token": null,
-  "chat_template": "{%- if tools %}\n    {{- '<|im_start|>system\\n' }}\n    {%- if messages[0]['role'] == 'system' %}\n        {{- messages[0]['content'] }}\n    {%- else %}\n        {{- 'You are a helpful assistant.' }}\n    {%- endif %}\n    {{- \"\\n\\n# Tools\\n\\nYou may call one or more functions to assist with the user query.\\n\\nYou are provided with function signatures within <tools></tools> XML tags:\\n<tools>\" }}\n    {%- for tool in tools %}\n        {{- \"\\n\" }}\n        {{- tool | tojson }}\n    {%- endfor %}\n    {{- \"\\n</tools>\\n\\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\\n<tool_call>\\n{\\\"name\\\": <function-name>, \\\"arguments\\\": <args-json-object>}\\n</tool_call><|im_end|>\\n\" }}\n{%- else %}\n    {%- if messages[0]['role'] == 'system' %}\n        {{- '<|im_start|>system\\n' + messages[0]['content'] + '<|im_end|>\\n' }}\n    {%- else %}\n        {{- '<|im_start|>system\\nYou are a helpful assistant.<|im_end|>\\n' }}\n    {%- endif %}\n{%- endif %}\n{%- for message in messages %}\n    {%- if (message.role == \"user\") or (message.role == \"system\" and not loop.first) or (message.role == \"assistant\" and not message.tool_calls) %}\n        {{- '<|im_start|>' + message.role + '\\n' + message.content + '<|im_end|>' + '\\n' }}\n    {%- elif message.role == \"assistant\" %}\n        {{- '<|im_start|>' + message.role }}\n        {%- if message.content %}\n            {{- '\\n' + message.content }}\n        {%- endif %}\n        {%- for tool_call in message.tool_calls %}\n            {%- if tool_call.function is defined %}\n                {%- set tool_call = tool_call.function %}\n            {%- endif %}\n            {{- '\\n<tool_call>\\n{\"name\": \"' }}\n            {{- tool_call.name }}\n            {{- '\", \"arguments\": ' }}\n            {{- tool_call.arguments | tojson }}\n            {{- '}\\n</tool_call>' }}\n        {%- endfor %}\n        {{- '<|im_end|>\\n' }}\n    {%- elif message.role == \"tool\" %}\n        {%- if (loop.index0 == 0) or (messages[loop.index0 - 1].role != \"tool\") %}\n            {{- '<|im_start|>user' }}\n        {%- endif %}\n        {{- '\\n<tool_response>\\n' }}\n        {{- message.content }}\n        {{- '\\n</tool_response>' }}\n        {%- if loop.last or (messages[loop.index0 + 1].role != \"tool\") %}\n            {{- '<|im_end|>\\n' }}\n        {%- endif %}\n    {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n    {{- '<|im_start|>assistant\\n' }}\n{%- endif %}\n",
   "clean_up_tokenization_spaces": false,
   "eos_token": "<|im_end|>",
   "errors": "replace",
   "extra_special_tokens": {},
-  "model_max_length": 32768,
   "pad_token": "<|vision_pad|>",
   "padding_side": "left",
   "processor_class": "Qwen2_5_VLProcessor",
   "split_special_tokens": false,
   "tokenizer_class": "Qwen2Tokenizer",
-  "unk_token": null
-}

     "<|video_pad|>"
   ],
   "bos_token": null,
   "clean_up_tokenization_spaces": false,
   "eos_token": "<|im_end|>",
   "errors": "replace",
   "extra_special_tokens": {},
+  "model_max_length": 128000,
   "pad_token": "<|vision_pad|>",
   "padding_side": "left",
   "processor_class": "Qwen2_5_VLProcessor",
   "split_special_tokens": false,
   "tokenizer_class": "Qwen2Tokenizer",
+  "unk_token": null,
+  "chat_template": "{% set image_count = namespace(value=0) %}{% set video_count = namespace(value=0) %}{% for message in messages %}{% if loop.first and message['role'] != 'system' %}<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n{% endif %}<|im_start|>{{ message['role'] }}\n{% if message['content'] is string %}{{ message['content'] }}<|im_end|>\n{% else %}{% for content in message['content'] %}{% if content['type'] == 'image' or 'image' in content or 'image_url' in content %}{% set image_count.value = image_count.value + 1 %}{% if add_vision_id %}Picture {{ image_count.value }}: {% endif %}<|vision_start|><|image_pad|><|vision_end|>{% elif content['type'] == 'video' or 'video' in content %}{% set video_count.value = video_count.value + 1 %}{% if add_vision_id %}Video {{ video_count.value }}: {% endif %}<|vision_start|><|video_pad|><|vision_end|>{% elif 'text' in content %}{{ content['text'] }}{% endif %}{% endfor %}<|im_end|>\n{% endif %}{% endfor %}{% if add_generation_prompt %}<|im_start|>assistant\n{% endif %}"
+}