scottto committed 12 days ago

Commit

0aed1d9

1 Parent(s): f816f6a

add quantized weights

Browse files

Files changed (37) hide show

.gitattributes +1 -0
LICENSE +21 -0
README.md +115 -3
mlc-chat-config.json +76 -0
ndarray-cache.json +0 -0
params_shard_0.bin +3 -0
params_shard_1.bin +3 -0
params_shard_10.bin +3 -0
params_shard_11.bin +3 -0
params_shard_12.bin +3 -0
params_shard_13.bin +3 -0
params_shard_14.bin +3 -0
params_shard_15.bin +3 -0
params_shard_16.bin +3 -0
params_shard_17.bin +3 -0
params_shard_18.bin +3 -0
params_shard_19.bin +3 -0
params_shard_2.bin +3 -0
params_shard_20.bin +3 -0
params_shard_21.bin +3 -0
params_shard_22.bin +3 -0
params_shard_23.bin +3 -0
params_shard_24.bin +3 -0
params_shard_25.bin +3 -0
params_shard_26.bin +3 -0
params_shard_27.bin +3 -0
params_shard_28.bin +3 -0
params_shard_29.bin +3 -0
params_shard_3.bin +3 -0
params_shard_4.bin +3 -0
params_shard_5.bin +3 -0
params_shard_6.bin +3 -0
params_shard_7.bin +3 -0
params_shard_8.bin +3 -0
params_shard_9.bin +3 -0
tokenizer.json +3 -0
tokenizer_config.json +195 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text

LICENSE ADDED Viewed

	@@ -0,0 +1,21 @@

+MIT License
+Copyright (c) 2025 Agentica
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.

README.md CHANGED Viewed

@@ -1,3 +1,115 @@
----
-license: mit
----

+---
+license: mit
+library_name: transformers
+datasets:
+- AI-MO/NuminaMath-CoT
+- KbsdJames/Omni-MATH
+- RUC-AIBOX/STILL-3-Preview-RL-Data
+- hendrycks/competition_math
+language:
+- en
+base_model:
+- deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B
+---
+<div align="center">
+<span style="font-family: default; font-size: 1.5em;">DeepScaleR-1.5B-Preview</span>
+<div>
+🚀 Democratizing Reinforcement Learning for LLMs 🌟
+</div>
+</div>
+<br>
+<div align="center" style="line-height: 1;">
+  <a href="https://github.com/agentica-project/deepscaler" style="margin: 2px;">
+    <img alt="Code" src="https://img.shields.io/badge/DeepScaleR-000000?style=for-the-badge&logo=github&logoColor=000&logoColor=white" style="display: inline-block; vertical-align: middle;"/>
+  </a>
+  <a href="https://pretty-radio-b75.notion.site/DeepScaleR-Surpassing-O1-Preview-with-a-1-5B-Model-by-Scaling-RL-19681902c1468005bed8ca303013a4e2" target="_blank" style="margin: 2px;">
+    <img alt="Blog" src="https://img.shields.io/badge/Notion-%23000000.svg?style=for-the-badge&logo=notion&logoColor=white" style="display: inline-block; vertical-align: middle;"/>
+  </a>
+  <a href="https://x.com/Agentica_/status/1889006266661617779" style="margin: 2px;">
+    <img alt="X.ai" src="https://img.shields.io/badge/Agentica-white?style=for-the-badge&logo=X&logoColor=000&color=000&labelColor=white" style="display: inline-block; vertical-align: middle;"/>
+  </a>
+  <a href="https://huggingface.co/agentica-org" style="margin: 2px;">
+    <img alt="Hugging Face" src="https://img.shields.io/badge/Agentica-fcd022?style=for-the-badge&logo=huggingface&logoColor=000&labelColor" style="display: inline-block; vertical-align: middle;"/>
+  </a>
+</div>
+## DeepScaleR Overview
+DeepScaleR-1.5B-Preview is a language model fine-tuned from DeepSeek-R1-Distill-Qwen-1.5B using distributed reinforcement learning (RL) to scale up to long context lengths. The model achieves 43.1% Pass@1 accuracy on AIME 2024, a 14.3 percentage-point improvement over the base model (28.8%), and surpasses OpenAI's O1-Preview performance with just 1.5B parameters.
+## Data
+Our training dataset consists of approximately 40,000 unique problem-answer pairs compiled from:
+- AIME problems (1984-2023)
+- AMC problems (prior to 2023)
+- Omni-MATH dataset
+- Still dataset
+## Training Recipe
+We employ DeepSeek's Group Relative Policy Optimization (GRPO), a simplified RL algorithm that extends PPO by:
+- Normalizing advantage function over all samples generated from the same prompt.
+- Applying KL divergence regularization on top of PPO's surrogate loss to prevent significant policy drift.
+**Reward Function**: Our reward function is simple but effective:
+- 1 for correct answers passing LaTeX/Sympy checks
+- 0 for incorrect or improperly formatted answers
+- Note: No partial rewards (such as PRMs) or intermediate feedback.
+**Iterative Context Lengthening**: A key challenge in scaling RL for reasoning is compute cost. Our approach trains models with progressively longer contexts as the model improves, thus reducing both monetary cost and end-to-end training time:
+- Initial 8K Context (0-1040 steps):
+    - 22.9% -> 33% Pass@1 on AIME 2024
+    - Trained on 8 A100-80GB GPUs, BS= (Prompts) * (Samples/Prompt) = 128 * 8 = 1024
+- Extended to 16K (steps 1040-1520):
+    - 33% -> 43% Pass@1 on AIME 2024
+    - Trained on 32 A100-80GB GPUs, BS= (Prompts) * (Samples/Prompt) = 128 * 16 = 2048
+- Further extended to 24K (step 1520+):
+    - 38% -> 43% Pass@1 on AIME 2024
+    - Trained on 32 A100-80GB GPUs, BS= (Prompts) * (Samples/Prompt) = 128 * 16 = 2048
+    - Significant improvements within <200 steps
+A more detailed description of the training recipe can be found in our [blog post](https://pretty-radio-b75.notion.site/DeepScaleR-Surpassing-O1-Preview-with-a-1-5B-Model-by-Scaling-RL-19681902c1468005bed8ca303013a4e2).
+## Evaluation
+We report Pass@1 accuracy averaged over 16 samples for each problem.
+| Model | AIME 2024 | MATH 500 | AMC 2023 | Minerva Math | OlympiadBench | Avg. |
+|-------|-----------|-----------|-----------|--------------|---------------|------|
+| Qwen2.5-7B-Instruct | 13.3 | 79.8 | 50.6 | 34.6 | 40.7 | 43.8 |
+| rStar-Math-7B | 26.7 | 78.4 | 47.5 | - | 47.1 | - |
+| Eurus-2-7B-PRIME | 26.7 | 79.2 | 57.8 | 38.6 | 42.1 | 48.9 |
+| Qwen2.5-7B-SimpleRL | 26.7 | 82.4 | 62.5 | <strong>39.7</strong> | 43.3 | 50.9 |
+| DeepSeek-R1-Distill-Qwen-1.5B | 28.8 | 82.8 | 62.9 | 26.5 | 43.3 | 48.9 |
+| Still-1.5B | 32.5 | 84.4 | 66.7 | 29.0 | 45.4 | 51.6 |
+| <strong>DeepScaleR-1.5B-Preview</strong> | <strong>43.1</strong> | <strong>87.8</strong> | <strong>73.6</strong> | 30.2 | <strong>50.0</strong> | <strong>57.0</strong> |
+| O1-Preview | 40.0 | 81.4 | - | - | - | - |
+## Serving DeepScaleR
+Our model can be served using popular high-performance inference systems:
+- vLLM
+- Hugging Face Text Generation Inference (TGI)
+- SGLang
+- TensorRT-LLM
+All these systems support the OpenAI Chat Completions API format.
+## License
+This project is released under the MIT License, reflecting our commitment to open and accessible AI development.
+We believe in democratizing AI technology by making our work freely available for anyone to use, modify, and build upon.
+This permissive license ensures that researchers, developers, and enthusiasts worldwide can leverage and extend our work without restrictions, fostering innovation and collaboration in the AI community.
+## Acknowledgement
+- Our training experiments are powered by our heavily modified fork of [Verl](https://github.com/agentica-project/verl), an open-source RLHF library.
+- Our model is trained on top of [`DeepSeek-R1-Distill-Qwen-1.5B`](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B).
+- Our work is done as part of [Berkeley Sky Computing Lab](https://skycomputing.berkeley.edu/) and [Berkeley AI Research](https://bair.berkeley.edu/).
+## Citation
+```bibtex
+@misc{deepscaler2025,
+  title={DeepScaleR: Surpassing O1-Preview with a 1.5B Model by Scaling RL},
+  author={Michael Luo and Sijun Tan and Justin Wong and Xiaoxiang Shi and William Tang and Manan Roongta and Colin Cai and Jeffrey Luo and Tianjun Zhang and Erran Li and Raluca Ada Popa and Ion Stoica},
+  year={2025},
+  howpublished={\url{https://pretty-radio-b75.notion.site/DeepScaleR-Surpassing-O1-Preview-with-a-1-5B-Model-by-Scaling-RL-19681902c1468005bed8ca303013a4e2}},
+  note={Notion Blog}
+}
+```

mlc-chat-config.json ADDED Viewed

	@@ -0,0 +1,76 @@

+{
+  "version": "0.1.0",
+  "model_type": "qwen2",
+  "quantization": "q4f16_1",
+  "model_config": {
+    "hidden_act": "silu",
+    "hidden_size": 1536,
+    "intermediate_size": 8960,
+    "num_attention_heads": 12,
+    "num_hidden_layers": 28,
+    "num_key_value_heads": 2,
+    "rms_norm_eps": 1e-06,
+    "rope_theta": 10000,
+    "vocab_size": 151936,
+    "tie_word_embeddings": false,
+    "context_window_size": 131072,
+    "prefill_chunk_size": 2048,
+    "tensor_parallel_shards": 1,
+    "head_dim": 128,
+    "dtype": "float32",
+    "max_batch_size": 80
+  },
+  "vocab_size": 151936,
+  "context_window_size": 131072,
+  "sliding_window_size": -1,
+  "prefill_chunk_size": 2048,
+  "attention_sink_size": -1,
+  "tensor_parallel_shards": 1,
+  "pipeline_parallel_stages": 1,
+  "temperature": 0.6,
+  "presence_penalty": 0.0,
+  "frequency_penalty": 0.0,
+  "repetition_penalty": 1.0,
+  "top_p": 0.95,
+  "tokenizer_files": [
+    "tokenizer.json",
+    "tokenizer_config.json"
+  ],
+  "tokenizer_info": {
+    "token_postproc_method": "byte_level",
+    "prepend_space_in_encode": false,
+    "strip_space_in_decode": false
+  },
+  "conv_template": {
+      "name": "deepseek_r1_qwen",
+      "system_template": "<\uff5cbegin\u2581of\u2581sentence\uff5c>{system_message}",
+      "system_message": "You are a helpful assistant.",
+      "system_prefix_token_ids": null,
+      "add_role_after_system_message": true,
+      "roles": {
+        "user": "<\uff5cUser\uff5c>",
+        "assistant": "<\uff5cAssistant\uff5c>"
+      },
+      "role_templates": {
+        "user": "{user_message}",
+        "assistant": "{assistant_message}",
+        "tool": "{tool_message}"
+      },
+      "messages": [],
+      "seps": [
+        "",
+        "<\uff5cend\u2581of\u2581sentence\uff5c>"
+      ],
+      "role_content_sep": "",
+      "role_empty_sep": "",
+      "stop_str": [],
+      "stop_token_ids": [
+        151643
+      ],
+      "function_string": "",
+      "use_function_calling": false
+    },
+  "pad_token_id": 151643,
+  "bos_token_id": 151646,
+  "eos_token_id": 151643
+}

ndarray-cache.json ADDED Viewed

The diff for this file is too large to render. See raw diff

params_shard_0.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:54a304bbe2da18a2642ec8b4457463ac2904ed72d67d8c789b2bb35d37502596
+size 116686848

params_shard_1.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:53ac65553153295811642f339e5c2d74cf327e78a7b15314f4e672aefc6df883
+size 30077952

params_shard_10.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b60fe0d7b2634dc3b8a22f328300b506e2d84bec99673c4bbb6be57253b77959
+size 27191296

params_shard_11.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6592208ffa1cc164b3e90104ff628fbd3a8ff454ed87b469b1d16a16a6b46be4
+size 26331136

params_shard_12.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:91c0dca8cf4ddc4eb0df09ddc41cd5c5af09ec6d81c9dcadcff3de666159d090
+size 26331136

params_shard_13.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ab3a3f1a66c86b268aa6b3a1a00d36e4a3008ab213279fa7564f62ea3623d525
+size 26331136

params_shard_14.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:812b2ec18af8816e3645881c62dc379097316ffef9f4d0da5583af9c66572d23
+size 26331136

params_shard_15.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:85994a5500bc011e42bd3a258d8ff42080356a90a83ae19314a62ff1b9aae59b
+size 26331136

params_shard_16.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:250f6ef520e4995c97dd4df271b103c952dfb650d5770fe593e86bf48ffaf0c2
+size 26331136

params_shard_17.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e56880551b0b149b24b8cba4f9ae64e67ff2dfd9a9fc14a9edf7a2ffec9fd843
+size 26331136

params_shard_18.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5af310bbfba22b2457d1ea0a5404b7fe213612c5cb6bc3a349a18013fd252894
+size 26331136

params_shard_19.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:baeb0a7195632a1891b142b8378c63de16824e93e68250a2778b8be5fa2ec7cb
+size 26331136

params_shard_2.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f9300cb0cfd012b89e45e4aee9de1cbf1fa20041a93edd1cf105f9efdae64a88
+size 26331136

params_shard_20.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:71a328ed80c930373df56fdd400c77e320cccb5ceab250bd0f9b0ff2ad1a32be
+size 26331136

params_shard_21.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6207aac0610aa9d275df2e159ee00178c22fc91d75ef0d9bbbe566ff8cab67c4
+size 26331136

params_shard_22.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8ed66b467587a2b9849d55a1a0921d71f5e180944a18e77a0c25b47bcbc54fc2
+size 32349184

params_shard_23.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dc32e3b7476336ce6f6f50941747fb9367b34c45e6f1f6b4e926ab98da516fa2
+size 31155200

params_shard_24.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0aa1bbd64b532885f0cd3a4953d13453f15c697d37f3f50ab8b15702b69087db
+size 33212416

params_shard_25.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:93b49befef6faf0cffe51d5c688c5e97fa26cf350b55eb1ed15e2673adeafc70
+size 27191296

params_shard_26.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0f324302b2b62e5d18cee3224c384f9280a1ba35a80b056c9a699ec874264094
+size 26331136

params_shard_27.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ee6cfea35aa350371cbd51af13100403c67d0c2b4ad9abde708b5a2e9c5176f1
+size 26331136

params_shard_28.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:685f3c5cb968ea6297d847634ed292ea39b7c1c5d1dadaa1d530690fb5151907
+size 26331136

params_shard_29.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:23d6037c97fe642776fca3b4b5734080cb822d79a8004a1cc9afc6e9e2841ed9
+size 18586624

params_shard_3.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8250007426e2105002651f2b4d211c23b3330ce0e6434742a3e2d191753f8bf2
+size 26331136

params_shard_4.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bb7a35f829061b3344cf3ae415e5f046c76ca462ec0203aee8aa692e2c10e3ef
+size 26331136

params_shard_5.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:93761ef26bd5145f957fefc94508b8a223baa7b16d23cb89415502f5c85ace5d
+size 26331136

params_shard_6.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4533d67d2564a08068af97efc0e748e4ff381b4f776ce800a1d4ad317a686a02
+size 26331136

params_shard_7.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cb48e34ad4670b766a3aab925108490990c92fd7f772c292b2e027b7011bec59
+size 116686848

params_shard_8.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ca59a548497ef92eef74ee207488c400603ff4b9c869498efcb48d59a48aca09
+size 33178624

params_shard_9.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e5c3e9f234f54311e76043f8de33de03a86b701ca756663e73572c50cffcc708
+size 33212416

tokenizer.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
+size 11422778

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,195 @@

+{
+  "add_bos_token": true,
+  "add_eos_token": false,
+  "add_prefix_space": null,
+  "added_tokens_decoder": {
+    "151643": {
+      "content": "<｜end▁of▁sentence｜>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151644": {
+      "content": "<｜User｜>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151645": {
+      "content": "<｜Assistant｜>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151646": {
+      "content": "<｜begin▁of▁sentence｜>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151647": {
+      "content": "<|EOT|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151648": {
+      "content": "<think>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151649": {
+      "content": "</think>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151650": {
+      "content": "<|quad_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151651": {
+      "content": "<|quad_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151652": {
+      "content": "<|vision_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151653": {
+      "content": "<|vision_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151654": {
+      "content": "<|vision_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151655": {
+      "content": "<|image_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151656": {
+      "content": "<|video_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151657": {
+      "content": "<tool_call>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151658": {
+      "content": "</tool_call>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151659": {
+      "content": "<|fim_prefix|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151660": {
+      "content": "<|fim_middle|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151661": {
+      "content": "<|fim_suffix|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151662": {
+      "content": "<|fim_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151663": {
+      "content": "<|repo_name|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151664": {
+      "content": "<|file_sep|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    }
+  },
+  "bos_token": "<｜begin▁of▁sentence｜>",
+  "chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% set ns = namespace(is_first=false, is_tool=false, is_output_first=true, system_prompt='') %}{%- for message in messages %}{%- if message['role'] == 'system' %}{% set ns.system_prompt = message['content'] %}{%- endif %}{%- endfor %}{{bos_token}}{{ns.system_prompt}}{%- for message in messages %}{%- if message['role'] == 'user' %}{%- set ns.is_tool = false -%}{{'<｜User｜>' + message['content']}}{%- endif %}{%- if message['role'] == 'assistant' and message['content'] is none %}{%- set ns.is_tool = false -%}{%- for tool in message['tool_calls']%}{%- if not ns.is_first %}{{'<｜Assistant｜><｜tool▁calls▁begin｜><｜tool▁call▁begin｜>' + tool['type'] + '<｜tool▁sep｜>' + tool['function']['name'] + '\\n' + '```json' + '\\n' + tool['function']['arguments'] + '\\n' + '```' + '<｜tool▁call▁end｜>'}}{%- set ns.is_first = true -%}{%- else %}{{'\\n' + '<｜tool▁call▁begin｜>' + tool['type'] + '<｜tool▁sep｜>' + tool['function']['name'] + '\\n' + '```json' + '\\n' + tool['function']['arguments'] + '\\n' + '```' + '<｜tool▁call▁end｜>'}}{{'<｜tool▁calls▁end｜><｜end▁of▁sentence｜>'}}{%- endif %}{%- endfor %}{%- endif %}{%- if message['role'] == 'assistant' and message['content'] is not none %}{%- if ns.is_tool %}{{'<｜tool▁outputs▁end｜>' + message['content'] + '<｜end▁of▁sentence｜>'}}{%- set ns.is_tool = false -%}{%- else %}{% set content = message['content'] %}{% if '</think>' in content %}{% set content = content.split('</think>')[-1] %}{% endif %}{{'<｜Assistant｜>' + content + '<｜end▁of▁sentence｜>'}}{%- endif %}{%- endif %}{%- if message['role'] == 'tool' %}{%- set ns.is_tool = true -%}{%- if ns.is_output_first %}{{'<｜tool▁outputs▁begin｜><｜tool▁output▁begin｜>' + message['content'] + '<｜tool▁output▁end｜>'}}{%- set ns.is_output_first = false %}{%- else %}{{'\\n<｜tool▁output▁begin｜>' + message['content'] + '<｜tool▁output▁end｜>'}}{%- endif %}{%- endif %}{%- endfor -%}{% if ns.is_tool %}{{'<｜tool▁outputs▁end｜>'}}{% endif %}{% if add_generation_prompt and not ns.is_tool %}{{'<｜Assistant｜>'}}{% endif %}",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "<｜end▁of▁sentence｜>",
+  "extra_special_tokens": {},
+  "legacy": true,
+  "model_max_length": 16384,
+  "pad_token": "<｜end▁of▁sentence｜>",
+  "sp_model_kwargs": {},
+  "tokenizer_class": "LlamaTokenizer",
+  "unk_token": null,
+  "use_default_system_prompt": false
+}