diff --git a/.gitattributes b/.gitattributes
index a6344aac8c09253b3b630fb776ae94478aa0275b..52373fe24473b1aa44333d318f578ae6bf04b49b 100644
--- a/.gitattributes
+++ b/.gitattributes
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
*.zip filter=lfs diff=lfs merge=lfs -text
*.zst filter=lfs diff=lfs merge=lfs -text
*tfevents* filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text
diff --git a/README.md b/README.md
index 7be5fc7f47d5db027d120b8024982df93db95b74..d8dd05d76d41d426b46cba2a018415ed9596f3c1 100644
--- a/README.md
+++ b/README.md
@@ -1,3 +1,11 @@
---
+language:
+- en
license: mit
+base_model: deepseek-ai/DeepSeek-R1-Distill-Qwen-32B
+base_model_relation: quantized
+library_name: mlc-llm
+pipeline_tag: text-generation
---
+
+4-bit GPTQ quantized version of [DeepSeek-R1-Distill-Qwen-32B](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B) for inference with the [Private LLM](http://privatellm.app) app.
diff --git a/config.json b/config.json
new file mode 100644
index 0000000000000000000000000000000000000000..d9e7e08f5c8e277065c653a7c72987d064f55208
--- /dev/null
+++ b/config.json
@@ -0,0 +1,5 @@
+{
+ "quantization_config": {
+ "bits": 4
+ }
+}
diff --git a/ndarray-cache.json b/ndarray-cache.json
new file mode 100644
index 0000000000000000000000000000000000000000..6d2dcf4e8c185f1851680db8193ff41661180a47
--- /dev/null
+++ b/ndarray-cache.json
@@ -0,0 +1,9679 @@
+{
+ "metadata": {
+ "ParamSize": 709,
+ "ParamBytes": 16895535104.0,
+ "BitsPerParam": 4.125405656518088
+ },
+ "records": [
+ {
+ "dataPath": "params_shard_0.bin",
+ "format": "raw-shard",
+ "nbytes": 389283840,
+ "records": [
+ {
+ "name": "model.embed_tokens.q_weight",
+ "shape": [
+ 152064,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 389283840,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2160f6cbda407f70c0d2058e2543e6e5"
+ },
+ {
+ "dataPath": "params_shard_1.bin",
+ "format": "raw-shard",
+ "nbytes": 31102976,
+ "records": [
+ {
+ "name": "model.embed_tokens.q_scale",
+ "shape": [
+ 152064,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 12165120,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.0.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 12165120
+ },
+ {
+ "name": "model.layers.0.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 12179456
+ },
+ {
+ "name": "model.layers.0.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 30529536
+ }
+ ],
+ "md5sum": "3e7b67ece44d93b493924d79c6e6ce05"
+ },
+ {
+ "dataPath": "params_shard_2.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.0.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "119dd1b983309d741fb6645287b3702f"
+ },
+ {
+ "dataPath": "params_shard_3.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.0.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0bbf6497e76bfb60cf2ba7bdb6ca3a7b"
+ },
+ {
+ "dataPath": "params_shard_4.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.1.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "94574e053f2946b34cc18c6ad455e2f4"
+ },
+ {
+ "dataPath": "params_shard_5.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.0.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.0.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.0.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.0.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.0.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.0.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.1.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.1.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "14708d8170909015b1096ec11ab4f372"
+ },
+ {
+ "dataPath": "params_shard_6.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.1.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "70b0cbe76cc3a36fed44a3ce139d4d84"
+ },
+ {
+ "dataPath": "params_shard_7.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.1.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e2056907dbd6075a67a2388fbdcc1291"
+ },
+ {
+ "dataPath": "params_shard_8.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.2.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "93aeefac78495adfbff7688d5c74ea96"
+ },
+ {
+ "dataPath": "params_shard_9.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.1.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.1.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.1.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.1.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.1.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.1.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.2.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.2.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "ea2d624f6622d3445d58d13e5677e4d2"
+ },
+ {
+ "dataPath": "params_shard_10.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.2.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "bffe6947fe04ebfeda1e870bdc709fed"
+ },
+ {
+ "dataPath": "params_shard_11.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.2.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c791b3013aeb710277c34596cef78ec8"
+ },
+ {
+ "dataPath": "params_shard_12.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.3.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c378315c566a5f4eea531446c9d85f06"
+ },
+ {
+ "dataPath": "params_shard_13.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.2.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.2.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.2.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.2.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.2.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.2.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.3.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.3.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "4a840d2c0a5f15ef221dd465c48323eb"
+ },
+ {
+ "dataPath": "params_shard_14.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.3.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "af441f9290d817cdd1d3756fd61a2c89"
+ },
+ {
+ "dataPath": "params_shard_15.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.3.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fe24e0d000e6dda24b0586318950bf02"
+ },
+ {
+ "dataPath": "params_shard_16.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.4.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "dd617527c23fefa8e0a614d33e9935cb"
+ },
+ {
+ "dataPath": "params_shard_17.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.3.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.3.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.3.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.3.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.3.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.3.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.4.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.4.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "0cefde893c512bc1b75d0b9ccafb6b5c"
+ },
+ {
+ "dataPath": "params_shard_18.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.4.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b4ba7d9a7b5237d57c0f6833a763a740"
+ },
+ {
+ "dataPath": "params_shard_19.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.4.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "977fe394c4eb993a1970617469d3e4f1"
+ },
+ {
+ "dataPath": "params_shard_20.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.5.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "aa65d4713ffa59abf9d193892930a51f"
+ },
+ {
+ "dataPath": "params_shard_21.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.4.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.4.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.4.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.4.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.4.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.4.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.5.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.5.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "f9e308928ed17337766a5d2fad9b50da"
+ },
+ {
+ "dataPath": "params_shard_22.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.5.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b8ece74db336880634a7c0d229d243d4"
+ },
+ {
+ "dataPath": "params_shard_23.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.5.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e728ca537c79a652011990af144456e6"
+ },
+ {
+ "dataPath": "params_shard_24.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.6.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7fb726ef8305615d7caaeda6b5560795"
+ },
+ {
+ "dataPath": "params_shard_25.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.5.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.5.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.5.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.5.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.5.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.5.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.6.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.6.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "17d7098b25d681c038d16067e363d278"
+ },
+ {
+ "dataPath": "params_shard_26.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.6.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "51e7231580c1a235b660b3d727b3fe5e"
+ },
+ {
+ "dataPath": "params_shard_27.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.6.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1f6a5f32f306d7729280d0c7263eef0f"
+ },
+ {
+ "dataPath": "params_shard_28.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.7.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5716e7f55bd03f4113e17c9f70e86314"
+ },
+ {
+ "dataPath": "params_shard_29.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.6.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.6.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.6.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.6.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.6.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.6.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.7.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.7.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "ee20465108ed5057b8682ab4546442b3"
+ },
+ {
+ "dataPath": "params_shard_30.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.7.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "27b8aab15ad3a8ca6a78b3636e474d89"
+ },
+ {
+ "dataPath": "params_shard_31.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.7.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "315248fbdd2a5b0bc0c46c1857538605"
+ },
+ {
+ "dataPath": "params_shard_32.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.8.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f790cf2677aad8f00e7e1f23261f8fc6"
+ },
+ {
+ "dataPath": "params_shard_33.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.7.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.7.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.7.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.7.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.7.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.7.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.8.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.8.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "cf844ba0e6bf9c818d61597e5ab8fa35"
+ },
+ {
+ "dataPath": "params_shard_34.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.8.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c884d21ea633b395886e367ef4dff398"
+ },
+ {
+ "dataPath": "params_shard_35.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.8.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c089da007faf5ee21e96cc88f4617b58"
+ },
+ {
+ "dataPath": "params_shard_36.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.9.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f2d4a40314adcbdca25c42cb22fb9b27"
+ },
+ {
+ "dataPath": "params_shard_37.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.8.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.8.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.8.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.8.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.8.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.8.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.9.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.9.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "f71a70dc44ae2b7afacd71c4fd4eb40b"
+ },
+ {
+ "dataPath": "params_shard_38.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.9.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b25d84bdf6b77388a109b7857ebe8653"
+ },
+ {
+ "dataPath": "params_shard_39.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.9.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2944d74529e0db8e33de6d5d1f3a1459"
+ },
+ {
+ "dataPath": "params_shard_40.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.10.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7bb1fe32b6001e785c82f67c7690d7db"
+ },
+ {
+ "dataPath": "params_shard_41.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.9.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.9.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.9.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.9.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.9.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.9.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.10.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.10.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "e23a9f00a2cb9698b6653ac36b1b147a"
+ },
+ {
+ "dataPath": "params_shard_42.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.10.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d185d30973d17350dd8bfabab736440c"
+ },
+ {
+ "dataPath": "params_shard_43.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.10.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "38c6bb718b1de9d9f7e9c31db494eee7"
+ },
+ {
+ "dataPath": "params_shard_44.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.11.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e23ea4f4a7491b9e2336373c15caf9b2"
+ },
+ {
+ "dataPath": "params_shard_45.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.10.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.10.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.10.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.10.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.10.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.10.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.11.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.11.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "a452a14dd9795b4cbb672a574e92531d"
+ },
+ {
+ "dataPath": "params_shard_46.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.11.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d1343ad7477d62e03847f5813223194b"
+ },
+ {
+ "dataPath": "params_shard_47.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.11.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1fdace10adebcca80a7fcb89e77b90a4"
+ },
+ {
+ "dataPath": "params_shard_48.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.12.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2b4c345718dc03e30b6253112123617a"
+ },
+ {
+ "dataPath": "params_shard_49.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.11.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.11.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.11.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.11.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.11.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.11.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.12.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.12.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "34296b36fab4ce93229c00bee31b22ff"
+ },
+ {
+ "dataPath": "params_shard_50.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.12.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "26129bfca73a8ab19c0648fe94a230e2"
+ },
+ {
+ "dataPath": "params_shard_51.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.12.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "224191bac3aa158c602002653178983d"
+ },
+ {
+ "dataPath": "params_shard_52.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.13.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a07cce1357a66c0347e143e47710df8e"
+ },
+ {
+ "dataPath": "params_shard_53.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.12.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.12.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.12.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.12.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.12.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.12.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.13.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.13.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "aa64e483e5f20dd4563aa18b5bff6855"
+ },
+ {
+ "dataPath": "params_shard_54.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.13.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e29690928c42b9621e3f4301d726d89b"
+ },
+ {
+ "dataPath": "params_shard_55.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.13.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "56399646a1d029a57ae60547081cc64c"
+ },
+ {
+ "dataPath": "params_shard_56.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.14.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b848262f4a7cbcabc29f375470547334"
+ },
+ {
+ "dataPath": "params_shard_57.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.13.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.13.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.13.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.13.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.13.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.13.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.14.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.14.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "f1299f4f688a9f2d4e0574ec0c4f69bb"
+ },
+ {
+ "dataPath": "params_shard_58.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.14.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "65d1212958007a5624e8f69725951048"
+ },
+ {
+ "dataPath": "params_shard_59.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.14.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6c1de3942623361ff6aa759694cf78c2"
+ },
+ {
+ "dataPath": "params_shard_60.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.15.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3211346e07963a5fc1cb7713fd3b5b3e"
+ },
+ {
+ "dataPath": "params_shard_61.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.14.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.14.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.14.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.14.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.14.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.14.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.15.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.15.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "1e221b2c244a3eee7888a53f08af3e7d"
+ },
+ {
+ "dataPath": "params_shard_62.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.15.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1a3a8a7da9b68fa3a507a5752b049e4f"
+ },
+ {
+ "dataPath": "params_shard_63.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.15.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d8acc4dee55e1fccdb5cdad5921bb83b"
+ },
+ {
+ "dataPath": "params_shard_64.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.16.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2d355331b73623c261a5897ae30e3b00"
+ },
+ {
+ "dataPath": "params_shard_65.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.15.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.15.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.15.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.15.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.15.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.15.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.16.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.16.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "1572b102bded95ab329ecf3986ac96fb"
+ },
+ {
+ "dataPath": "params_shard_66.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.16.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6116374350074ac6bb3f26489eca8769"
+ },
+ {
+ "dataPath": "params_shard_67.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.16.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8cc644440b754dea2d0a170d7e1adc5e"
+ },
+ {
+ "dataPath": "params_shard_68.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.17.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3e70a049a96b1f40bdcf83e8db658c6c"
+ },
+ {
+ "dataPath": "params_shard_69.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.16.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.16.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.16.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.16.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.16.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.16.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.17.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.17.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "39affe6d48a41d2e5bc1f8b688ca86b7"
+ },
+ {
+ "dataPath": "params_shard_70.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.17.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b2315972297d13bd32ce620b95189ce6"
+ },
+ {
+ "dataPath": "params_shard_71.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.17.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "57a5f81b247934ccefd30e51c02382bc"
+ },
+ {
+ "dataPath": "params_shard_72.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.18.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b213f0092c857edc6b76e130567ed416"
+ },
+ {
+ "dataPath": "params_shard_73.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.17.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.17.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.17.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.17.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.17.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.17.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.18.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.18.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "6dfc58dcec1894f66e689d884ec4d43a"
+ },
+ {
+ "dataPath": "params_shard_74.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.18.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "da06290cbb25c063a187010f91deccdf"
+ },
+ {
+ "dataPath": "params_shard_75.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.18.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d3dd9f61d3a6fb2ebc8d009147edc62c"
+ },
+ {
+ "dataPath": "params_shard_76.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.19.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f4701ea2c6bde074e24e0715750bd2cf"
+ },
+ {
+ "dataPath": "params_shard_77.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.18.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.18.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.18.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.18.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.18.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.18.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.19.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.19.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "5fb47fdbd774a72f1f172125d824ccff"
+ },
+ {
+ "dataPath": "params_shard_78.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.19.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a766879e78138eaa000eec95ea9377ff"
+ },
+ {
+ "dataPath": "params_shard_79.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.19.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "df7df24d74f3db624c427f9568e561ff"
+ },
+ {
+ "dataPath": "params_shard_80.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.20.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9fc978c2ba9d7fc175ef93e7138076c8"
+ },
+ {
+ "dataPath": "params_shard_81.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.19.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.19.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.19.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.19.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.19.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.19.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.20.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.20.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "0f6770226bc44adf1ba7fc9bd8f2ec76"
+ },
+ {
+ "dataPath": "params_shard_82.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.20.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f0f6f5fd27e3b567316ea6024822f1fa"
+ },
+ {
+ "dataPath": "params_shard_83.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.20.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "883555eefffcf083ece5f455db6c3cdc"
+ },
+ {
+ "dataPath": "params_shard_84.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.21.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ebbc6852b3feb201be04a0c7c91d722b"
+ },
+ {
+ "dataPath": "params_shard_85.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.20.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.20.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.20.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.20.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.20.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.20.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.21.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.21.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "e45a8d0df1e3552bfd0a4d2ab514b0f4"
+ },
+ {
+ "dataPath": "params_shard_86.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.21.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ffce06c9d902246e7a5b52f13c9e99df"
+ },
+ {
+ "dataPath": "params_shard_87.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.21.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2fb2d3cdc6d68235bbfbca1bd6d7e0e2"
+ },
+ {
+ "dataPath": "params_shard_88.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.22.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9ece9f579d6a07ada436d104b6c827a1"
+ },
+ {
+ "dataPath": "params_shard_89.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.21.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.21.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.21.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.21.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.21.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.21.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.22.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.22.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "7524774d4cf32fc49d85adfedd0c3436"
+ },
+ {
+ "dataPath": "params_shard_90.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.22.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "84e9e89e81f285755b398bf90c4721ac"
+ },
+ {
+ "dataPath": "params_shard_91.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.22.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e9a352bf2329aaf3c49dcb13516ffdf9"
+ },
+ {
+ "dataPath": "params_shard_92.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.23.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "bf083879dc03cc194b745feea25f1489"
+ },
+ {
+ "dataPath": "params_shard_93.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.22.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.22.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.22.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.22.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.22.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.22.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.23.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.23.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "c48df471d1122384219e1d82b4c9e647"
+ },
+ {
+ "dataPath": "params_shard_94.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.23.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "701a4849aa1e1d270908310ffce474b8"
+ },
+ {
+ "dataPath": "params_shard_95.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.23.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4a4ac1f12f1201e6763316645c41d99c"
+ },
+ {
+ "dataPath": "params_shard_96.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.24.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a112217764718957849bc22544e27862"
+ },
+ {
+ "dataPath": "params_shard_97.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.23.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.23.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.23.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.23.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.23.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.23.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.24.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.24.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "2c408e376f752ba75faced6f1e9d8f72"
+ },
+ {
+ "dataPath": "params_shard_98.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.24.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2ada0be5b3542f20f19634c9fb66cd29"
+ },
+ {
+ "dataPath": "params_shard_99.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.24.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4edecd2c041ac46d48a1bd3521620eb3"
+ },
+ {
+ "dataPath": "params_shard_100.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.25.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "05dbda6e592d43e1518f0f3c34948df2"
+ },
+ {
+ "dataPath": "params_shard_101.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.24.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.24.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.24.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.24.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.24.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.24.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.25.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.25.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "e6504138d7f091a3be9fbfaf4158b8e2"
+ },
+ {
+ "dataPath": "params_shard_102.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.25.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "327878dabeae075a191d86a723770f2d"
+ },
+ {
+ "dataPath": "params_shard_103.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.25.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b0a49538754dd1eb7ef22e2e469e652c"
+ },
+ {
+ "dataPath": "params_shard_104.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.26.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5715c38c928ef849eff57e83bb402de0"
+ },
+ {
+ "dataPath": "params_shard_105.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.25.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.25.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.25.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.25.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.25.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.25.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.26.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.26.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "5fbece675c2fab8dd915829e16bf710b"
+ },
+ {
+ "dataPath": "params_shard_106.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.26.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "dd31b35d51c3d33a61819f1cace75856"
+ },
+ {
+ "dataPath": "params_shard_107.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.26.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1520d129a8dcdedbdc5a96c4b77d9127"
+ },
+ {
+ "dataPath": "params_shard_108.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.27.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ec5af2121c5e2953c8522e9342ff8e5c"
+ },
+ {
+ "dataPath": "params_shard_109.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.26.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.26.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.26.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.26.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.26.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.26.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.27.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.27.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "6e02bceda4e0a01619cf5ee0e8efdc2c"
+ },
+ {
+ "dataPath": "params_shard_110.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.27.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5cd0e2b0f1aa99430ad4a17b8eee514d"
+ },
+ {
+ "dataPath": "params_shard_111.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.27.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "866df094fbaca4a3426cd54631fc96f4"
+ },
+ {
+ "dataPath": "params_shard_112.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.28.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d85d79d1b1fe09a1d131a85044128777"
+ },
+ {
+ "dataPath": "params_shard_113.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.27.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.27.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.27.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.27.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.27.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.27.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.28.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.28.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "709244a8e90e01762c14e92ffe0998f6"
+ },
+ {
+ "dataPath": "params_shard_114.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.28.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "968e8cb9d0334af826c7efc350d53b8e"
+ },
+ {
+ "dataPath": "params_shard_115.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.28.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9fa043aacd80997da0e6a27c0db0495f"
+ },
+ {
+ "dataPath": "params_shard_116.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.29.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fc299560c0938278fd75ce262b8e7278"
+ },
+ {
+ "dataPath": "params_shard_117.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.28.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.28.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.28.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.28.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.28.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.28.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.29.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.29.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "bb7a341721cc8adda13dc78b65c3da89"
+ },
+ {
+ "dataPath": "params_shard_118.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.29.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2ac8aee7a8315acca8f3d0c72d4b3838"
+ },
+ {
+ "dataPath": "params_shard_119.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.29.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "045d146248d9c4dd6c3fac285da34a72"
+ },
+ {
+ "dataPath": "params_shard_120.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.30.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "59b3c945307dd14f47fe40907b6ce717"
+ },
+ {
+ "dataPath": "params_shard_121.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.29.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.29.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.29.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.29.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.29.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.29.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.30.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.30.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "0072f6be1a905bc1b270b31aff237f38"
+ },
+ {
+ "dataPath": "params_shard_122.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.30.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7774723a300f98138a1c40da549fbaf1"
+ },
+ {
+ "dataPath": "params_shard_123.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.30.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7a102deb562c1ad2d6f6ba8cea1416e1"
+ },
+ {
+ "dataPath": "params_shard_124.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.31.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7077e5a06d582c0b63af856e17bbf05b"
+ },
+ {
+ "dataPath": "params_shard_125.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.30.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.30.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.30.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.30.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.30.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.30.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.31.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.31.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "a747d29541a9f943cadef7f7aa00229e"
+ },
+ {
+ "dataPath": "params_shard_126.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.31.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4b3ca70cce415094a4f40cb6507de7f4"
+ },
+ {
+ "dataPath": "params_shard_127.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.31.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c8edc22cc57966fbc509b8ac1f1cdb27"
+ },
+ {
+ "dataPath": "params_shard_128.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.32.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1ab2670f5a992f840a66853373ca57fd"
+ },
+ {
+ "dataPath": "params_shard_129.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.31.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.31.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.31.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.31.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.31.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.31.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.32.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.32.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "d397427d77fc63755b97011c5f409bb1"
+ },
+ {
+ "dataPath": "params_shard_130.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.32.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "58f905932d9ec361f28d52f38fa9f1fc"
+ },
+ {
+ "dataPath": "params_shard_131.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.32.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5281d63585003be532ddca700f257a0f"
+ },
+ {
+ "dataPath": "params_shard_132.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.33.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "24520890af85661be2cb07cf7dcf2bd4"
+ },
+ {
+ "dataPath": "params_shard_133.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.32.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.32.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.32.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.32.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.32.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.32.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.33.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.33.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "aee25acd5522ef2f333e4e918166cfc3"
+ },
+ {
+ "dataPath": "params_shard_134.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.33.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ccda67286e192f31ec443e9c7a8130a0"
+ },
+ {
+ "dataPath": "params_shard_135.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.33.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e6b841d299513d6f2638cf85a739d6a7"
+ },
+ {
+ "dataPath": "params_shard_136.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.34.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b31789e0903e19e1c9d2b9ee553856c4"
+ },
+ {
+ "dataPath": "params_shard_137.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.33.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.33.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.33.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.33.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.33.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.33.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.34.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.34.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "4f08dc97743de07320b7ab3e01b48dcc"
+ },
+ {
+ "dataPath": "params_shard_138.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.34.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "931d799b4221cac82100b80d88692a85"
+ },
+ {
+ "dataPath": "params_shard_139.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.34.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3336b2fa2e272db789c66bf2b361c720"
+ },
+ {
+ "dataPath": "params_shard_140.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.35.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2b18275c4239150aed533ce51827369f"
+ },
+ {
+ "dataPath": "params_shard_141.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.34.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.34.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.34.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.34.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.34.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.34.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.35.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.35.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "5ecb264fceb38a49c98e0d230ae28f8f"
+ },
+ {
+ "dataPath": "params_shard_142.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.35.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9a1ef78265ea6d872c015f832d0fa3d5"
+ },
+ {
+ "dataPath": "params_shard_143.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.35.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "01755d31ccbcf7036f7cfaec5949b0c5"
+ },
+ {
+ "dataPath": "params_shard_144.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.36.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2e35b8fcf4ae7dd9a1beb4b849de3f1c"
+ },
+ {
+ "dataPath": "params_shard_145.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.35.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.35.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.35.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.35.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.35.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.35.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.36.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.36.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "626e255e5e7690ef0872d531b36e338c"
+ },
+ {
+ "dataPath": "params_shard_146.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.36.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "de3a8eb0d18638c0f9d4afb4658c9560"
+ },
+ {
+ "dataPath": "params_shard_147.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.36.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "043cd5c3413c1335b358c295d43d42fb"
+ },
+ {
+ "dataPath": "params_shard_148.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.37.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ff1c6c4973342f2faf776793e6585e17"
+ },
+ {
+ "dataPath": "params_shard_149.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.36.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.36.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.36.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.36.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.36.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.36.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.37.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.37.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "99c3980fcd6937f3dc24d19fba8f4134"
+ },
+ {
+ "dataPath": "params_shard_150.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.37.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7a918b4561804225473b8e3bfb7e1335"
+ },
+ {
+ "dataPath": "params_shard_151.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.37.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b861b297d56ac6541fa304b47fd85b77"
+ },
+ {
+ "dataPath": "params_shard_152.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.38.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6715df4058c9fed0199a73d5d82464f5"
+ },
+ {
+ "dataPath": "params_shard_153.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.37.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.37.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.37.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.37.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.37.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.37.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.38.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.38.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "f93ea50e0787957f0101c3a80900aa9b"
+ },
+ {
+ "dataPath": "params_shard_154.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.38.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9aa8dc9dac6e5504ed69ad983343c620"
+ },
+ {
+ "dataPath": "params_shard_155.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.38.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6bb58194eeeeb552559c7b71ee6065f2"
+ },
+ {
+ "dataPath": "params_shard_156.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.39.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "374180a4c7fef97b48ffc5825d5ba0f6"
+ },
+ {
+ "dataPath": "params_shard_157.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.38.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.38.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.38.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.38.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.38.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.38.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.39.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.39.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "838526860f24873ed1dbc21d7656f751"
+ },
+ {
+ "dataPath": "params_shard_158.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.39.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "68e6c31e94f5504bbecfbeaccfada0aa"
+ },
+ {
+ "dataPath": "params_shard_159.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.39.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1525dd24f902765585611cca3b5d73f8"
+ },
+ {
+ "dataPath": "params_shard_160.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.40.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "39d81091371af41c874358e0053c3eee"
+ },
+ {
+ "dataPath": "params_shard_161.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.39.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.39.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.39.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.39.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.39.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.39.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.40.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.40.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "51d158ba008cfc3ee58379d40c38551f"
+ },
+ {
+ "dataPath": "params_shard_162.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.40.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e376330c3202f3742681eb202baff45f"
+ },
+ {
+ "dataPath": "params_shard_163.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.40.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3370cc282a0901e322921fac361b2f08"
+ },
+ {
+ "dataPath": "params_shard_164.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.41.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c4414ce1701f39ca9ec67ab28d76f1a6"
+ },
+ {
+ "dataPath": "params_shard_165.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.40.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.40.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.40.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.40.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.40.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.40.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.41.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.41.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "be8a4165d49bdd85f715274d7d5e99f3"
+ },
+ {
+ "dataPath": "params_shard_166.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.41.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a078e70ed9c6a3af22bf13447f7263b0"
+ },
+ {
+ "dataPath": "params_shard_167.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.41.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "102b4979cde838e7bc5ef818efb3dcdc"
+ },
+ {
+ "dataPath": "params_shard_168.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.42.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3787cb38574ed062b69aa230d23188f1"
+ },
+ {
+ "dataPath": "params_shard_169.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.41.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.41.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.41.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.41.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.41.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.41.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.42.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.42.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "5199a6ff9ba1cc51bf62c1aea790a9d2"
+ },
+ {
+ "dataPath": "params_shard_170.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.42.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "64680482c6620b22869d3125ee422abb"
+ },
+ {
+ "dataPath": "params_shard_171.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.42.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "13a5d6abd1d4e9accdb8fc2b54268005"
+ },
+ {
+ "dataPath": "params_shard_172.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.43.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cf73c32865dffac58f10ff7ded1318db"
+ },
+ {
+ "dataPath": "params_shard_173.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.42.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.42.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.42.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.42.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.42.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.42.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.43.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.43.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "6bddf71d18cf11ac9a9ada290fee87f1"
+ },
+ {
+ "dataPath": "params_shard_174.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.43.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ff87f3db3dcd6e10ccf8428efa483469"
+ },
+ {
+ "dataPath": "params_shard_175.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.43.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b8c25432754145973d783fcdeff83261"
+ },
+ {
+ "dataPath": "params_shard_176.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.44.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "002eedac2e4115717764ceed27db8f88"
+ },
+ {
+ "dataPath": "params_shard_177.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.43.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.43.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.43.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.43.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.43.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.43.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.44.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.44.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "e85a5acd64990d644d7199e709b34451"
+ },
+ {
+ "dataPath": "params_shard_178.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.44.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d232d273dcd9f4be8beb00f4133c7b1b"
+ },
+ {
+ "dataPath": "params_shard_179.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.44.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f9ae30fafcf433b8658e2e499ce23a71"
+ },
+ {
+ "dataPath": "params_shard_180.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.45.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a25047ec68f3d46c53e4a855514e66b5"
+ },
+ {
+ "dataPath": "params_shard_181.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.44.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.44.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.44.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.44.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.44.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.44.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.45.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.45.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "4f3b6ffe4897a33ff3001474a32c9a4d"
+ },
+ {
+ "dataPath": "params_shard_182.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.45.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4fcc28226d557d950f9933d456aae8d0"
+ },
+ {
+ "dataPath": "params_shard_183.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.45.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "91bf07c36335eeaf00ebbec8d62f81ab"
+ },
+ {
+ "dataPath": "params_shard_184.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.46.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "95ffee93c9d2f4b508ac10d87633147d"
+ },
+ {
+ "dataPath": "params_shard_185.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.45.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.45.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.45.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.45.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.45.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.45.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.46.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.46.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "1b07832d6b01e8ae06a395e53b5961de"
+ },
+ {
+ "dataPath": "params_shard_186.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.46.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "703a4d735956756f562d91bb7b45b11f"
+ },
+ {
+ "dataPath": "params_shard_187.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.46.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3438d1f58cf8f125a07348c6c507d6be"
+ },
+ {
+ "dataPath": "params_shard_188.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.47.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "515e7a2cb93bca3c00d95e7fc6f6a8c5"
+ },
+ {
+ "dataPath": "params_shard_189.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.46.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.46.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.46.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.46.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.46.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.46.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.47.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.47.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "d0b671afdc393b5290f3f5493e70b026"
+ },
+ {
+ "dataPath": "params_shard_190.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.47.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "af8f500889b2e95a4290c5e8580703bf"
+ },
+ {
+ "dataPath": "params_shard_191.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.47.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "88154cc67ac23106b0b21f8ca3601d61"
+ },
+ {
+ "dataPath": "params_shard_192.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.48.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f4a3154ea87ed593529b33aefb6b2c6c"
+ },
+ {
+ "dataPath": "params_shard_193.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.47.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.47.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.47.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.47.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.47.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.47.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.48.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.48.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "3595a1fabe9757621b616ac893db66aa"
+ },
+ {
+ "dataPath": "params_shard_194.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.48.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9994a0c53cf465a55a845171a41d36a7"
+ },
+ {
+ "dataPath": "params_shard_195.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.48.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b2d2ec85f61a1d0c4b5e4056aa230e0b"
+ },
+ {
+ "dataPath": "params_shard_196.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.49.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3d5ff400d76f66d49affc65944451542"
+ },
+ {
+ "dataPath": "params_shard_197.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.48.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.48.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.48.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.48.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.48.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.48.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.49.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.49.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "069bcdd0e63bbb120a7249de211b9286"
+ },
+ {
+ "dataPath": "params_shard_198.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.49.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "748e482d7dbf63b3753be89a80859134"
+ },
+ {
+ "dataPath": "params_shard_199.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.49.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "00d49e1eda6b6ca614f8f0cc5fa1521f"
+ },
+ {
+ "dataPath": "params_shard_200.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.50.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f1c751d62e2d1794a381124553a385b7"
+ },
+ {
+ "dataPath": "params_shard_201.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.49.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.49.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.49.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.49.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.49.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.49.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.50.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.50.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "7524c75aeb936919d71f37b4bd39a0af"
+ },
+ {
+ "dataPath": "params_shard_202.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.50.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "27980e95cb6d8d10d10b237f18ba0bc2"
+ },
+ {
+ "dataPath": "params_shard_203.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.50.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ab1108e739c650ddc736199879bc08b0"
+ },
+ {
+ "dataPath": "params_shard_204.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.51.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "33ad4ca86b20f8a651d3df4cf569bbf1"
+ },
+ {
+ "dataPath": "params_shard_205.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.50.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.50.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.50.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.50.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.50.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.50.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.51.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.51.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "cac4a093113db35da3f95fd91f0f3e2a"
+ },
+ {
+ "dataPath": "params_shard_206.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.51.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3c37f007492f8cba9562554dc8f4f373"
+ },
+ {
+ "dataPath": "params_shard_207.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.51.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8c7a52989da9769cbbc63545ffef9f9c"
+ },
+ {
+ "dataPath": "params_shard_208.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.52.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5a594a1873cc20888fce790aafd98768"
+ },
+ {
+ "dataPath": "params_shard_209.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.51.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.51.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.51.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.51.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.51.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.51.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.52.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.52.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "acc40d31f42002acd4a1fd50dd70069f"
+ },
+ {
+ "dataPath": "params_shard_210.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.52.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "440b34764937367439e428a0c1b61257"
+ },
+ {
+ "dataPath": "params_shard_211.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.52.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "90db33ba1225a24999c24fe938bc3328"
+ },
+ {
+ "dataPath": "params_shard_212.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.53.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0fb9426f5b3c71580e713f833ac12683"
+ },
+ {
+ "dataPath": "params_shard_213.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.52.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.52.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.52.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.52.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.52.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.52.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.53.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.53.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "10e51be53fc743c1410976867848b599"
+ },
+ {
+ "dataPath": "params_shard_214.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.53.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "113013aff8050f785af7e738774119ae"
+ },
+ {
+ "dataPath": "params_shard_215.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.53.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "64edecd78d7bfcefdd26e88085f9f6e2"
+ },
+ {
+ "dataPath": "params_shard_216.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.54.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2d15cbf82473a4a5071da340b576b941"
+ },
+ {
+ "dataPath": "params_shard_217.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.53.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.53.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.53.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.53.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.53.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.53.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.54.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.54.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "dfb201548db77bb9a98f2e04c9204d0e"
+ },
+ {
+ "dataPath": "params_shard_218.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.54.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a89caf16a40e49022cecead4806ada4d"
+ },
+ {
+ "dataPath": "params_shard_219.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.54.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "75ebdc208de081a2f7816aea2dec4cf5"
+ },
+ {
+ "dataPath": "params_shard_220.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.55.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2d623ed33fd7ed53675427436a7bce1d"
+ },
+ {
+ "dataPath": "params_shard_221.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.54.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.54.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.54.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.54.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.54.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.54.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.55.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.55.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "797095d9e274247b90b07cd6feac3f22"
+ },
+ {
+ "dataPath": "params_shard_222.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.55.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3a5c819a8445e41badbd475e513c96d7"
+ },
+ {
+ "dataPath": "params_shard_223.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.55.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "daa14cd0be6d653b11b6e6c2da8518bc"
+ },
+ {
+ "dataPath": "params_shard_224.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.56.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "05822cee9f1457b36fa0c67953d1d959"
+ },
+ {
+ "dataPath": "params_shard_225.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.55.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.55.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.55.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.55.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.55.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.55.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.56.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.56.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "5e91903be3764d5e63651b017afc53f7"
+ },
+ {
+ "dataPath": "params_shard_226.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.56.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "acf4b82bbedcb07ab4eac2511217ebf9"
+ },
+ {
+ "dataPath": "params_shard_227.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.56.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7dae008d7bc32cf56fe11747fede857a"
+ },
+ {
+ "dataPath": "params_shard_228.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.57.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f139967c301a14b663ac32d70bef87a5"
+ },
+ {
+ "dataPath": "params_shard_229.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.56.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.56.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.56.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.56.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.56.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.56.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.57.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.57.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "d308708405e74aeeccd311cff9b97b11"
+ },
+ {
+ "dataPath": "params_shard_230.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.57.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b9c431f6a2e0dae210224e1d81573e40"
+ },
+ {
+ "dataPath": "params_shard_231.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.57.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "bc0797370fbd5638d7ae57f3e96c03f3"
+ },
+ {
+ "dataPath": "params_shard_232.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.58.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b9109d9848f836e97745086eaa8b29e4"
+ },
+ {
+ "dataPath": "params_shard_233.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.57.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.57.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.57.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.57.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.57.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.57.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.58.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.58.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "50e66174cb716541b499ebd6a89ad56c"
+ },
+ {
+ "dataPath": "params_shard_234.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.58.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "92107572a4c50fd005d3a644ab69dbd4"
+ },
+ {
+ "dataPath": "params_shard_235.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.58.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d5f13b196a006bc15d4fee2b3ede5c7a"
+ },
+ {
+ "dataPath": "params_shard_236.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.59.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "712fc8aff74c3bd8255a3a33c6503b8f"
+ },
+ {
+ "dataPath": "params_shard_237.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.58.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.58.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.58.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.58.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.58.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.58.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.59.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.59.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "ea4b6c1f1497cc4e06cf04dbce59c43c"
+ },
+ {
+ "dataPath": "params_shard_238.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.59.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "931d813731cb8656c8dba0ef8d7752c1"
+ },
+ {
+ "dataPath": "params_shard_239.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.59.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d504d6bed5290fbcfe16a0c40ee085ab"
+ },
+ {
+ "dataPath": "params_shard_240.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.60.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "59b5d7e8cc9df0805a63260d304a2eff"
+ },
+ {
+ "dataPath": "params_shard_241.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.59.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.59.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.59.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.59.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.59.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.59.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.60.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.60.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "962dfc64cb1143fbaed9076816a82b6b"
+ },
+ {
+ "dataPath": "params_shard_242.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.60.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9e743b1073cc7328c3f93fe96065ca57"
+ },
+ {
+ "dataPath": "params_shard_243.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.60.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9d3cf9efaa9b67f00baf253f28373444"
+ },
+ {
+ "dataPath": "params_shard_244.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.61.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "04596f452078ea3830ee679dc57e424d"
+ },
+ {
+ "dataPath": "params_shard_245.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.60.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.60.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.60.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.60.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.60.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.60.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.61.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.61.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "ffebd6c05ce0f67964035af0df5b1102"
+ },
+ {
+ "dataPath": "params_shard_246.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.61.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "44f3d11d7194b5c0ae43fa1003d059d0"
+ },
+ {
+ "dataPath": "params_shard_247.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.61.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9b85ceb37a98bc96d24f27d9cbe9d2e1"
+ },
+ {
+ "dataPath": "params_shard_248.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.62.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cb9fd6ec6f3dba630bd7b9b04944766a"
+ },
+ {
+ "dataPath": "params_shard_249.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.61.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.61.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.61.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.61.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.61.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.61.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.62.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.62.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "ea3dde8a543fbd02679e87ec1e4f21e7"
+ },
+ {
+ "dataPath": "params_shard_250.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.62.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "81b1d5dcbb6db64635997fe00e4d9fda"
+ },
+ {
+ "dataPath": "params_shard_251.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.62.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "98bca412296ab3ae73f30150ce557fa2"
+ },
+ {
+ "dataPath": "params_shard_252.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.63.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f5c1050e97a9f8bddb1097a90bc2e6e1"
+ },
+ {
+ "dataPath": "params_shard_253.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.62.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.62.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.62.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.62.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.62.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.62.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.63.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.63.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "a71c36eadf9412ee5b9ab4506d681675"
+ },
+ {
+ "dataPath": "params_shard_254.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.63.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6bb3cd53f75fcce7e6cdfffa0fcdc3a4"
+ },
+ {
+ "dataPath": "params_shard_255.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.63.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ddf4b635c6e5a5fe2d9cdb3d44069ced"
+ },
+ {
+ "dataPath": "params_shard_256.bin",
+ "format": "raw-shard",
+ "nbytes": 389283840,
+ "records": [
+ {
+ "name": "lm_head.q_weight",
+ "shape": [
+ 640,
+ 152064
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 389283840,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fc6101d4aec293d4610b4d061da07594"
+ },
+ {
+ "dataPath": "params_shard_257.bin",
+ "format": "raw-shard",
+ "nbytes": 32348160,
+ "records": [
+ {
+ "name": "model.layers.63.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.63.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.63.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.63.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 17940480
+ },
+ {
+ "name": "model.layers.63.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20152320
+ },
+ {
+ "name": "model.layers.63.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.norm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "lm_head.q_scale",
+ "shape": [
+ 40,
+ 152064
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 12165120,
+ "byteOffset": 20183040
+ }
+ ],
+ "md5sum": "814c979637fb930826b64089b7044687"
+ }
+ ]
+}
\ No newline at end of file
diff --git a/params_shard_0.bin b/params_shard_0.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f02631b19fef83d77e3d1870367892a335b82a9a
--- /dev/null
+++ b/params_shard_0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:92771e7ea852f0045445e03e2f129a8568ed9bddad391417ebbc9f902b4c7fce
+size 389283840
diff --git a/params_shard_1.bin b/params_shard_1.bin
new file mode 100644
index 0000000000000000000000000000000000000000..988bfe7bf442f76fdbe0b0e49bc4e44726d79f55
--- /dev/null
+++ b/params_shard_1.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:251c179559a9d8953524275ced4ab92034a8927472f330c885c71480f79a36dd
+size 31102976
diff --git a/params_shard_10.bin b/params_shard_10.bin
new file mode 100644
index 0000000000000000000000000000000000000000..aa2c40ce075e0cd94ecf94a39bc626b87242c3b6
--- /dev/null
+++ b/params_shard_10.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e44784230eb654b982856dc84dd1d3dd7c66b86a8c0bda3632febc3f9e8ed1ee
+size 141557760
diff --git a/params_shard_100.bin b/params_shard_100.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7921795f4ceed9d86d4f5f977d6d058c2ff90243
--- /dev/null
+++ b/params_shard_100.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:22bf9489a3bd22dc73ce81946deb0bcf9e5e60bc5623c6fee72449ab7f38ece6
+size 18350080
diff --git a/params_shard_101.bin b/params_shard_101.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ffcab03e8706e388a0ea4951618651cf95862d19
--- /dev/null
+++ b/params_shard_101.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:48eaaf373bf7b6f5b59cbc480fdab3d8e81fa3b4bc833b34215043f12fc82b18
+size 20760576
diff --git a/params_shard_102.bin b/params_shard_102.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ef80e1c508733c2052b5ae6fbcbc55eb3c5f4b61
--- /dev/null
+++ b/params_shard_102.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3c9d68f57d7034d65f573f46f95ea571ab92bb9b49917bebfd3777aadab0d62e
+size 141557760
diff --git a/params_shard_103.bin b/params_shard_103.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e3c86894b9aad90b3292e5a2c2c5074ff509ac0e
--- /dev/null
+++ b/params_shard_103.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c0b8870989fb3475353ffde5b2754ff523d814cb557fcdb1ed75a8d32baea903
+size 70778880
diff --git a/params_shard_104.bin b/params_shard_104.bin
new file mode 100644
index 0000000000000000000000000000000000000000..79b61fd421291ad27924a7e34d7ef58369fcb9df
--- /dev/null
+++ b/params_shard_104.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9d03d54afde04e13ea53686b8d522e892dd721d79980a997ffc7d75ed7473eb5
+size 18350080
diff --git a/params_shard_105.bin b/params_shard_105.bin
new file mode 100644
index 0000000000000000000000000000000000000000..40bed0316ee41fe42da49b60ab50d472fd23507d
--- /dev/null
+++ b/params_shard_105.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:713c5295eb20b8fe7d67c203ef82e317be005ecedf8b8d21565ac972744b1417
+size 20760576
diff --git a/params_shard_106.bin b/params_shard_106.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b83d7cdedaa0651e61d58e7700ec88fd5998bce6
--- /dev/null
+++ b/params_shard_106.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7d69dfa5a435cc91fb01961e3aef21c9aa9e13941282cf6e7f12eef39dc779c2
+size 141557760
diff --git a/params_shard_107.bin b/params_shard_107.bin
new file mode 100644
index 0000000000000000000000000000000000000000..88a8333958575b5d7b5e9e5a0f157c14a7fa6aa8
--- /dev/null
+++ b/params_shard_107.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e180ee449b6397114a5a2a26b13e14a1142ac3905acc3e77149754943b8c286d
+size 70778880
diff --git a/params_shard_108.bin b/params_shard_108.bin
new file mode 100644
index 0000000000000000000000000000000000000000..38ba1e396ceed58b8fff0d2d8c7a3f3be41670b4
--- /dev/null
+++ b/params_shard_108.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f1932903bdea49fe517c0c485de0575a33bb4efcaba6c37945aa1d0e0d0928ff
+size 18350080
diff --git a/params_shard_109.bin b/params_shard_109.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b546af3f35ce5cf6a5490c3b966bf4f50ec1c022
--- /dev/null
+++ b/params_shard_109.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:82724a49e393996304509208099f588648c6a570127fc4096a1ad5069e8592a1
+size 20760576
diff --git a/params_shard_11.bin b/params_shard_11.bin
new file mode 100644
index 0000000000000000000000000000000000000000..94de2aec53f92562083f68043d279a95f9e15d12
--- /dev/null
+++ b/params_shard_11.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e3c130fa2f96143b6e52b7d460dd801546d7c7db318d268e28fa4a4c74fed6e0
+size 70778880
diff --git a/params_shard_110.bin b/params_shard_110.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cf6d3a35190d3eff5857736ea4241d556cc197e8
--- /dev/null
+++ b/params_shard_110.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9514b4c7b7b6d0642f113e3fb29f6ac08e44086bf7f92575be689d0d98217f15
+size 141557760
diff --git a/params_shard_111.bin b/params_shard_111.bin
new file mode 100644
index 0000000000000000000000000000000000000000..38e0816027b87d83d6ae26797b4fad84969e81b0
--- /dev/null
+++ b/params_shard_111.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b187c1094c64a65823291ab915d5d4725ee4681bb53290009114808136f8e477
+size 70778880
diff --git a/params_shard_112.bin b/params_shard_112.bin
new file mode 100644
index 0000000000000000000000000000000000000000..151c0e41bc67b728daea3dbd7de810c0343c9f6e
--- /dev/null
+++ b/params_shard_112.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:875d273906b2668de01f599e46b86802a9f86c2a0fabd0faf5b28f97c1731eac
+size 18350080
diff --git a/params_shard_113.bin b/params_shard_113.bin
new file mode 100644
index 0000000000000000000000000000000000000000..465eb3994248c51feb24656d88c369328c33f6bb
--- /dev/null
+++ b/params_shard_113.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6cf6d7ecf6d40b8a6028ba4ac52fd23b1231f88cfe8f20b05cae7d053957e0b9
+size 20760576
diff --git a/params_shard_114.bin b/params_shard_114.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2e7ae4b0f09966cffb1cbd63469157e898709345
--- /dev/null
+++ b/params_shard_114.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bcfa75eb0c29dcd98c709107cfb3e2ba9f4ab5a4f4df1ac279f14fdfbe0d55bf
+size 141557760
diff --git a/params_shard_115.bin b/params_shard_115.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9ad28923271b18fd3e9d4803657906ea67437c80
--- /dev/null
+++ b/params_shard_115.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2a154b6f0b33c5f33fdd0691a06abcc229e9722926fbdfffe2e2127b0f4b9c2d
+size 70778880
diff --git a/params_shard_116.bin b/params_shard_116.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6680d3f95fa8eb58f53b223c6572dd607d64dd45
--- /dev/null
+++ b/params_shard_116.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5cdb2c92c5f419ddf273334bdd4d8e7708ec6f5d816fae36c48ec988222a0f29
+size 18350080
diff --git a/params_shard_117.bin b/params_shard_117.bin
new file mode 100644
index 0000000000000000000000000000000000000000..82133400d49cc99f17463431d8663a7abdeb7405
--- /dev/null
+++ b/params_shard_117.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6488a7ecee6aa2ee5e1b6e0e2720c3399b59cdfb873b8fce00ce0ce8cec5235b
+size 20760576
diff --git a/params_shard_118.bin b/params_shard_118.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c151f72df725d7d3fe1dddc0025ef49442a06bb4
--- /dev/null
+++ b/params_shard_118.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c349e846e99d8779cc52c65cdb2b4bd8d80310b9bba37459c7d622368fe8e451
+size 141557760
diff --git a/params_shard_119.bin b/params_shard_119.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e564e4e2dcfc628802d73d4543232e7598db8882
--- /dev/null
+++ b/params_shard_119.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f2a99f3543047424a610b8ee7bbaa56d9cd4c7d0476665523f840299ec29ec3c
+size 70778880
diff --git a/params_shard_12.bin b/params_shard_12.bin
new file mode 100644
index 0000000000000000000000000000000000000000..08193dad9b487de1d7f1946d9ab3b9532c8c6010
--- /dev/null
+++ b/params_shard_12.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:63727b903b641c05cf6175d84d8872d510ab9671f51a32ffbf26332a3b2f0ea7
+size 18350080
diff --git a/params_shard_120.bin b/params_shard_120.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1ce267eac68e979ec27e3e7b528c0fbafa3248ed
--- /dev/null
+++ b/params_shard_120.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b70c0a12e89f13310b87a373aaf2349cd2292edc7835c0404542e4385a748bdd
+size 18350080
diff --git a/params_shard_121.bin b/params_shard_121.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8487f6390b2bc161d2094cc2cbb0b73e6811e22a
--- /dev/null
+++ b/params_shard_121.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bbcc5bcc8b315cd1a42b885187e3fb00f7e88d2b365814882faad33ce09fd6f6
+size 20760576
diff --git a/params_shard_122.bin b/params_shard_122.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e34bb9262df81329219423aef619ab1a345c063f
--- /dev/null
+++ b/params_shard_122.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:845443a0ee172b2fa30797a824405d823aca132d8fb01ac1d365a1f24ddc3daf
+size 141557760
diff --git a/params_shard_123.bin b/params_shard_123.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dbdfb8c5d2af4447ad9a47b18dbe7d3c1e07829b
--- /dev/null
+++ b/params_shard_123.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:82ca9b47b15a81b40a5a55779c952fadaaaac31783f3a99fb11c58d437cf1581
+size 70778880
diff --git a/params_shard_124.bin b/params_shard_124.bin
new file mode 100644
index 0000000000000000000000000000000000000000..449b1a70b2409b95f17ffaa9ad23897ae75c6840
--- /dev/null
+++ b/params_shard_124.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:29f0e117fd70d107a59120d0ba96caa83459a6e2ba8e379e267a639593a7f20b
+size 18350080
diff --git a/params_shard_125.bin b/params_shard_125.bin
new file mode 100644
index 0000000000000000000000000000000000000000..72ebcb91f147b56403c8464e50762cef837016fa
--- /dev/null
+++ b/params_shard_125.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bb6eb60134374036e2f76dd886d279f69c7ba0fd2f3648f4f515fcda7e2c1ec8
+size 20760576
diff --git a/params_shard_126.bin b/params_shard_126.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5508dfda7c796df8f814a2c63482b64f82888b88
--- /dev/null
+++ b/params_shard_126.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dde73603957a8b3c4446ae51bf16a9b475781c05331cbd722a149452b0dc44e5
+size 141557760
diff --git a/params_shard_127.bin b/params_shard_127.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f7b46eba8b32774786bf1c550efebfb3aad50510
--- /dev/null
+++ b/params_shard_127.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:18fd9bb801177aa13f0ce0942744ab7bc9dfe56395b87b68fd5986cad6b07ba2
+size 70778880
diff --git a/params_shard_128.bin b/params_shard_128.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1fc51b50527f3d543724ec2e64557842f58d8502
--- /dev/null
+++ b/params_shard_128.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:acc107cc06d62cc6b062df689767a82ef886ad8a50183b0e07461dca35fe6f46
+size 18350080
diff --git a/params_shard_129.bin b/params_shard_129.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3c5daae2493da2deadeda4d3c6dd2805e48191f2
--- /dev/null
+++ b/params_shard_129.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d741339cf2efe07c3572204faef5a64c690ed18819304df7dc3e19025be5f3cb
+size 20760576
diff --git a/params_shard_13.bin b/params_shard_13.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ffe1eaecfa4bcb7079a3301742c19ff4f2cd9ec7
--- /dev/null
+++ b/params_shard_13.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ea6608fee0857359400b1d17eabd87594b131eff6dfc4d7892782c89861a37a3
+size 20760576
diff --git a/params_shard_130.bin b/params_shard_130.bin
new file mode 100644
index 0000000000000000000000000000000000000000..419208e547e3ce068d898b3d2f56271559a5e690
--- /dev/null
+++ b/params_shard_130.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2f172bd1deadcdb2a6457c64b2fe7a4b163fdd7cabd16431cdae2aa3a997dfb3
+size 141557760
diff --git a/params_shard_131.bin b/params_shard_131.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f91aa7b4b552fb3e74d9f901856fa03dca69b8f0
--- /dev/null
+++ b/params_shard_131.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:41312d9fcbcfd14a2c32b117999f79529caf00202278fc2c0916166002de14d2
+size 70778880
diff --git a/params_shard_132.bin b/params_shard_132.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b8e7cbf8957d581e358bed27619476f8f71eec87
--- /dev/null
+++ b/params_shard_132.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b4731c4d60bddc30f18ca0243eed8e9e0188100dcaf20f0d9fd716bd64fae8e9
+size 18350080
diff --git a/params_shard_133.bin b/params_shard_133.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1421a14ea249d4c419540289455f8311299db334
--- /dev/null
+++ b/params_shard_133.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5fc517df65134bf159c6a6f03eac76e98916d0216156dce910e5b9dc6be6b5d3
+size 20760576
diff --git a/params_shard_134.bin b/params_shard_134.bin
new file mode 100644
index 0000000000000000000000000000000000000000..16ea7305fc4c3297b43fff7b56267aacf2568eec
--- /dev/null
+++ b/params_shard_134.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c6790dc7789788ca967e33d6287a1ca29f09bd20f028a004890f66c4808854cb
+size 141557760
diff --git a/params_shard_135.bin b/params_shard_135.bin
new file mode 100644
index 0000000000000000000000000000000000000000..601f7866947abee4e1769d14410b37b08eac98e8
--- /dev/null
+++ b/params_shard_135.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a3641de8d707728a58b013ef027f14f79a08995188ce94065bc97904bd59668c
+size 70778880
diff --git a/params_shard_136.bin b/params_shard_136.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e729aee6221bc284e66402d099074d2790904cdc
--- /dev/null
+++ b/params_shard_136.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:381b683b3a91d547dd8417bf0ecc646658710192827fde3b4d9ca29ed8158986
+size 18350080
diff --git a/params_shard_137.bin b/params_shard_137.bin
new file mode 100644
index 0000000000000000000000000000000000000000..665421140e73ab0ddecf066e06a178b7f9b3b583
--- /dev/null
+++ b/params_shard_137.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a38cb226bcba04ea153fe73819c0d27ef0c1017896bd2d793ced8bcc64bac6e5
+size 20760576
diff --git a/params_shard_138.bin b/params_shard_138.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5ca27401ac925092a43657cbbecb52442dd25a1e
--- /dev/null
+++ b/params_shard_138.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3f3a34f0dd34b79852f4dc046056b2937c80e8cafb3cbf7c14b2d55db4b51826
+size 141557760
diff --git a/params_shard_139.bin b/params_shard_139.bin
new file mode 100644
index 0000000000000000000000000000000000000000..edd258db33a816ebc35e96dc2ff548b029da8f3f
--- /dev/null
+++ b/params_shard_139.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:84ffd185b0a54d00dc12821ec26b3064a28d5e29ed8b1dfa9d1f40a7672524f8
+size 70778880
diff --git a/params_shard_14.bin b/params_shard_14.bin
new file mode 100644
index 0000000000000000000000000000000000000000..aa923656147477e278a9beec762aaaf1e839d0bc
--- /dev/null
+++ b/params_shard_14.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:eb5548a3f33e3e193df1aba79bab3f966ff38549d51e31282a6c1e02822727f7
+size 141557760
diff --git a/params_shard_140.bin b/params_shard_140.bin
new file mode 100644
index 0000000000000000000000000000000000000000..08982c3b0e4053d791c09e5d7cb0cab1c56bc723
--- /dev/null
+++ b/params_shard_140.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e38d75c50036b877e83d9caaf5b847526d53494c25659efe3a46f26688eb1237
+size 18350080
diff --git a/params_shard_141.bin b/params_shard_141.bin
new file mode 100644
index 0000000000000000000000000000000000000000..29c5ce9762862841fc1d0c6cd283b8e6825013d3
--- /dev/null
+++ b/params_shard_141.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:694381a0b4eb98a8e38b447fd10d71d20d5599ce194b2fa0e81d3f58e27575b7
+size 20760576
diff --git a/params_shard_142.bin b/params_shard_142.bin
new file mode 100644
index 0000000000000000000000000000000000000000..36141b2793c5c1dd902f04b5634665cf3fddb334
--- /dev/null
+++ b/params_shard_142.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8765ccc8142176ea5dd151978e5259b7c528bf552befb33a6350367b88af7d48
+size 141557760
diff --git a/params_shard_143.bin b/params_shard_143.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1db46110f1e5a2833b3838450e64656eb1a1b55e
--- /dev/null
+++ b/params_shard_143.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8aaef5110cd4262eb5c97f4223d40ca4043da009bf51e359837173669cb7549c
+size 70778880
diff --git a/params_shard_144.bin b/params_shard_144.bin
new file mode 100644
index 0000000000000000000000000000000000000000..72f2133c4c816d62e9a567dd8e0965852f2a7bee
--- /dev/null
+++ b/params_shard_144.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f4df91cc988ed8ddbfeb0170f2ddd6d99eeb344b3aeb37becce7e17e21f497aa
+size 18350080
diff --git a/params_shard_145.bin b/params_shard_145.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cf5972fa74f809eb19d1f4bd61dc8c61da14b6af
--- /dev/null
+++ b/params_shard_145.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:166bf693edc418462ad6570e82e19996139336654f3ec4feeb20eb5bb62e40b0
+size 20760576
diff --git a/params_shard_146.bin b/params_shard_146.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b549e7b6252bc5ad3eb220052241da4b5460fb05
--- /dev/null
+++ b/params_shard_146.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6db2b80aa6f53835334649667d1389fb174a49a94feaca43014e014c1b8e4540
+size 141557760
diff --git a/params_shard_147.bin b/params_shard_147.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a0aec4843955fbae167a6954a6a1b06be722dd86
--- /dev/null
+++ b/params_shard_147.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:615f7f6d7645743d910dd193503d0cfee365e57567e4445aebd7162a39e73098
+size 70778880
diff --git a/params_shard_148.bin b/params_shard_148.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f058316525638c7a7bd6886a755f5b7df5b987de
--- /dev/null
+++ b/params_shard_148.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:32ef95cd4a5f8401eb26ceeacdde50425b0e445013f230b210ec880247f20bcc
+size 18350080
diff --git a/params_shard_149.bin b/params_shard_149.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3031ec6030cfad6fb735a5b1a952e9f53bef7673
--- /dev/null
+++ b/params_shard_149.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9d0380e0eeb586a520b6342661be6375c61f9fecc11287de168264e4c640b20b
+size 20760576
diff --git a/params_shard_15.bin b/params_shard_15.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f949c97eec3e70bed4138bd74daa649bd6cb70ce
--- /dev/null
+++ b/params_shard_15.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e747737f72829c2f66c4ca4eb59af5e1970a1eac3f0f3d69c3259831d3eb970b
+size 70778880
diff --git a/params_shard_150.bin b/params_shard_150.bin
new file mode 100644
index 0000000000000000000000000000000000000000..54dbff2cd1be645171d531226f07bdef4a05321b
--- /dev/null
+++ b/params_shard_150.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3c3731c27ab41d5726904f84cf24691b2f34891c09304702695245fb89006197
+size 141557760
diff --git a/params_shard_151.bin b/params_shard_151.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2a2688f3c6e1af96362f381467d8ba1940604532
--- /dev/null
+++ b/params_shard_151.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a18b67238f381ac0518afdfb8d3d68521809cad679bc98b770e7e6cdfc110ea7
+size 70778880
diff --git a/params_shard_152.bin b/params_shard_152.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fd9849088ff56c7f85597bb13528a3f51e37ca7d
--- /dev/null
+++ b/params_shard_152.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b1fe1ea2805284f0428a5f13bbcc0245108be8d690afd1e03e5a8411bbb64896
+size 18350080
diff --git a/params_shard_153.bin b/params_shard_153.bin
new file mode 100644
index 0000000000000000000000000000000000000000..750ed639d131e81130f4b8949e536b6a5046bdf9
--- /dev/null
+++ b/params_shard_153.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b9b7c69be96e1a9c18ed9d1f3da03c9399027b00a2f2925c6a5e180749a7e293
+size 20760576
diff --git a/params_shard_154.bin b/params_shard_154.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dbf7199610d232b9f0d388956ac21627ba62fba9
--- /dev/null
+++ b/params_shard_154.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:46a270f8093103a5134b8fc337ec1559f3a98bafb9bab341bd7fa421ea3616fb
+size 141557760
diff --git a/params_shard_155.bin b/params_shard_155.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b0a7ff95bddc5f178df27aa0d2780f730719573e
--- /dev/null
+++ b/params_shard_155.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:df76920de2978e0bf631bc946a448880575d57d4c7f0b3712715ae5a9c5ed7ef
+size 70778880
diff --git a/params_shard_156.bin b/params_shard_156.bin
new file mode 100644
index 0000000000000000000000000000000000000000..53b9aa505a8c4e769170a69c2de740f224a973b0
--- /dev/null
+++ b/params_shard_156.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7f37e50aed65383ee43ccc7c0e43423ff91250f96d896cb3867d1b120e9d26d6
+size 18350080
diff --git a/params_shard_157.bin b/params_shard_157.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f8597396e42b56eb09c4e949c63a497556af6e55
--- /dev/null
+++ b/params_shard_157.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0bf1c6cbf1cf06a06196911bdf780b84f4c0ae9469b4aa0dc87b2585d4a8be34
+size 20760576
diff --git a/params_shard_158.bin b/params_shard_158.bin
new file mode 100644
index 0000000000000000000000000000000000000000..666cf5adb041b42fd9864c1febdd966c19f131f3
--- /dev/null
+++ b/params_shard_158.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e33ef6de52acd66a8bfd6e456de9fadba72720157d4b1ba8bf15ae6a2e2b2ffd
+size 141557760
diff --git a/params_shard_159.bin b/params_shard_159.bin
new file mode 100644
index 0000000000000000000000000000000000000000..44899d059cd508494e8d8d597d81180eb124b945
--- /dev/null
+++ b/params_shard_159.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:269bcef3e692302caac33b5e6306f3d8c6d2f14345018cb86e102cfdfa506ae0
+size 70778880
diff --git a/params_shard_16.bin b/params_shard_16.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d17145e28b47e4c9568c0831f2dd74ee9e148ba6
--- /dev/null
+++ b/params_shard_16.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4ff684822f293129fdf9c5f6bad3306e39cfc089f1ca5077f212f845da9d1cdf
+size 18350080
diff --git a/params_shard_160.bin b/params_shard_160.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e677907a4aff2ba793fc65b1821ceb26def7095b
--- /dev/null
+++ b/params_shard_160.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dd3d343f0bcc6c3cc6f76d0a3c09a304fb83c959a21e2751d1d73a2e6e75e813
+size 18350080
diff --git a/params_shard_161.bin b/params_shard_161.bin
new file mode 100644
index 0000000000000000000000000000000000000000..85af16b4bb30f72ecf6de984a4f4d7c0b6c4b840
--- /dev/null
+++ b/params_shard_161.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:542d5ca0bd1929b03daa8643ee91c4c8d14a9c240b29ae478e556f480968c699
+size 20760576
diff --git a/params_shard_162.bin b/params_shard_162.bin
new file mode 100644
index 0000000000000000000000000000000000000000..35654217883998ff2a5c71683c45068f427029b3
--- /dev/null
+++ b/params_shard_162.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7308fd37e5837e504a7279b417e0d1c23dbb36591c77c468063b6d0b2519413c
+size 141557760
diff --git a/params_shard_163.bin b/params_shard_163.bin
new file mode 100644
index 0000000000000000000000000000000000000000..66d02682f9a37f51adfe3062d3e06439212c4141
--- /dev/null
+++ b/params_shard_163.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f6bdfe790055676c70457e7577fa5c1716a7a961c2f8cf370e651e83224ac1f5
+size 70778880
diff --git a/params_shard_164.bin b/params_shard_164.bin
new file mode 100644
index 0000000000000000000000000000000000000000..76354d8780e2c012b7c1b62332110d8774d82a4c
--- /dev/null
+++ b/params_shard_164.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:714750d31d7545ee6cdafee297ac4f1d8563cc93fef97ec52950034084f02805
+size 18350080
diff --git a/params_shard_165.bin b/params_shard_165.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2f04b027a341d72945dcfcb48d679fa5e5a9b9a4
--- /dev/null
+++ b/params_shard_165.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5f84e9f3382487ef60aaebb4829249082a73b1ae420c19becb448645a2a18457
+size 20760576
diff --git a/params_shard_166.bin b/params_shard_166.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2271074bcfd32bdb844898a89b1a029503f39cc1
--- /dev/null
+++ b/params_shard_166.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9e5abefbb5a3b381b378c39332d240c21f0675f29a47a6b69391df0c87731b63
+size 141557760
diff --git a/params_shard_167.bin b/params_shard_167.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a1639cbd412d19007929855ce079b27374f3738f
--- /dev/null
+++ b/params_shard_167.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:121b8c568a6737e0ad5523a1c5d112bed0de05894bbf9fab5fb906ce0fee1388
+size 70778880
diff --git a/params_shard_168.bin b/params_shard_168.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a181f87552763b44652ea6bcf1290f5a69e1d978
--- /dev/null
+++ b/params_shard_168.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0ebbf306f259e688f9e191dbed48dba6785078701d33a7344432f812defba1ba
+size 18350080
diff --git a/params_shard_169.bin b/params_shard_169.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2098c2aa1cac8c51ae9190c15ce860637d27b4a0
--- /dev/null
+++ b/params_shard_169.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:15eb8bc971b56884b21a82eb27950fab03cf32d090ed4002972f399dae7d1443
+size 20760576
diff --git a/params_shard_17.bin b/params_shard_17.bin
new file mode 100644
index 0000000000000000000000000000000000000000..76bd042691859e0924c89ac9a8068d5b648c7f72
--- /dev/null
+++ b/params_shard_17.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4366241915bdea21e6dd0b11617d0aab07da8d5d92e7c64c307044d468c24144
+size 20760576
diff --git a/params_shard_170.bin b/params_shard_170.bin
new file mode 100644
index 0000000000000000000000000000000000000000..53f119b492cb0821d9b336eaea10f83e77c54aba
--- /dev/null
+++ b/params_shard_170.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bbf49b3ac8569c19edebd65d5b0b3bdbaf7de24f3e71b48bc8932142e3c7a254
+size 141557760
diff --git a/params_shard_171.bin b/params_shard_171.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7e0a8040f16893037a986fc017000fd6ef4c3889
--- /dev/null
+++ b/params_shard_171.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:37f73192e6255ecbac164d6bbc25cca7a4f4c61a25c1e836f5c12b2331092f64
+size 70778880
diff --git a/params_shard_172.bin b/params_shard_172.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dd7b2a76f384d8ec6c351454d6011c3a3ab46718
--- /dev/null
+++ b/params_shard_172.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e1297109efba620ecaaaf5e2fa2bd10227595c837975b2640209af0e2290bb93
+size 18350080
diff --git a/params_shard_173.bin b/params_shard_173.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6c7d9aed8498452aa0b32a87a98b31a001644ab7
--- /dev/null
+++ b/params_shard_173.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:780794af7d045bd3a5dc651bdd9b6b75611296aea8a6eb0c563044d7961b2deb
+size 20760576
diff --git a/params_shard_174.bin b/params_shard_174.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d5de6a0972502b75fe42c470896dfd106b8bfe09
--- /dev/null
+++ b/params_shard_174.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a03ceeec34baeed76e69678d1e5789272ad4a738193eb959fa0c5ed410cfab32
+size 141557760
diff --git a/params_shard_175.bin b/params_shard_175.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c08454c944a911dd22ed6202a163fc80fbb5ffaf
--- /dev/null
+++ b/params_shard_175.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:68de6dd0124e65ca3eddee53894c0a32e64178b6fed6caf32b9e74de7ee6b7df
+size 70778880
diff --git a/params_shard_176.bin b/params_shard_176.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2a59100c314699e8c18223d9cfd9bc9fd314be5c
--- /dev/null
+++ b/params_shard_176.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fc9359797de4721a71c23b8a71537278ac5af9d493b6b95250bf11f120441577
+size 18350080
diff --git a/params_shard_177.bin b/params_shard_177.bin
new file mode 100644
index 0000000000000000000000000000000000000000..245df681c0fa4123e2dcf26c52202bb732ebf4a6
--- /dev/null
+++ b/params_shard_177.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9864b7efb4b919ce3be3fb33dbf5438d8f5a5b361d1b5526c561d35011680318
+size 20760576
diff --git a/params_shard_178.bin b/params_shard_178.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ea5024481d840bd6e883963911e0e787f5b17f0f
--- /dev/null
+++ b/params_shard_178.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d57a6e45a1995ee3b0c168d0e6d19110c35a1475ff57cf0216e65d1b32ba78be
+size 141557760
diff --git a/params_shard_179.bin b/params_shard_179.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0ada68f68b090f2b73c6b505d1d59cf3410edff7
--- /dev/null
+++ b/params_shard_179.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fdfb2e1d90870e99dcb84ae2cc2cc2c7f9ee7f11006206ba31873a44e08d97ef
+size 70778880
diff --git a/params_shard_18.bin b/params_shard_18.bin
new file mode 100644
index 0000000000000000000000000000000000000000..80096e0705e33756b4a28bdc600665426afabced
--- /dev/null
+++ b/params_shard_18.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ac476d0cd024365b788a13eb3bad636355d589de515ba4744484ea736414c91b
+size 141557760
diff --git a/params_shard_180.bin b/params_shard_180.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5306f188f648a5336fe8ca71cc10c4b88164f536
--- /dev/null
+++ b/params_shard_180.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e45b7841b3e34be9969d95f57855d8caad91ed7f31281fc3749c32193a564896
+size 18350080
diff --git a/params_shard_181.bin b/params_shard_181.bin
new file mode 100644
index 0000000000000000000000000000000000000000..821538fea4167479e5e55c8fc29d2cd9c545d271
--- /dev/null
+++ b/params_shard_181.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5b7386b6bdc358424bd50a666a66657ff03272cc6b6a7e2f2f46b198f16dc2d4
+size 20760576
diff --git a/params_shard_182.bin b/params_shard_182.bin
new file mode 100644
index 0000000000000000000000000000000000000000..abbf84e71c58e484bb3a5ad6b225c8531ebb8578
--- /dev/null
+++ b/params_shard_182.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ccdc48ac5d5bfdee8fb2f831325c0d282791aa9e966a6c376ae6c07db6a67358
+size 141557760
diff --git a/params_shard_183.bin b/params_shard_183.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3c0f7c91257fe776b8bbd76beb5948753338ccf1
--- /dev/null
+++ b/params_shard_183.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:eb5872409c3150879b18cd44f6f5d69c48185577041b6c019650175a6ac34b21
+size 70778880
diff --git a/params_shard_184.bin b/params_shard_184.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d4271a69d40246edda68bfd28f27a5f7c6fc607d
--- /dev/null
+++ b/params_shard_184.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ad9c3d1cce1319dc18153bfa02787b2a81b443ee4e73957848753e4915266a5d
+size 18350080
diff --git a/params_shard_185.bin b/params_shard_185.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b4973a7f0ded5ab5143815d5e161313b0c061046
--- /dev/null
+++ b/params_shard_185.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b7a8d4b409f9c4e9146f3dc49045ec094b3ba09daab6ff1a51d7ba397400e4bc
+size 20760576
diff --git a/params_shard_186.bin b/params_shard_186.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a32843b5977093293894bbff2070cb5cef0af53d
--- /dev/null
+++ b/params_shard_186.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cf8e2c055ea4bb00cb2daf27ec4f097e68c38abb47314f5ec996ef27f780f649
+size 141557760
diff --git a/params_shard_187.bin b/params_shard_187.bin
new file mode 100644
index 0000000000000000000000000000000000000000..678087310ccb29b438594cafb6c438ce8990a1d3
--- /dev/null
+++ b/params_shard_187.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:84fbf2a156836e055d3ccbdb7053390e7fd54e5a99dc49df4d1bdfed161d825a
+size 70778880
diff --git a/params_shard_188.bin b/params_shard_188.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c52653c39a342cb700384d1ce37b44ca4347cfd5
--- /dev/null
+++ b/params_shard_188.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:70b147da6badd6ef38e6c88d9251be46021e7e18c91e0c41ea835a6e21c4fe30
+size 18350080
diff --git a/params_shard_189.bin b/params_shard_189.bin
new file mode 100644
index 0000000000000000000000000000000000000000..642275c67b34dd127485a653cbd87258199dc27b
--- /dev/null
+++ b/params_shard_189.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:92b2384d0f0878aa8281332aaac41fb647db5127871f0e7639faecaaa7283f44
+size 20760576
diff --git a/params_shard_19.bin b/params_shard_19.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f2abfe94b85c48d3bb54cfad7bacad1372876dc3
--- /dev/null
+++ b/params_shard_19.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7399212f2a3fed4022ec0102e23e92334c76b1ba21644b403eb80e08acbee122
+size 70778880
diff --git a/params_shard_190.bin b/params_shard_190.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8f4676e1ef78811ffe26b8669830be28ceec872b
--- /dev/null
+++ b/params_shard_190.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2656a2b584699d650834a898294b4f05a9929dad51bfe56611ebe1dfbe74009d
+size 141557760
diff --git a/params_shard_191.bin b/params_shard_191.bin
new file mode 100644
index 0000000000000000000000000000000000000000..670ed9ef37d75750d0871a9f822422a8c3d24969
--- /dev/null
+++ b/params_shard_191.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5172622c082346c67ac63b8ae52e6a1882708583b388b8427afff48bdfe3616f
+size 70778880
diff --git a/params_shard_192.bin b/params_shard_192.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b05cdd9938071e14558118041d703364930a6ebe
--- /dev/null
+++ b/params_shard_192.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:224793e4a10d4ad37f0265839ac76cf83fcab2fc152ce736472c33d53534cc95
+size 18350080
diff --git a/params_shard_193.bin b/params_shard_193.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9ff8ce04c7f9c5b898603e7e790e32761d1e417f
--- /dev/null
+++ b/params_shard_193.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:13be8aa8787916d1ce94729afa673f072c538c229d490b98e794742537539261
+size 20760576
diff --git a/params_shard_194.bin b/params_shard_194.bin
new file mode 100644
index 0000000000000000000000000000000000000000..951b17ba20c8acf45118713d77602e61c2e28a0f
--- /dev/null
+++ b/params_shard_194.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0053723d7df4854d2195163f9fbd9132009792657914a544f6e5c52ef578a15f
+size 141557760
diff --git a/params_shard_195.bin b/params_shard_195.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a6255331f6517824037ef8a0c70db2052b8db0f1
--- /dev/null
+++ b/params_shard_195.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7db5b5b0001bc970dc875b0d779b8714ce5171f7f54b0d35af697437f6669bab
+size 70778880
diff --git a/params_shard_196.bin b/params_shard_196.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d12f10d018b3d9cb2cefadd85b5c8e5c3c2a3041
--- /dev/null
+++ b/params_shard_196.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:39601f7aee9e55a0bdebdeaa2be4018e17fff657aaa498f1abda487942d2adc5
+size 18350080
diff --git a/params_shard_197.bin b/params_shard_197.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1221dc2ea80e35c7603f91e0bd4bb7c8f92f8cd6
--- /dev/null
+++ b/params_shard_197.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:88db75819fe68316b6a806461303fa21c59094c975ef9c0ed15a4c64d6370a99
+size 20760576
diff --git a/params_shard_198.bin b/params_shard_198.bin
new file mode 100644
index 0000000000000000000000000000000000000000..462a3461a2bf9627a0e2cc7ba4f0dfd3c6c2ab28
--- /dev/null
+++ b/params_shard_198.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ef2cd31fff5df360579a3e392297c8ad55f36c33bcce6cc283a0ac2882f7215f
+size 141557760
diff --git a/params_shard_199.bin b/params_shard_199.bin
new file mode 100644
index 0000000000000000000000000000000000000000..924f5135031f3899d938b209e8197a2d731ca31a
--- /dev/null
+++ b/params_shard_199.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7df84acc1691e1fe9c510993591036cff19bc9156feb5b4cccc401c3f72cfcd0
+size 70778880
diff --git a/params_shard_2.bin b/params_shard_2.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3b92ac5c5bd6e54da627e1496ac983169b549fb5
--- /dev/null
+++ b/params_shard_2.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bebdfbc23b7495127361ee616f0909c67354fb79e44050e5b98235f825ea5fa6
+size 141557760
diff --git a/params_shard_20.bin b/params_shard_20.bin
new file mode 100644
index 0000000000000000000000000000000000000000..016490285d560859c9f8c9b2531f3dd0366140af
--- /dev/null
+++ b/params_shard_20.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:40a06348b8a4e1b8296ee768873473dcac414490672873196891c9e8b19fabf6
+size 18350080
diff --git a/params_shard_200.bin b/params_shard_200.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e371153cc4f72122312a3af5d916d3d847863589
--- /dev/null
+++ b/params_shard_200.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:168bee2dc8b76582709abbc29dd49901017a3b8a84779f728db90353128fb6bd
+size 18350080
diff --git a/params_shard_201.bin b/params_shard_201.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5730ae9820a31b183a88efd3d888590826585676
--- /dev/null
+++ b/params_shard_201.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b0666b8bb2ff4e29b2f06076cb94a26b14a4cf4354d9f8f9fbaf0b9665904174
+size 20760576
diff --git a/params_shard_202.bin b/params_shard_202.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7bde6b1323a601bcf0b4e42bfea7c5673118c4b7
--- /dev/null
+++ b/params_shard_202.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:abb9d81b6f1ac3aadc93bb6bad667930344411dabba5bc4d1a0c8dfde9b3faa7
+size 141557760
diff --git a/params_shard_203.bin b/params_shard_203.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1e2388409f0672a312063f9bd3ac9593c8255e44
--- /dev/null
+++ b/params_shard_203.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:84f6fe2213a150ae6f3db7cd9bb539ce8af8cc6e9d88a8e2978719690ea443dc
+size 70778880
diff --git a/params_shard_204.bin b/params_shard_204.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5c1d2421c97e5f318e5079fc4b4ade2cc7d17b77
--- /dev/null
+++ b/params_shard_204.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c35daa3361bedf908740bd92960a8bf2b77bf67e98ca1e4e18c6d150541cd896
+size 18350080
diff --git a/params_shard_205.bin b/params_shard_205.bin
new file mode 100644
index 0000000000000000000000000000000000000000..51abdef7f4ff8da280b0f2a6b441dcae7c839d7f
--- /dev/null
+++ b/params_shard_205.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:aca3b2e56db5dec8e29b06f48e59fce3be2022db2537e2505888b49890c233da
+size 20760576
diff --git a/params_shard_206.bin b/params_shard_206.bin
new file mode 100644
index 0000000000000000000000000000000000000000..de22f52b42d2af1163eb416bdc3f98289c3a14e6
--- /dev/null
+++ b/params_shard_206.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1360c264e76525d9d9165aefde52306d0147f61db4d7085b97e6a5efa57d1931
+size 141557760
diff --git a/params_shard_207.bin b/params_shard_207.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4cd281d7c6e7b08c009e6cd9166fb5a6bdc2fc5b
--- /dev/null
+++ b/params_shard_207.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f1f1204b183824217ecab501cf8473ae2204b2ebb0febe2a7b1336e486eb871c
+size 70778880
diff --git a/params_shard_208.bin b/params_shard_208.bin
new file mode 100644
index 0000000000000000000000000000000000000000..92b72493dc104e22970bb0ac22a8401ca81fda50
--- /dev/null
+++ b/params_shard_208.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:37fa67d3105bd2b1a17e76911f7e1bfb60ad31a70813746bc01d0758c931124c
+size 18350080
diff --git a/params_shard_209.bin b/params_shard_209.bin
new file mode 100644
index 0000000000000000000000000000000000000000..67745de6a40c5f195949aa3d07153a59beeefe46
--- /dev/null
+++ b/params_shard_209.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c96ff5213d6f10f5ad47405dd741e0a15c363ce3237e66f5bd3572aca3896247
+size 20760576
diff --git a/params_shard_21.bin b/params_shard_21.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a7eb03d6f782f6c5a8d515fde457116694796561
--- /dev/null
+++ b/params_shard_21.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8e166df6eb3b584ee7624a7d2e967cf59d42449ac35d94ddc3a15dbfba3fae74
+size 20760576
diff --git a/params_shard_210.bin b/params_shard_210.bin
new file mode 100644
index 0000000000000000000000000000000000000000..15bfaf1f0520416b48f16b787ecae5c65eea2ca1
--- /dev/null
+++ b/params_shard_210.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:49b2d698ad83c130f6f00db38868994a5cd0f46c47b301f75398a476468a502d
+size 141557760
diff --git a/params_shard_211.bin b/params_shard_211.bin
new file mode 100644
index 0000000000000000000000000000000000000000..72e83dc765514cd06c84d0f4ca1bcae4e0dcc74d
--- /dev/null
+++ b/params_shard_211.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4d228a91fa83c4debe4ef565e3e3aba4f3103d18cc4c3bf36d77f0d989a0769d
+size 70778880
diff --git a/params_shard_212.bin b/params_shard_212.bin
new file mode 100644
index 0000000000000000000000000000000000000000..541b6fe99ead280d5a6d78f64aee45e2555ca002
--- /dev/null
+++ b/params_shard_212.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:86775d675ea1f305406797965ec362f80d4b5d67f9a428b686bb9769cca16392
+size 18350080
diff --git a/params_shard_213.bin b/params_shard_213.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4a9ce3741c9a773404c45c3cdba0c3a1b6eb4294
--- /dev/null
+++ b/params_shard_213.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:96283ce32b5f95eb39541a5974509def91dc158c020624eaf0f5e863cf8a60d1
+size 20760576
diff --git a/params_shard_214.bin b/params_shard_214.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cf2a6eb1e50a888dd00759445281dc0160c320ac
--- /dev/null
+++ b/params_shard_214.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:60d5d3957656618d70a1af83ff216cf4102b7cf67d3e84b218acfb496bfb1ada
+size 141557760
diff --git a/params_shard_215.bin b/params_shard_215.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e08ccea4860374ad723e432c0281e67af0b5c5e0
--- /dev/null
+++ b/params_shard_215.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:104e6e7e2433e996076ba7d413a9b650a444c24eb16cf83584203a568a1807c3
+size 70778880
diff --git a/params_shard_216.bin b/params_shard_216.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bf5a8ecf96bfe923be3548dcdcc4ea186e04f36e
--- /dev/null
+++ b/params_shard_216.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:43b639282477f15a16b3134e3a2324bbfe85bc7c750c133b2f1cd062aaa63dd6
+size 18350080
diff --git a/params_shard_217.bin b/params_shard_217.bin
new file mode 100644
index 0000000000000000000000000000000000000000..15df76111b24dc6770a97aa1a3392b96ef1e98c0
--- /dev/null
+++ b/params_shard_217.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6f388dcdc3dec37b0b7c16c5c05d053ba590a4dd34cf6c97b56b7986b68372e9
+size 20760576
diff --git a/params_shard_218.bin b/params_shard_218.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6648a717a8bafdf5100732a28c7e23e920a2146f
--- /dev/null
+++ b/params_shard_218.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e9fd200ffba09a99c0d11e1b89a8b7dea34caf21ad5a424ac76350602fdb86b1
+size 141557760
diff --git a/params_shard_219.bin b/params_shard_219.bin
new file mode 100644
index 0000000000000000000000000000000000000000..340fc5c426164136976e5a1e7b81b968c2fc598c
--- /dev/null
+++ b/params_shard_219.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f2981bd2ec41102afcaf30c7421492667719822442802b4f65daf66f02d2ea79
+size 70778880
diff --git a/params_shard_22.bin b/params_shard_22.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d99ad8e2f22c708dcffb5c94c033f5616d6c1789
--- /dev/null
+++ b/params_shard_22.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c66e0cd32c7cc05337cfb6e07bf71871bc28e9394f57e19882e2a01c2f565792
+size 141557760
diff --git a/params_shard_220.bin b/params_shard_220.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c7566bd069a40dc2a99c704e3dcf73e508e2ff92
--- /dev/null
+++ b/params_shard_220.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:74bf1eab81be87094617451f9833eb76a878a43a8d5b498d4f5543bc7410055b
+size 18350080
diff --git a/params_shard_221.bin b/params_shard_221.bin
new file mode 100644
index 0000000000000000000000000000000000000000..eeab9041e3ba2170ce9799388f12df25101e21be
--- /dev/null
+++ b/params_shard_221.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a4fb726f05c71199a4cb8550a3a1222b261bc8145cf0f96af0fd5b4ca55c004f
+size 20760576
diff --git a/params_shard_222.bin b/params_shard_222.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ed8511f55b6f109c3b74110dd7b30dab1777da41
--- /dev/null
+++ b/params_shard_222.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9638cb4e0620110ee485a0fb9521ea0b12d808e4237eaecde4dfa4ed4e4ab8b9
+size 141557760
diff --git a/params_shard_223.bin b/params_shard_223.bin
new file mode 100644
index 0000000000000000000000000000000000000000..87992157a2a71151eb4f05ee0d1049fa1a4c9103
--- /dev/null
+++ b/params_shard_223.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c00e9b24fb6a5eb5076ca142a384e15d701879c517009c6ea62586c67b9eb060
+size 70778880
diff --git a/params_shard_224.bin b/params_shard_224.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8a870a6d1c62730b0fdf37212e76f6a290e3d93d
--- /dev/null
+++ b/params_shard_224.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:72d3a1c15eb7469a244b379fc65e2e3affc44831a54a4b06f9cdd3ebbea1827a
+size 18350080
diff --git a/params_shard_225.bin b/params_shard_225.bin
new file mode 100644
index 0000000000000000000000000000000000000000..46e583777471226b67634c3f47c2fd41740f87ef
--- /dev/null
+++ b/params_shard_225.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:63010b3a3a1d80d3579d3404e24cc7ee1b007a4c1423b11f27ab155a4df53279
+size 20760576
diff --git a/params_shard_226.bin b/params_shard_226.bin
new file mode 100644
index 0000000000000000000000000000000000000000..db6513081e3770a93ce4b7abccd68c868f6d2fb6
--- /dev/null
+++ b/params_shard_226.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:05796b919b8732738a9c92bd07c91b663048841e5e9fa311c3d39c160da5bec9
+size 141557760
diff --git a/params_shard_227.bin b/params_shard_227.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fc7434475ba7fe4d46c73f07b4f35d2cdeb808eb
--- /dev/null
+++ b/params_shard_227.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2f70eeac62d53c0719e1948d04106ab46508e4af674efdb9c9727c9751c88d91
+size 70778880
diff --git a/params_shard_228.bin b/params_shard_228.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8addf1277925f2fd5cd5f10b3d524fc38fd9f9d5
--- /dev/null
+++ b/params_shard_228.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b01edd2d484ede7800ff74e0c69cb56f1b9244bbcb5c6e40cbce8b35858701c8
+size 18350080
diff --git a/params_shard_229.bin b/params_shard_229.bin
new file mode 100644
index 0000000000000000000000000000000000000000..de5b44da42cad0a3f000b8e213939824f90ecc17
--- /dev/null
+++ b/params_shard_229.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dce09c2753e221094153d7de7b3e5792190cc180d3d1fc8225e166364f427d44
+size 20760576
diff --git a/params_shard_23.bin b/params_shard_23.bin
new file mode 100644
index 0000000000000000000000000000000000000000..de1fc91121060c68ae22722b77ee815ae27fdd12
--- /dev/null
+++ b/params_shard_23.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1439fc431a81e67c4fc8891f63d1571d57e74c37e1f5571ba2d07651c9157956
+size 70778880
diff --git a/params_shard_230.bin b/params_shard_230.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f701d23f1eeea7b754fd928e8f89f6d8f2b4892f
--- /dev/null
+++ b/params_shard_230.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1a43b69a18345b3018078f358b4365e4889d90a617e79b14ccc00cdcedcf6aea
+size 141557760
diff --git a/params_shard_231.bin b/params_shard_231.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2716e68fb71121c4dda73b1d4346955b0e51de2c
--- /dev/null
+++ b/params_shard_231.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fb215dc910e6dfe50807a9ae3fe46473b056ca5122225022796d569b52a72862
+size 70778880
diff --git a/params_shard_232.bin b/params_shard_232.bin
new file mode 100644
index 0000000000000000000000000000000000000000..98da7faec95b862c927e22c6fccdc449539563c5
--- /dev/null
+++ b/params_shard_232.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e021824f469e49e566f75e3873287a76d02567ed039819ad917a65ca5df015f6
+size 18350080
diff --git a/params_shard_233.bin b/params_shard_233.bin
new file mode 100644
index 0000000000000000000000000000000000000000..405d3c0349b6ef84a206a382da026ac9104a3ba0
--- /dev/null
+++ b/params_shard_233.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4939aa5cbaa5851c9ca382e1bba23ab4d508f14d5013c25ffe666b1441d4fa31
+size 20760576
diff --git a/params_shard_234.bin b/params_shard_234.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1bc046be2f3f278b22198c6ce8c9fb2176cb52c5
--- /dev/null
+++ b/params_shard_234.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1250af4b4f1ffbae7080c0796ac7b6146b2d41d82a2a84b3cac310ade4f709b4
+size 141557760
diff --git a/params_shard_235.bin b/params_shard_235.bin
new file mode 100644
index 0000000000000000000000000000000000000000..119354673d7752563c7e316f0cec744ea205f67a
--- /dev/null
+++ b/params_shard_235.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b907bc185816348116510bd8423c774cec1fb52677c9297a31b3d7f8fd1b74d1
+size 70778880
diff --git a/params_shard_236.bin b/params_shard_236.bin
new file mode 100644
index 0000000000000000000000000000000000000000..33c61f969f4db27a72e3227919420a708db8b104
--- /dev/null
+++ b/params_shard_236.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8b379067d3be7391226eb89db5c61edb7960d7ef9e8d4ec09ac2c1a6c61974a0
+size 18350080
diff --git a/params_shard_237.bin b/params_shard_237.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ad363c482a8386eb5add36b7c1d8e27c34869d27
--- /dev/null
+++ b/params_shard_237.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:da6efecb13a6e3f204a0beed7e11d3bc09413a993c791be30af6e163fbdfdadd
+size 20760576
diff --git a/params_shard_238.bin b/params_shard_238.bin
new file mode 100644
index 0000000000000000000000000000000000000000..72fece7fff56be0c731e71a115e74c024ce47189
--- /dev/null
+++ b/params_shard_238.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:69b0767d667e7d1ad919490d4b5071706eccc7b6652b701b844d7013f5ddf2da
+size 141557760
diff --git a/params_shard_239.bin b/params_shard_239.bin
new file mode 100644
index 0000000000000000000000000000000000000000..08bafef43dd56631fbfbf9c131b73493bdb56f4e
--- /dev/null
+++ b/params_shard_239.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b794dd48da9ce8fe8ba57f0e88baced43b287f7cb3c2bb87306cc535d0195310
+size 70778880
diff --git a/params_shard_24.bin b/params_shard_24.bin
new file mode 100644
index 0000000000000000000000000000000000000000..05b334a70458ec66b5140dfa8f3d65e5da336ef0
--- /dev/null
+++ b/params_shard_24.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:482d60a776939db37369723f6d3796c9455bb4d30fb65de0e9654402bce3092e
+size 18350080
diff --git a/params_shard_240.bin b/params_shard_240.bin
new file mode 100644
index 0000000000000000000000000000000000000000..061473dfbf88a493f881e076f422f5c2a3ae7853
--- /dev/null
+++ b/params_shard_240.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f851da271493db0fe1973d59196b9e07c2ee951916d6b3a2d721ac58b9aa0d65
+size 18350080
diff --git a/params_shard_241.bin b/params_shard_241.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ee9c88e979f0842b902703ac186cedd24c8e2b21
--- /dev/null
+++ b/params_shard_241.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:905793b3b345732118107b8c52dc6a4a4af47dd85f911ace2b86dee7e730af96
+size 20760576
diff --git a/params_shard_242.bin b/params_shard_242.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1a5e12b12d9ae3639a318898260c5c6420d8e102
--- /dev/null
+++ b/params_shard_242.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f81d9576d74874efa2587adc6778580ad7fadd8f22b29553739704d7f1aa7068
+size 141557760
diff --git a/params_shard_243.bin b/params_shard_243.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1e30fb7756d6b36cdd45a21684c06aa574e2465b
--- /dev/null
+++ b/params_shard_243.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2d1561f504e60ef1c02b7abed8a4a6aba5cd1da46da1bf6b0d582aec32f389e5
+size 70778880
diff --git a/params_shard_244.bin b/params_shard_244.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9dc09ed2a1bfbc64795838c2a3720475b35e3d4e
--- /dev/null
+++ b/params_shard_244.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:960ddd5d78eabb87295c5b5ebd095d8b057c3af6d403c2f8e788bbd2998c3e73
+size 18350080
diff --git a/params_shard_245.bin b/params_shard_245.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5444871a259b6a98fd621119adeedff5c7d9fc3c
--- /dev/null
+++ b/params_shard_245.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4c0c292d9b0f7262fe30fe791d70ac5ac1ca5b2915cd1f81b0c1807c7de6d2dc
+size 20760576
diff --git a/params_shard_246.bin b/params_shard_246.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9930481da44718776a6ea5e16ea53a2fa26c0ac3
--- /dev/null
+++ b/params_shard_246.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:19a0e02aaf0e7129daa76863418983f54177f0f803a90d32c2348db6f9ea4f79
+size 141557760
diff --git a/params_shard_247.bin b/params_shard_247.bin
new file mode 100644
index 0000000000000000000000000000000000000000..41addcc8d2a71bc82e538318ee5791b3bb5b9999
--- /dev/null
+++ b/params_shard_247.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d152d9aa8ddea1770c832edd1ad2620d6848695ced211418a6d11664dd705eef
+size 70778880
diff --git a/params_shard_248.bin b/params_shard_248.bin
new file mode 100644
index 0000000000000000000000000000000000000000..589e5cf5e47c8036ab6fae803c2678193ff15c48
--- /dev/null
+++ b/params_shard_248.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6bd1b16285acbe4ec1cddc69641297961476b40e75f61fbd9323dd109861dcfd
+size 18350080
diff --git a/params_shard_249.bin b/params_shard_249.bin
new file mode 100644
index 0000000000000000000000000000000000000000..43d850d76ccc068518b2093c7aa56fab3e946e41
--- /dev/null
+++ b/params_shard_249.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3cc5560042ccb974cc6c4dbb7eda7cb819df55631b4c248b89e03c4181347a8b
+size 20760576
diff --git a/params_shard_25.bin b/params_shard_25.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7eb6e24f51126fc208e80266a18f557ee76b210e
--- /dev/null
+++ b/params_shard_25.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5eab5e29b2703ffb8b848a0b2f5f531bec0245b04e2ff939c393aef03b7dbddf
+size 20760576
diff --git a/params_shard_250.bin b/params_shard_250.bin
new file mode 100644
index 0000000000000000000000000000000000000000..81fdf830f2795d77172a921402b7823ffff33aab
--- /dev/null
+++ b/params_shard_250.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fff5408e6dace3e04f66be8a289494d1c8f69e08d8c2e3c4d0dc13239474e914
+size 141557760
diff --git a/params_shard_251.bin b/params_shard_251.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0906e544a6a47e4734a6f45cd1a04423086c789f
--- /dev/null
+++ b/params_shard_251.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7e37b92877c5550cb3ca9160de9d43aac34f0f0a335aa4a4e71bc4b0ac165e53
+size 70778880
diff --git a/params_shard_252.bin b/params_shard_252.bin
new file mode 100644
index 0000000000000000000000000000000000000000..065ea37adc5d66de53a4844fc16b9f59959da5d2
--- /dev/null
+++ b/params_shard_252.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5d818c87c132d9c4683ff4933f40ae78a2f46465270bb94d28e623c9397b23f3
+size 18350080
diff --git a/params_shard_253.bin b/params_shard_253.bin
new file mode 100644
index 0000000000000000000000000000000000000000..53aa1150ddb0e5daf74f21e5861a1438770e53a4
--- /dev/null
+++ b/params_shard_253.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:41ca37f860b26798fc8a3e944c78c2a6d5fb311e42cb9c5c3cd2d4169ebe8648
+size 20760576
diff --git a/params_shard_254.bin b/params_shard_254.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9977c15e111bd563058352d966a5acbac55567fb
--- /dev/null
+++ b/params_shard_254.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4281fd464f1e5d2f9f4f982a4ce3100034daaae474c19c34c62ab469f94bc7ff
+size 141557760
diff --git a/params_shard_255.bin b/params_shard_255.bin
new file mode 100644
index 0000000000000000000000000000000000000000..06c3f98fb3bf28c57abf1a4206e1c5d5124e5bb1
--- /dev/null
+++ b/params_shard_255.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3684382ec7923c4d4a17644a4cf9f0e23c732b5cff9a185381bb53aa6ec42843
+size 70778880
diff --git a/params_shard_256.bin b/params_shard_256.bin
new file mode 100644
index 0000000000000000000000000000000000000000..19fc4da77a92642181d862d33cee504b96cf28e8
--- /dev/null
+++ b/params_shard_256.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d3b3adcab897bcf2e74f041a77f59f2368d608b312b3682f58eb3ebe020c621e
+size 389283840
diff --git a/params_shard_257.bin b/params_shard_257.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0f83fee726f9e6d4ddf799861633704f27ac6a37
--- /dev/null
+++ b/params_shard_257.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e33e46ddbdc054b85e6ee4d29f91def62a7d3a527ba4e818edfb3f2237c45a67
+size 32348160
diff --git a/params_shard_26.bin b/params_shard_26.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e6e2591371a8154b25907dd3d16a41e77db18d9a
--- /dev/null
+++ b/params_shard_26.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d32213fb080231fd9cac193f84557e394dbeb0a019022ccf69d45d83c404bdf8
+size 141557760
diff --git a/params_shard_27.bin b/params_shard_27.bin
new file mode 100644
index 0000000000000000000000000000000000000000..71ff269619fde141497b14bc62a3df6e26f6e2b7
--- /dev/null
+++ b/params_shard_27.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d5409f55a0dd2e72c03cfacb82d2346a1247f721f92cb3ffd6ced09ddeaed459
+size 70778880
diff --git a/params_shard_28.bin b/params_shard_28.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8a27899c3ffe17a9cdba6832d9b2fb1a2e783416
--- /dev/null
+++ b/params_shard_28.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8387cb261191f795f0d01f162510f0148ef90642db34927fe7b1f94b21af116b
+size 18350080
diff --git a/params_shard_29.bin b/params_shard_29.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3b63fe4db727dc222a627bbfb6da3b3216e7effb
--- /dev/null
+++ b/params_shard_29.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ec967c9b3ef3bd7d61345124fcd369635b5706e1e55f8a6baff4f0cfa29e0fdb
+size 20760576
diff --git a/params_shard_3.bin b/params_shard_3.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6f6dd7aba9f739f68fe2632dd36c3c72bfa1cdf1
--- /dev/null
+++ b/params_shard_3.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2f3523f659ee1eecd3259b600ee34c38e6aab6abc60bd3fa86d8bd776d29bdff
+size 70778880
diff --git a/params_shard_30.bin b/params_shard_30.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d21dc525d6be5f02eaaf580e6264edc5f075b23f
--- /dev/null
+++ b/params_shard_30.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:46b605a9eef59fd06e4de45114f90305d289149818e1976c2ddda9791696349c
+size 141557760
diff --git a/params_shard_31.bin b/params_shard_31.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3083a1029cd41231532241c766653f0f14b2cf3d
--- /dev/null
+++ b/params_shard_31.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:01ac4c8b16748dd601a5d95e15ca7f354eb3207d407fd5916c7010f7629bf50d
+size 70778880
diff --git a/params_shard_32.bin b/params_shard_32.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c8a729e988492874e6710535d07180d91266b3f6
--- /dev/null
+++ b/params_shard_32.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6821a27408a08b112b6ec775e76c7a9b2f9504e567b6ef5e598850f9760e9332
+size 18350080
diff --git a/params_shard_33.bin b/params_shard_33.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1430e71e5e7820b4a3482888f4566f8ae471552f
--- /dev/null
+++ b/params_shard_33.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c419ba936d73ef1d372e93f8093c5b5681be898e9621ce82e62e3daf9a6accfd
+size 20760576
diff --git a/params_shard_34.bin b/params_shard_34.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c4eeade746c629ad05e752f60faa692d329959be
--- /dev/null
+++ b/params_shard_34.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:90324a53b081231b8ddbc5b4ef2f77f1eab1e8515a6d22078d599dea7625cdcb
+size 141557760
diff --git a/params_shard_35.bin b/params_shard_35.bin
new file mode 100644
index 0000000000000000000000000000000000000000..92156d8ff80d75048e5d845cd7faea9d9245d7cc
--- /dev/null
+++ b/params_shard_35.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f4125ae2e7442cadf47453df7627297d402b3e0d525b0bcf3eb141d5bd86cba2
+size 70778880
diff --git a/params_shard_36.bin b/params_shard_36.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2a0eacef4c7e945b76cb0879671f8a30ef91c061
--- /dev/null
+++ b/params_shard_36.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:72fd4d2ffa7fb986f47abd6e42553fa14acda564bd8fce370ff217624d467f22
+size 18350080
diff --git a/params_shard_37.bin b/params_shard_37.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ab889f4f8b3ae948ba45de54713fb10bc2533ba6
--- /dev/null
+++ b/params_shard_37.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:68c37b12fb758bf7db9053d7f03d91419b737386ce17f28f29e59a276266d090
+size 20760576
diff --git a/params_shard_38.bin b/params_shard_38.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d27928d2c1fed48aef209c2426f4e2032ec7ccca
--- /dev/null
+++ b/params_shard_38.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:98608e8777b3163cd6a19cbdcd12b25d9f35c13e3c62b543f4e643cfa1298d37
+size 141557760
diff --git a/params_shard_39.bin b/params_shard_39.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b7c4cee26da7a434cdb17a3a10dd33c75981dcb4
--- /dev/null
+++ b/params_shard_39.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:62ca8b5be8ee4d338c59adba6f0416888bf0246706c325a83013d9d213df6a1c
+size 70778880
diff --git a/params_shard_4.bin b/params_shard_4.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1b77b6656942353c378e5030ef7c504b6ece33a6
--- /dev/null
+++ b/params_shard_4.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:31dbe77deeb7bd8c40b4d62cbda4532df4bc38785da998d8cc91673671b26497
+size 18350080
diff --git a/params_shard_40.bin b/params_shard_40.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ffc70958cdc5d6a0d57eea3536aa378c4f5615ab
--- /dev/null
+++ b/params_shard_40.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ac73b5d35fcc6f065e90b475ce8416d3e4bf145f58e11c7cdc2b4b60fcf9b9c1
+size 18350080
diff --git a/params_shard_41.bin b/params_shard_41.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6a48470c5a400a17410275c55ef3a2ffc58dcc9e
--- /dev/null
+++ b/params_shard_41.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:94f6f07fca710d2d55043fbb5044bf14195296e79fae4d9d0259d8ea9f1a9208
+size 20760576
diff --git a/params_shard_42.bin b/params_shard_42.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6fc573cc47becdab81fb3b31a703512076d3d5ad
--- /dev/null
+++ b/params_shard_42.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:82aabab1122a9e61fa3fef30bb94cc3fbcd51667140739063ab311895f55c2bf
+size 141557760
diff --git a/params_shard_43.bin b/params_shard_43.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5d950fb5f728f042b532d3664a638d1403bd57df
--- /dev/null
+++ b/params_shard_43.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:326ca3da2f385d308a4f8ded4cdab2c291f9341aadfb4dde933099c755d69e14
+size 70778880
diff --git a/params_shard_44.bin b/params_shard_44.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ec16191794fa67963dfe81965f3f3d0369e52ac6
--- /dev/null
+++ b/params_shard_44.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:41fb9e25c94040728b72967096d5cf259bbc9af991711c0482a9558cf11a8a59
+size 18350080
diff --git a/params_shard_45.bin b/params_shard_45.bin
new file mode 100644
index 0000000000000000000000000000000000000000..75d48258c8a926db9f5b172b132ef92e300fe0aa
--- /dev/null
+++ b/params_shard_45.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e6c4b2f78aa1c164d1fd2827256e675f2f26c1a52242f0b69a468949d7508ed4
+size 20760576
diff --git a/params_shard_46.bin b/params_shard_46.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b18535d8b8a1cd6a59b8a364613a19770789489a
--- /dev/null
+++ b/params_shard_46.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:93021761ea9b4140abe103abd5e86731beb2bf2e01de3db97085149a74598e8c
+size 141557760
diff --git a/params_shard_47.bin b/params_shard_47.bin
new file mode 100644
index 0000000000000000000000000000000000000000..47d444b57587ba05a83dc90f62f8d7d36d9387e8
--- /dev/null
+++ b/params_shard_47.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6ca2b202e63840237eb40322c56fc5b307b902fc4b49039dcad4756e910d857a
+size 70778880
diff --git a/params_shard_48.bin b/params_shard_48.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6e468b89e46fb43c89b763b4ab4fcc97cc324d1b
--- /dev/null
+++ b/params_shard_48.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c429bd070b835c3014ed343ad6cb0809fca41ae3d352136522232da71e9e4eb9
+size 18350080
diff --git a/params_shard_49.bin b/params_shard_49.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b2187322c87ecb4b30df7089070e5e90e981e9df
--- /dev/null
+++ b/params_shard_49.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:77280e9d40b7909bfbc641562cfdc4a43c5f448f50175f91f4802f9d90de2709
+size 20760576
diff --git a/params_shard_5.bin b/params_shard_5.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ece1a454394d3d66c1031152788dd2721aedf2c7
--- /dev/null
+++ b/params_shard_5.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7ff870590bc2b47c2f9ddb9f746126cecfcb76b323094e0e3f0e60dc25cdee8a
+size 20760576
diff --git a/params_shard_50.bin b/params_shard_50.bin
new file mode 100644
index 0000000000000000000000000000000000000000..70cbe0de79bb38de18de8ff7be4ef8044056b505
--- /dev/null
+++ b/params_shard_50.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3d23163e5489f42822d9c78046fbb70fe1b6f1a3477febfeccee08f5af2161a9
+size 141557760
diff --git a/params_shard_51.bin b/params_shard_51.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3683686fd5711a18adb0f589bc0af6176e33c257
--- /dev/null
+++ b/params_shard_51.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9353decbb877a3bc4fb12f905cc27571c5fc8e4b79797e90d33fbc949ddde493
+size 70778880
diff --git a/params_shard_52.bin b/params_shard_52.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9b876d6d59c64614ced5a26b79d0d156667679df
--- /dev/null
+++ b/params_shard_52.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3d6c619132898275b30c23ef92358863ed882086baa6721bc8073eaf049ab8b8
+size 18350080
diff --git a/params_shard_53.bin b/params_shard_53.bin
new file mode 100644
index 0000000000000000000000000000000000000000..415fd4d0351fc06bfbefd408ff54aba06c81004a
--- /dev/null
+++ b/params_shard_53.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:41e14af03a54ae0f6c32061aeb8fd48e3e8a96b507753d4b17af2601c11835ff
+size 20760576
diff --git a/params_shard_54.bin b/params_shard_54.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e494cd9b91d7d4891146d5ad734d09a6249b4a1c
--- /dev/null
+++ b/params_shard_54.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1648cb4567960ac37fcde69e789ee7e919a8aae3bb654d42c98eac6955731322
+size 141557760
diff --git a/params_shard_55.bin b/params_shard_55.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1507c20a4076016b3033c0ebd60e769f1c079003
--- /dev/null
+++ b/params_shard_55.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:65bded1694c61405c1fbcd4953e117c7902b8cdf4fc681fbc7e2a9941d7a35fb
+size 70778880
diff --git a/params_shard_56.bin b/params_shard_56.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3897ca2c2af1d2b97039429998ede25d0e0844fe
--- /dev/null
+++ b/params_shard_56.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:164dc415e084da34d22fc917a576d1c69eb16b9a72d4a577585cae358f54bab1
+size 18350080
diff --git a/params_shard_57.bin b/params_shard_57.bin
new file mode 100644
index 0000000000000000000000000000000000000000..81d2c9aef4afdcc5dcb0c4798cf8428d57a164dc
--- /dev/null
+++ b/params_shard_57.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:45f1ee9a042df10c5bb88f90e3054ac3334b74c2793067303d5ecbce37293289
+size 20760576
diff --git a/params_shard_58.bin b/params_shard_58.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b2d7feb49e3ae5f457541ff5eeff1e3c51d0dc62
--- /dev/null
+++ b/params_shard_58.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0be7ea94b30d9a62b305cfee18c64679ebfba0ea0ddc64bef2f68fe2b52aecc3
+size 141557760
diff --git a/params_shard_59.bin b/params_shard_59.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6856a08a2dc2a3d9cd0039a3b3d092207fc13cc7
--- /dev/null
+++ b/params_shard_59.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d27752d2f41bc529730d52526e38d39d6c9bf20659ee2e8d0cbe0e39a4be84b4
+size 70778880
diff --git a/params_shard_6.bin b/params_shard_6.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5ed2eb80f2db5589cb1bb9581addb83a678b9e55
--- /dev/null
+++ b/params_shard_6.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:474dc432fcb1ea338996980a2139a9fc18fcb0f50d1c1bed9052dbb59ee34b29
+size 141557760
diff --git a/params_shard_60.bin b/params_shard_60.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e58f5397389acf65b0ead2d9d5259e4a8d0af005
--- /dev/null
+++ b/params_shard_60.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:266480472367ea93f102fb8509be5485d105c55c85df5d22ab1eb535c604d219
+size 18350080
diff --git a/params_shard_61.bin b/params_shard_61.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f47babdbf1599bd34f9443599ccdf63047b12a8e
--- /dev/null
+++ b/params_shard_61.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2595c7fe77b0e84f42b656d5fca179e7d1e8d0b5a55f0c300881b983d1a82f3a
+size 20760576
diff --git a/params_shard_62.bin b/params_shard_62.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6d2189200c44242b7a151e2cd6303e89b28622ce
--- /dev/null
+++ b/params_shard_62.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a38d4e60c4e6351869b88d97674a89c3195c05d9d3ae4e0ca1b7c132957fd06e
+size 141557760
diff --git a/params_shard_63.bin b/params_shard_63.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8a534d4e882871db1150025676295fa7d937dd8b
--- /dev/null
+++ b/params_shard_63.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:92fd837ec1fe4e60382ad83c32ec1868d6605f4acf74c2db35f80856c45e13b3
+size 70778880
diff --git a/params_shard_64.bin b/params_shard_64.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e1ce0b1c1e47034bf4338b301e57bbc712f0d936
--- /dev/null
+++ b/params_shard_64.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f7b42500cbdf0a1bd64e459e4d4d1f5118fe66e29f07c0b48de50f29e097e931
+size 18350080
diff --git a/params_shard_65.bin b/params_shard_65.bin
new file mode 100644
index 0000000000000000000000000000000000000000..80da5f2194cc163b0e53269dfeefa250cbb5de98
--- /dev/null
+++ b/params_shard_65.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e4d177f074c05a2a18a1ab027ab50c142c0527d69ff6ff52fc2bf9f077f19152
+size 20760576
diff --git a/params_shard_66.bin b/params_shard_66.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6903f6ddf92e61fc3ac4aa9d655eeacf08cfe9f0
--- /dev/null
+++ b/params_shard_66.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:734b68266315a987b20be17d97d42654ffbd325c33b1ecb0dc41a78dd47d3e3b
+size 141557760
diff --git a/params_shard_67.bin b/params_shard_67.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ee526f728d3a8b13eb865808ac0435f48b8eb0be
--- /dev/null
+++ b/params_shard_67.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a408048e8fe4fa973d2110e4e94c0b9ec5340a89114ecab682c6e45012fe6d66
+size 70778880
diff --git a/params_shard_68.bin b/params_shard_68.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b82c7354aa9acde63961779abefde234bf622037
--- /dev/null
+++ b/params_shard_68.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d4884a4a14c3a95625f6c7dbadffa4c24551b6cfdd99f65e59dcbee5ff32b0e8
+size 18350080
diff --git a/params_shard_69.bin b/params_shard_69.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2fdb1ef95038a0ccd214125fc5b7e8cc9844dbb6
--- /dev/null
+++ b/params_shard_69.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:43185dee5fe9d6c77d8b0508a045913492fccc8690235b884b43f327d8917d9e
+size 20760576
diff --git a/params_shard_7.bin b/params_shard_7.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2c3748cb57d8190566ab89f0e966ad2fbdca97a5
--- /dev/null
+++ b/params_shard_7.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6115b753831f5c9f3c0ed043437b16fced8dec108e6ddce277e94af3567f67be
+size 70778880
diff --git a/params_shard_70.bin b/params_shard_70.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b93aec5f500f3aa49cadcea59e0b29ae7b5ee23e
--- /dev/null
+++ b/params_shard_70.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bdd8c3f82a7fa139147eb888040fca411a7b1f3a3b327629f5462c13cb37aeab
+size 141557760
diff --git a/params_shard_71.bin b/params_shard_71.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c9736ae92835b43bdb1c955a8d1cba80f1033bdd
--- /dev/null
+++ b/params_shard_71.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b4e641defaad10e64f221c266906b35736e0a414f0a83d16adab91e03023416f
+size 70778880
diff --git a/params_shard_72.bin b/params_shard_72.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f4215547fe01db510e9ec0dd6fa2831a7ed31c4b
--- /dev/null
+++ b/params_shard_72.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:15ffcfafdbf47479def985ec60f995d65a27a52a9a40501bad21e70777eb4521
+size 18350080
diff --git a/params_shard_73.bin b/params_shard_73.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b7c95c8bc3b675249abcf0b9ff64ced7b5dfda6d
--- /dev/null
+++ b/params_shard_73.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5e371304513a42dfe4ecfca3e1d536cc35ea605ab0d90dd8ee2d6a77a534c535
+size 20760576
diff --git a/params_shard_74.bin b/params_shard_74.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a5aa346d28e37c1ea439e33278d2f184a467f68a
--- /dev/null
+++ b/params_shard_74.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1d94f9a0cbb5979e1e12622aac8ecb9594031153890d7a3d81289157050149d6
+size 141557760
diff --git a/params_shard_75.bin b/params_shard_75.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fc8ca8464e798a72e1a0348538a74fdd834d806d
--- /dev/null
+++ b/params_shard_75.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:af9a03bea0b0a682b0a541c5503d9f3f83d3440b797a565acc09c8e8bcafc126
+size 70778880
diff --git a/params_shard_76.bin b/params_shard_76.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c4d28f6e360e93b15bbf9523b9b07c33ffee77b4
--- /dev/null
+++ b/params_shard_76.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:62364d3d9b0544494e26f38b4bfe17a027e6e715a20a893ff910b7a9c1bb90e0
+size 18350080
diff --git a/params_shard_77.bin b/params_shard_77.bin
new file mode 100644
index 0000000000000000000000000000000000000000..83988b6adf8f9c64a861c0be3e0151ad5cf62570
--- /dev/null
+++ b/params_shard_77.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:74e5957e68548420810135bd04a12aa1380e83db58746dad792795bd90019325
+size 20760576
diff --git a/params_shard_78.bin b/params_shard_78.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ca187355f1ba5b79b8b8f357c9abb77ee3a413a8
--- /dev/null
+++ b/params_shard_78.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:efb030aa6dd571110118de85a14f4f4bac164bc72ba35a9f09cf65a42a07872c
+size 141557760
diff --git a/params_shard_79.bin b/params_shard_79.bin
new file mode 100644
index 0000000000000000000000000000000000000000..240416b04264bed33ea3d42327bdaa0c4ce9229c
--- /dev/null
+++ b/params_shard_79.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6590ec11f119b7b9616c7373776f7cdb92237d2223c1ccce43558a178f1f92a6
+size 70778880
diff --git a/params_shard_8.bin b/params_shard_8.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e321a8a095461494dc513ccdc78017fc26108241
--- /dev/null
+++ b/params_shard_8.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d955f694d42b968496720d96c7ff636647b08e6ef00f008c5f24bb24823307dc
+size 18350080
diff --git a/params_shard_80.bin b/params_shard_80.bin
new file mode 100644
index 0000000000000000000000000000000000000000..230fc043a044499d93ea98b601fe28b22051c02b
--- /dev/null
+++ b/params_shard_80.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a008c745912590c4f62f41fc01eb19a9d06b5282318e233724bbf66f4f04b19f
+size 18350080
diff --git a/params_shard_81.bin b/params_shard_81.bin
new file mode 100644
index 0000000000000000000000000000000000000000..aa15a43a49c36df500ec1f7eccf16732409b167a
--- /dev/null
+++ b/params_shard_81.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:51786a24f750b714d49e180a76f421888a9220a93ef207aee1de3f98a2ffc4b7
+size 20760576
diff --git a/params_shard_82.bin b/params_shard_82.bin
new file mode 100644
index 0000000000000000000000000000000000000000..510d9e5758c28894a6f1306634bb7e4749356e82
--- /dev/null
+++ b/params_shard_82.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:06416518325e4549e900fe033224d8336c2477110e6d1500f8dabac8aed7c7e9
+size 141557760
diff --git a/params_shard_83.bin b/params_shard_83.bin
new file mode 100644
index 0000000000000000000000000000000000000000..50fec2c3bb70f45f29370dbd90b5b2c82efd69c0
--- /dev/null
+++ b/params_shard_83.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:36009df202e871191d2e79e7c645c712110764ecf6820b2c921e5e6bee7bad3a
+size 70778880
diff --git a/params_shard_84.bin b/params_shard_84.bin
new file mode 100644
index 0000000000000000000000000000000000000000..99121898e05a5f2ffce420786fb883223e90a880
--- /dev/null
+++ b/params_shard_84.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8f9baf0eb5fd504bb0ad048d722b3f846449337b9f62746f500c01b2e8dcb90c
+size 18350080
diff --git a/params_shard_85.bin b/params_shard_85.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4ca25d5358abdd38c93ba7dc7ebf2e1acc5a64bc
--- /dev/null
+++ b/params_shard_85.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ce98f2f1dc68db8ed9ab88d89a539820f9af4c674ed723774afb43a61f94540f
+size 20760576
diff --git a/params_shard_86.bin b/params_shard_86.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3f5806f1d9341d4c2f8fe43c40bd0bf1fb0eb741
--- /dev/null
+++ b/params_shard_86.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4d2d485a4a81683bd29526ff958795b5bbc5b9278c1ed244eb4116c2c61d670e
+size 141557760
diff --git a/params_shard_87.bin b/params_shard_87.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0bfb94960973f592488d6400ed6bb08f275e2db9
--- /dev/null
+++ b/params_shard_87.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:087a463346630747d15e944807762d390dd5db25e3afec51d45556f3e556fe3d
+size 70778880
diff --git a/params_shard_88.bin b/params_shard_88.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bf3d9e2c8f5fcf59a1050e007bd2d1db36bacdad
--- /dev/null
+++ b/params_shard_88.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8c84e2ffd43c33640012dd7ccc85cf7eb3280db99fd105a1db8e9d27a75c6291
+size 18350080
diff --git a/params_shard_89.bin b/params_shard_89.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fc73ceabdb3167cb4779f3da9628af1d264b71b7
--- /dev/null
+++ b/params_shard_89.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e64c25ea4754ab54065a3400da0886bc616cacb4dcb27ae81cb5fce35dfaa71b
+size 20760576
diff --git a/params_shard_9.bin b/params_shard_9.bin
new file mode 100644
index 0000000000000000000000000000000000000000..81226faf1236d0abd97cb21827c8bf630e82f83e
--- /dev/null
+++ b/params_shard_9.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a577a81a19e29102a8b801f1f75474a6e589f10e63913ff4ad4a65ae88a37639
+size 20760576
diff --git a/params_shard_90.bin b/params_shard_90.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5921ee8678430547040bc24b12ae1f50b4d5126d
--- /dev/null
+++ b/params_shard_90.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cbb2ba08b5de50de331f1a4f091a031d496d190c127294b964b2946497e05b68
+size 141557760
diff --git a/params_shard_91.bin b/params_shard_91.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e76149c68e7172946c17977458f9774675bcfdd3
--- /dev/null
+++ b/params_shard_91.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cf2eabb1c5e8cd536d75d7efe66806e1fd93d0cff5f8325a27a98f248ad0be0e
+size 70778880
diff --git a/params_shard_92.bin b/params_shard_92.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b7894c0b9a3359066b2cfcaedcaea5d3fa74c46b
--- /dev/null
+++ b/params_shard_92.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:147ac514790da4ae7130c6236351e9d65a0b9f1c1c5724f4727ab699e4e5b3e3
+size 18350080
diff --git a/params_shard_93.bin b/params_shard_93.bin
new file mode 100644
index 0000000000000000000000000000000000000000..665b4cf621008b218e1f7e34fa1dc63338da87f7
--- /dev/null
+++ b/params_shard_93.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7b0291f2914f1eee706c4c38e7ae88b7dea56bdde03d036e1e5716ca276d0383
+size 20760576
diff --git a/params_shard_94.bin b/params_shard_94.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2af78fcf0cee162b6d65d3f361ded4ae24cca1fe
--- /dev/null
+++ b/params_shard_94.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ea233461836b3498336a7c8adc8f8b65d4c72af7985afe06c92bac5435c1d336
+size 141557760
diff --git a/params_shard_95.bin b/params_shard_95.bin
new file mode 100644
index 0000000000000000000000000000000000000000..225442d4f5f91d064c9a0131c73e3bcabad48251
--- /dev/null
+++ b/params_shard_95.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a7ba5c033edc802effa9ca6418691092cc825b150dd99d2085bf835c89a48358
+size 70778880
diff --git a/params_shard_96.bin b/params_shard_96.bin
new file mode 100644
index 0000000000000000000000000000000000000000..91aa67161b7d3f7e6e10e4807bf25c96e24264e6
--- /dev/null
+++ b/params_shard_96.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4fd8590e9118aa5dd1d79b99e610173dab39c245ff7291c3d9c634522e505942
+size 18350080
diff --git a/params_shard_97.bin b/params_shard_97.bin
new file mode 100644
index 0000000000000000000000000000000000000000..74bf9ec42305feab0f79fa6f727cac84c00f4e05
--- /dev/null
+++ b/params_shard_97.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5c4b3357db6065c302be4b72dfa4f10141cc7bf3ac1101f18eb430b657d2e08a
+size 20760576
diff --git a/params_shard_98.bin b/params_shard_98.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fe8eacf0d1ec1db2b5b8946d933c7bef888d9515
--- /dev/null
+++ b/params_shard_98.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a2dc8746c4c10e4f4ee64e6bc6c8e195be1bc162a7fb7f638b47291c49b45d04
+size 141557760
diff --git a/params_shard_99.bin b/params_shard_99.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9265631de8268ff093ad9750153f44934374417f
--- /dev/null
+++ b/params_shard_99.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5ac5a87926c721d52859cbd5d7958e7ba0abcc58ecf2cca2e3b471bca706f144
+size 70778880
diff --git a/private-llm-config.json b/private-llm-config.json
new file mode 100644
index 0000000000000000000000000000000000000000..e065663d05adad9b7d5381bac4d3cb2847710225
--- /dev/null
+++ b/private-llm-config.json
@@ -0,0 +1,45 @@
+{
+ "model_type": "qwen2",
+ "quantization": "GPTQ-Int4",
+ "model_config": {
+ "hidden_act": "silu",
+ "hidden_size": 5120,
+ "intermediate_size": 27648,
+ "num_attention_heads": 40,
+ "num_hidden_layers": 64,
+ "num_key_value_heads": 8,
+ "rms_norm_eps": 1e-05,
+ "rope_theta": 1000000.0,
+ "vocab_size": 152064,
+ "tie_word_embeddings": false,
+ "context_window_size": 8192,
+ "prefill_chunk_size": 128,
+ "tensor_parallel_shards": 1,
+ "head_dim": 128,
+ "dtype": "float32",
+ "max_batch_size": 80
+ },
+ "vocab_size": 152064,
+ "context_window_size": 8192,
+ "sliding_window_size": -1,
+ "prefill_chunk_size": 128,
+ "attention_sink_size": -1,
+ "tensor_parallel_shards": 1,
+ "mean_gen_len": 512,
+ "max_gen_len": 4096,
+ "shift_fill_factor": 0.3,
+ "temperature": 0.6,
+ "presence_penalty": 0.0,
+ "frequency_penalty": 0.0,
+ "repetition_penalty": 1.2,
+ "top_p": 0.95,
+ "conv_template": "deepseek-r1-qwen",
+ "pad_token_id": 0,
+ "bos_token_id": 151646,
+ "eos_token_id": 151643,
+ "tokenizer_files": [
+ "tokenizer.json",
+ "tokenizer_config.json"
+ ],
+ "version": "0.1.0"
+}
diff --git a/tokenizer.json b/tokenizer.json
new file mode 100644
index 0000000000000000000000000000000000000000..a34650995da6939a945c330eadb0687147ac3ef8
--- /dev/null
+++ b/tokenizer.json
@@ -0,0 +1,303282 @@
+{
+ "version": "1.0",
+ "truncation": null,
+ "padding": null,
+ "added_tokens": [
+ {
+ "id": 151643,
+ "content": "<|end▁of▁sentence|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 151644,
+ "content": "<|User|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": false
+ },
+ {
+ "id": 151645,
+ "content": "<|Assistant|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": false
+ },
+ {
+ "id": 151646,
+ "content": "<|begin▁of▁sentence|>",
+ "normalized": false,
+ "lstrip": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ {
+ "id": 151647,
+ "content": "<|EOT|>",
+ "normalized": false,
+ "lstrip": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ {
+ "id": 151648,
+ "content": "
&": 5789, + "CON": 5790, + "Ġrepl": 5791, + "Ġregular": 5792, + "Storage": 5793, + "ramework": 5794, + "Ġgoal": 5795, + "Ġtouch": 5796, + ".widget": 5797, + "Ġbuilt": 5798, + "des": 5799, + "Part": 5800, + "(re": 5801, + "Ġworth": 5802, + "hib": 5803, + "game": 5804, + "Ġв": 5805, + "acion": 5806, + "ĠWhite": 5807, + "(type": 5808, + "(`": 5809, + "Ġnatural": 5810, + "Ġinj": 5811, + "Ġcalcul": 5812, + "ĠApril": 5813, + ".List": 5814, + "Ġassociated": 5815, + "ĉSystem": 5816, + "~~": 5817, + "=[": 5818, + "Ġstorage": 5819, + "Ġbytes": 5820, + "Ġtravel": 5821, + "Ġsou": 5822, + "Ġpassed": 5823, + "!=": 5824, + "ascript": 5825, + ".open": 5826, + "Ġgrid": 5827, + "Ġbus": 5828, + "Ġrecogn": 5829, + "Ab": 5830, + "Ġhon": 5831, + "ĠCenter": 5832, + "Ġprec": 5833, + "build": 5834, + "HTML": 5835, + "ĠSan": 5836, + "Ġcountries": 5837, + "aled": 5838, + "token": 5839, + "kt": 5840, + "Ġqual": 5841, + "Last": 5842, + "adow": 5843, + "Ġmanufact": 5844, + "idad": 5845, + "jango": 5846, + "Next": 5847, + "xf": 5848, + ".a": 5849, + "Ġporno": 5850, + "ĠPM": 5851, + "erve": 5852, + "iting": 5853, + "_th": 5854, + "ci": 5855, + "=None": 5856, + "gs": 5857, + "Ġlogin": 5858, + "atives": 5859, + "']);Ċ": 5860, + "Äħ": 5861, + "Ġill": 5862, + "IA": 5863, + "children": 5864, + "DO": 5865, + "Ġlevels": 5866, + "Ġ{{": 5867, + "Ġlooks": 5868, + "Ġ\"#": 5869, + "ToString": 5870, + "Ġnecessary": 5871, + "ĠĠĠĊ": 5872, + "cell": 5873, + "Entry": 5874, + "Ġ'#": 5875, + "Ġextrem": 5876, + "Selector": 5877, + "Ġplaceholder": 5878, + "Load": 5879, + "Ġreleased": 5880, + "ORE": 5881, + "Enumer": 5882, + "ĠTV": 5883, + "SET": 5884, + "inq": 5885, + "Press": 5886, + "ĠDepartment": 5887, + "Ġproperties": 5888, + "Ġrespond": 5889, + "Search": 5890, + "ael": 5891, + "Ġrequ": 5892, + "ĠBook": 5893, + "/Ċ": 5894, + "(st": 5895, + "Ġfinancial": 5896, + "icket": 5897, + "_input": 5898, + "Ġthreat": 5899, + "(in": 5900, + "Strip": 5901, + "ìĿ": 5902, + "ção": 5903, + "Ġevidence": 5904, + "));": 5905, + "ĠBro": 5906, + "Ġ[];Ċ": 5907, + "Ġou": 5908, + "buf": 5909, + "Script": 5910, + "dat": 5911, + "Ġrule": 5912, + "#import": 5913, + "=\"/": 5914, + "Serial": 5915, + "Ġstarting": 5916, + "[index": 5917, + "ae": 5918, + "Ġcontrib": 5919, + "session": 5920, + "_new": 5921, + "utable": 5922, + "ober": 5923, + "Ġ\"./": 5924, + "Ġlogger": 5925, + "Ġrecently": 5926, + "Ġreturned": 5927, + "ččĊ": 5928, + ")))Ċ": 5929, + "itions": 5930, + "Ġseek": 5931, + "Ġcommunic": 5932, + "Ġ\".": 5933, + "Ġusername": 5934, + "ECT": 5935, + "DS": 5936, + "Ġotherwise": 5937, + "ĠGerman": 5938, + ".aw": 5939, + "Adapter": 5940, + "ixel": 5941, + "Ġsystems": 5942, + "Ġdrop": 5943, + "Ġstructure": 5944, + "Ġ$(\"#": 5945, + "encies": 5946, + "anning": 5947, + "ĠLink": 5948, + "ĠResponse": 5949, + "Ġstri": 5950, + "ż": 5951, + "ĠDB": 5952, + "æĹ": 5953, + "android": 5954, + "submit": 5955, + "otion": 5956, + "(@": 5957, + ".test": 5958, + "ĊĊĊĊĊĊĊĊ": 5959, + "];čĊ": 5960, + "Ġdirectly": 5961, + "Ġ\"%": 5962, + "ris": 5963, + "elta": 5964, + "AIL": 5965, + "){čĊ": 5966, + "mine": 5967, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 5968, + "(k": 5969, + "bon": 5970, + "asic": 5971, + "pite": 5972, + "___": 5973, + "Max": 5974, + "Ġerrors": 5975, + "ĠWhile": 5976, + "Ġarguments": 5977, + "Ġensure": 5978, + "Right": 5979, + "-based": 5980, + "Web": 5981, + "Ġ-=": 5982, + "Ġintrodu": 5983, + "ĠInst": 5984, + "ĠWash": 5985, + "ordin": 5986, + "join": 5987, + "Database": 5988, + "Ġgrad": 5989, + "Ġusually": 5990, + "ITE": 5991, + "Props": 5992, + "?>Ċ": 5993, + "ĠGo": 5994, + "@Override": 5995, + "REF": 5996, + "Ġip": 5997, + "ĠAustral": 5998, + "Ġist": 5999, + "ViewById": 6000, + "Ġserious": 6001, + "Ġcustomer": 6002, + ".prototype": 6003, + "odo": 6004, + "cor": 6005, + "Ġdoor": 6006, + "ĠWITHOUT": 6007, + "Ġplant": 6008, + "Ġbegan": 6009, + "Ġdistance": 6010, + "()).": 6011, + "Ġchance": 6012, + "Ġord": 6013, + "came": 6014, + "pragma": 6015, + "Ġprotect": 6016, + "ragment": 6017, + "ĠNode": 6018, + "ening": 6019, + "Ñĩ": 6020, + "Ġroute": 6021, + "ĠSchool": 6022, + "hi": 6023, + "Ġneighb": 6024, + "After": 6025, + "licit": 6026, + "Ġcontr": 6027, + "Ġprimary": 6028, + "AA": 6029, + ".WriteLine": 6030, + "utils": 6031, + "Ġbi": 6032, + "Red": 6033, + ".Linq": 6034, + ".object": 6035, + "Ġleaders": 6036, + "unities": 6037, + "Ġgun": 6038, + "onth": 6039, + "ĠDev": 6040, + "FILE": 6041, + "Ġcomments": 6042, + "_len": 6043, + "arrow": 6044, + "amount": 6045, + "Range": 6046, + "sert": 6047, + "GridView": 6048, + "Ġupdated": 6049, + "ĠMo": 6050, + "Ġinform": 6051, + "ociety": 6052, + "ala": 6053, + "Access": 6054, + "Ġhab": 6055, + "Ġcreat": 6056, + "_arg": 6057, + "ĠJanuary": 6058, + "ĠDay": 6059, + "\")čĊ": 6060, + "uple": 6061, + "document": 6062, + "gorith": 6063, + "menu": 6064, + "ĠOver": 6065, + "bb": 6066, + ".title": 6067, + "_out": 6068, + "Ġled": 6069, + "uri": 6070, + "Ġ?>": 6071, + "gl": 6072, + "Ġbank": 6073, + "ayment": 6074, + "ĉprintf": 6075, + "MD": 6076, + "Ġsample": 6077, + "Ġhands": 6078, + "ĠVersion": 6079, + "uario": 6080, + "Ġoffers": 6081, + "ityEngine": 6082, + "Ġshape": 6083, + "Ġsleep": 6084, + "_point": 6085, + "Settings": 6086, + "Ġachie": 6087, + "Ġsold": 6088, + "ota": 6089, + ".bind": 6090, + "Am": 6091, + "Ġsafe": 6092, + "Store": 6093, + "Ġshared": 6094, + "Ġpriv": 6095, + "_VAL": 6096, + "Ġsens": 6097, + "){": 6098, + "Ġremember": 6099, + "shared": 6100, + "element": 6101, + "Ġshoot": 6102, + "Vert": 6103, + "cout": 6104, + "Ġenv": 6105, + "_label": 6106, + "Ġ>Ċ": 6107, + "run": 6108, + "Ġscene": 6109, + "(array": 6110, + "device": 6111, + "_title": 6112, + "agon": 6113, + "]čĊ": 6114, + "aby": 6115, + "Ġbecame": 6116, + "boolean": 6117, + "Ġpark": 6118, + "ĠCode": 6119, + "upload": 6120, + "riday": 6121, + "ĠSeptember": 6122, + "Fe": 6123, + "Ġsen": 6124, + "cing": 6125, + "FL": 6126, + "Col": 6127, + "uts": 6128, + "_page": 6129, + "inn": 6130, + "Ġimplied": 6131, + "aling": 6132, + "Ġyourself": 6133, + ".Count": 6134, + "conf": 6135, + "Ġaud": 6136, + "_init": 6137, + ".)": 6138, + "Ġwrote": 6139, + "NG": 6140, + ".Error": 6141, + "ä»": 6142, + ".for": 6143, + "Ġequal": 6144, + "ĠRequest": 6145, + "Ġserial": 6146, + "Ġallows": 6147, + "XX": 6148, + "Ġmiddle": 6149, + "chor": 6150, + "ø": 6151, + "erval": 6152, + ".Column": 6153, + "reading": 6154, + "Ġescort": 6155, + "ĠAugust": 6156, + "Ġquickly": 6157, + "Ġweap": 6158, + "ĠCG": 6159, + "ropri": 6160, + "ho": 6161, + "Ġcop": 6162, + "(struct": 6163, + "ĠBig": 6164, + "Ġvs": 6165, + "Ġfrequ": 6166, + ".Value": 6167, + "Ġactions": 6168, + "Ġproper": 6169, + "Ġinn": 6170, + "Ġobjects": 6171, + "Ġmatrix": 6172, + "avascript": 6173, + "Ġones": 6174, + ".group": 6175, + "Ġgreen": 6176, + "Ġpaint": 6177, + "ools": 6178, + "ycl": 6179, + "encode": 6180, + "olt": 6181, + "comment": 6182, + ".api": 6183, + "Dir": 6184, + "Ġune": 6185, + "izont": 6186, + ".position": 6187, + "Ġdesigned": 6188, + "_val": 6189, + "avi": 6190, + "iring": 6191, + "tab": 6192, + "Ġlayer": 6193, + "Ġviews": 6194, + "Ġreve": 6195, + "rael": 6196, + "ĠON": 6197, + "rics": 6198, + "np": 6199, + "Ġcore": 6200, + "());čĊ": 6201, + "Main": 6202, + "Ġexpert": 6203, + "ĉĉčĊ": 6204, + "_en": 6205, + "Ġ/>": 6206, + "utter": 6207, + "IAL": 6208, + "ails": 6209, + "ĠKing": 6210, + "*/ĊĊ": 6211, + "ĠMet": 6212, + "_end": 6213, + "addr": 6214, + "ora": 6215, + "Ġir": 6216, + "Min": 6217, + "Ġsurpr": 6218, + "Ġrepe": 6219, + "Ġdirectory": 6220, + "PUT": 6221, + "-S": 6222, + "Ġelection": 6223, + "haps": 6224, + ".pre": 6225, + "cm": 6226, + "Values": 6227, + "Ġ\"Ċ": 6228, + "column": 6229, + "ivil": 6230, + "Login": 6231, + "inue": 6232, + "Ġbeautiful": 6233, + "Ġsecret": 6234, + "(event": 6235, + "Ġchat": 6236, + "ums": 6237, + "Ġorigin": 6238, + "Ġeffects": 6239, + "Ġmanagement": 6240, + "illa": 6241, + "tk": 6242, + "Ġsetting": 6243, + "ĠCour": 6244, + "Ġmassage": 6245, + "ĉend": 6246, + "Ġhappy": 6247, + "Ġfinish": 6248, + "Ġcamera": 6249, + "ĠVer": 6250, + "ĠDemocr": 6251, + "ĠHer": 6252, + "(Q": 6253, + "cons": 6254, + "ita": 6255, + "Ġ'.": 6256, + "{}": 6257, + "ĉC": 6258, + "Ġstuff": 6259, + "Ġ:Ċ": 6260, + "ĠAR": 6261, + "Task": 6262, + "hidden": 6263, + "eros": 6264, + "IGN": 6265, + "atio": 6266, + "ĠHealth": 6267, + "olute": 6268, + "Enter": 6269, + "'>": 6270, + "ĠTwitter": 6271, + "ĠCounty": 6272, + "scribe": 6273, + "Ġ=>Ċ": 6274, + "Ġhy": 6275, + "fit": 6276, + "Ġmilitary": 6277, + "Ġsale": 6278, + "required": 6279, + "non": 6280, + "bootstrap": 6281, + "hold": 6282, + "rim": 6283, + "-old": 6284, + "ĠDown": 6285, + "Ġmention": 6286, + "contact": 6287, + "_group": 6288, + "oday": 6289, + "Ġtown": 6290, + "Ġsolution": 6291, + "uate": 6292, + "elling": 6293, + "]->": 6294, + "otes": 6295, + "ental": 6296, + "omen": 6297, + "ospital": 6298, + "ĠSup": 6299, + "_EN": 6300, + "Ġslow": 6301, + "SESSION": 6302, + "Ġblue": 6303, + "ago": 6304, + "Ġlives": 6305, + "Ġ^": 6306, + ".un": 6307, + "inst": 6308, + "enge": 6309, + "Ġcustomers": 6310, + "Ġcast": 6311, + "udget": 6312, + "ï¼ģ": 6313, + "icens": 6314, + "Ġdetermin": 6315, + "Selected": 6316, + "_pl": 6317, + "ueue": 6318, + "Ġdark": 6319, + "//ĊĊ": 6320, + "si": 6321, + "thern": 6322, + "ĠJapan": 6323, + "/w": 6324, + "PU": 6325, + "ĠEast": 6326, + "ovie": 6327, + "Ġpackage": 6328, + "Ġnor": 6329, + "Ġapi": 6330, + "bot": 6331, + "\"];Ċ": 6332, + "_post": 6333, + "ulate": 6334, + "Ġclub": 6335, + "'));Ċ": 6336, + "Ġloop": 6337, + "PIO": 6338, + "ione": 6339, + "shot": 6340, + "Initial": 6341, + "Ġplayed": 6342, + "register": 6343, + "rought": 6344, + "_max": 6345, + "acement": 6346, + "match": 6347, + "raphics": 6348, + "AST": 6349, + "Ġexisting": 6350, + "Ġcomplex": 6351, + "DA": 6352, + ".Ch": 6353, + ".common": 6354, + "mo": 6355, + "Ġ'../../": 6356, + "ito": 6357, + "Ġanalysis": 6358, + "Ġdeliver": 6359, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĊ": 6360, + "idx": 6361, + "Ãł": 6362, + "ongo": 6363, + "ĠEnglish": 6364, + "Ċ": 9992, + "_default": 9993, + "ĠDatabase": 9994, + "rep": 9995, + "ESS": 9996, + "nergy": 9997, + ".Find": 9998, + "_mask": 9999, + "Ġrise": 10000, + "Ġkernel": 10001, + "::$": 10002, + ".Q": 10003, + "Ġoffering": 10004, + "decl": 10005, + "ĠCS": 10006, + "Ġlisted": 10007, + "Ġmostly": 10008, + "enger": 10009, + "Ġblocks": 10010, + "olo": 10011, + "Ġgoverning": 10012, + "\\F": 10013, + "Ġconcent": 10014, + ".getText": 10015, + "Ġmb": 10016, + "Ġoccurred": 10017, + "Ġchanging": 10018, + "Scene": 10019, + "_CODE": 10020, + "Beh": 10021, + "\"The": 10022, + "Ġtile": 10023, + "ĠAssociation": 10024, + "ĉP": 10025, + "alty": 10026, + "_ad": 10027, + "odies": 10028, + "iated": 10029, + "Ġprepared": 10030, + "possible": 10031, + "Ġmort": 10032, + "TEST": 10033, + "Ġignore": 10034, + "Ġcalc": 10035, + "Ġrs": 10036, + "ĠassertEquals": 10037, + "Ġsz": 10038, + "ĠTHIS": 10039, + ".\"Ċ": 10040, + "Ġcanvas": 10041, + "java": 10042, + "Ġdut": 10043, + "VALID": 10044, + ".sql": 10045, + ".input": 10046, + "Ġaux": 10047, + "Sup": 10048, + "Ġartist": 10049, + "Vec": 10050, + "_TIME": 10051, + ".stringify": 10052, + "etween": 10053, + "ĠCategory": 10054, + "Ġ[-": 10055, + "ĠDevExpress": 10056, + "ĠJul": 10057, + "Ġring": 10058, + ".ed": 10059, + "YY": 10060, + "Let": 10061, + "TextField": 10062, + "Ġflat": 10063, + "_print": 10064, + "ĠOTHER": 10065, + "adian": 10066, + "Ġchecked": 10067, + "ele": 10068, + "Align": 10069, + "standing": 10070, + "Ġ[],": 10071, + "Ġlab": 10072, + "ucky": 10073, + "ĠChristmas": 10074, + "(image": 10075, + ".module": 10076, + "Ġlots": 10077, + "Ġslightly": 10078, + "(final": 10079, + "erge": 10080, + "è¿": 10081, + "ĠPolice": 10082, + "ĠRight": 10083, + "Ġaward": 10084, + "ĠOS": 10085, + "Ġ{}ĊĊ": 10086, + "Ġptr": 10087, + "oves": 10088, + "icated": 10089, + "ем": 10090, + "Ġmanage": 10091, + "oliday": 10092, + "Amount": 10093, + "oolStrip": 10094, + "tbody": 10095, + "Nav": 10096, + "wrap": 10097, + "BB": 10098, + "Ġwatching": 10099, + "arios": 10100, + "Ġoptional": 10101, + "_K": 10102, + "ĠLicensed": 10103, + ".Map": 10104, + "Timer": 10105, + "ĠAP": 10106, + "ĠRev": 10107, + "(o": 10108, + ",c": 10109, + "umin": 10110, + "etailed": 10111, + "ĠHy": 10112, + "Ġblank": 10113, + "agger": 10114, + "ĠSelf": 10115, + "()[": 10116, + ".make": 10117, + "earn": 10118, + "channel": 10119, + ";Ċ": 10133, + "World": 10134, + "Ġpython": 10135, + "Ġlif": 10136, + "Ġtrav": 10137, + "Ġconven": 10138, + "company": 10139, + "ĠClub": 10140, + "Ver": 10141, + "Btn": 10142, + "Ġzone": 10143, + "products": 10144, + "ĠEduc": 10145, + "Ġverify": 10146, + "ĠMil": 10147, + "ono": 10148, + "]);ĊĊ": 10149, + "ENCE": 10150, + "Ġpacket": 10151, + "Ġcer": 10152, + "Ġenumer": 10153, + "Ġpars": 10154, + "formed": 10155, + "Ġoccup": 10156, + "tre": 10157, + "Ġexercise": 10158, + "Day": 10159, + "_sum": 10160, + "Ġasking": 10161, + "aption": 10162, + "Ġorders": 10163, + "Ġspending": 10164, + "ĠERR": 10165, + ".Dis": 10166, + "ĠUtil": 10167, + "âĢľI": 10168, + "\\'": 10169, + "?)": 10170, + "/>Ċ": 10171, + "Ġemot": 10172, + "Ġinfluence": 10173, + "ĠAfrica": 10174, + "atters": 10175, + "Ùħ": 10176, + ".session": 10177, + "Ġchief": 10178, + "ĉĉĉĉĉĉĉĉĉĉĉ": 10179, + "Ġtom": 10180, + "cluded": 10181, + "serial": 10182, + "_handler": 10183, + ".Type": 10184, + "aped": 10185, + "Ġpolicies": 10186, + "-ex": 10187, + "-tr": 10188, + "blank": 10189, + "merce": 10190, + "Ġcoverage": 10191, + "Ġrc": 10192, + "_matrix": 10193, + "_box": 10194, + "Ġcharges": 10195, + "ĠBoston": 10196, + "Pe": 10197, + "Ġcircum": 10198, + "Ġfilled": 10199, + "Ġnorth": 10200, + "ictureBox": 10201, + "ĉres": 10202, + "è®": 10203, + "Ġtermin": 10204, + "Ġ[âĢ¦": 10205, + "IRECT": 10206, + "Ġber": 10207, + "Ġ\"../../": 10208, + "retch": 10209, + ".code": 10210, + "_col": 10211, + "ĠGovernment": 10212, + "Ġargv": 10213, + "ĠLord": 10214, + "asi": 10215, + "Exec": 10216, + "ĉlet": 10217, + "vertis": 10218, + "Ġdiscussion": 10219, + "enance": 10220, + "outube": 10221, + "typeof": 10222, + "Ġserved": 10223, + "ĠPut": 10224, + "ĉx": 10225, + "Ġsweet": 10226, + "Before": 10227, + "ategy": 10228, + ".of": 10229, + "ĠMaterial": 10230, + "Sort": 10231, + "ONT": 10232, + "igital": 10233, + "Why": 10234, + "Ġsust": 10235, + "Ġç": 10236, + "abet": 10237, + "Ġsegment": 10238, + "Ġ[],Ċ": 10239, + "ĠMuslim": 10240, + "ĠfindViewById": 10241, + "cut": 10242, + "_TEXT": 10243, + "ĠMary": 10244, + "Ġloved": 10245, + "Ġlie": 10246, + "ĠJO": 10247, + "Ġisset": 10248, + "month": 10249, + "Ġprime": 10250, + "ti": 10251, + "ĠCarol": 10252, + "Use": 10253, + "ĠPop": 10254, + "ĠSave": 10255, + "Interval": 10256, + "execute": 10257, + "dy": 10258, + "ĠIran": 10259, + "_cont": 10260, + "ĉT": 10261, + "Ġphase": 10262, + "checkbox": 10263, + "week": 10264, + "Ġhide": 10265, + "Ġtil": 10266, + "Ġju": 10267, + "Custom": 10268, + "burg": 10269, + "/M": 10270, + "TON": 10271, + "Ġquant": 10272, + "Ġrub": 10273, + "ixels": 10274, + "Ġinstalled": 10275, + "Ġdump": 10276, + "Ġproperly": 10277, + "(List": 10278, + "Ġdecide": 10279, + "apply": 10280, + "Has": 10281, + "Ġkeeping": 10282, + "Ġcitizens": 10283, + "Ġjoint": 10284, + "pool": 10285, + "Socket": 10286, + "_op": 10287, + "Ġweapon": 10288, + "gnore": 10289, + "ĠExec": 10290, + "otten": 10291, + "ĠMS": 10292, + "Ġ(-": 10293, + "ĠReview": 10294, + "Ġexamples": 10295, + "Ġtight": 10296, + "!(": 10297, + "DP": 10298, + "ĠMessageBox": 10299, + "Ġphotograph": 10300, + "URI": 10301, + "ét": 10302, + "low": 10303, + "ĠGrand": 10304, + ".persistence": 10305, + "Ġmaintain": 10306, + "Ġnums": 10307, + "Ġzip": 10308, + "ials": 10309, + "ĠGets": 10310, + "peg": 10311, + "ĠBuffer": 10312, + "~~~~": 10313, + "rastructure": 10314, + "ĠPL": 10315, + "uen": 10316, + "obby": 10317, + "sizeof": 10318, + "Ġpic": 10319, + "Ġseed": 10320, + "Ġexperienced": 10321, + "Ġodd": 10322, + "Ġkick": 10323, + "Ġprocedure": 10324, + "avigator": 10325, + "-on": 10326, + ",j": 10327, + "ĠAlthough": 10328, + "ĠuserId": 10329, + "accept": 10330, + "Blue": 10331, + "IColor": 10332, + "layer": 10333, + "available": 10334, + "Ġends": 10335, + ".table": 10336, + "Ġdataset": 10337, + "bus": 10338, + "Ġexplain": 10339, + "(pro": 10340, + "ĠCommittee": 10341, + "Ġnoted": 10342, + "]:Ċ": 10343, + "Dim": 10344, + "stdio": 10345, + ".\",Ċ": 10346, + "_source": 10347, + "ĠWeek": 10348, + "ĠEdge": 10349, + "Ġoperating": 10350, + "Ġeste": 10351, + "ipl": 10352, + "agination": 10353, + "Ġproceed": 10354, + "Ġanimation": 10355, + ".Models": 10356, + "ĠWatch": 10357, + "iat": 10358, + "Ġoppon": 10359, + "/A": 10360, + "Report": 10361, + "Ġsounds": 10362, + "_buf": 10363, + "IELD": 10364, + "Ġbund": 10365, + "ĉget": 10366, + ".pr": 10367, + "(tmp": 10368, + "Ġkid": 10369, + ">ĊĊĊ": 10370, + "Ġyang": 10371, + "NotFound": 10372, + "ÑĨ": 10373, + "math": 10374, + "@gmail": 10375, + "ĠLIMIT": 10376, + "redients": 10377, + "Ġvent": 10378, + "avigate": 10379, + "Look": 10380, + "Ġreligious": 10381, + "Ġrand": 10382, + "rio": 10383, + "(GL": 10384, + "_ip": 10385, + "uan": 10386, + "iciency": 10387, + "ĠChange": 10388, + ">čĊčĊ": 10389, + "ĠEntity": 10390, + "Ġrencontre": 10391, + "ĠRet": 10392, + "plan": 10393, + "én": 10394, + "BOOL": 10395, + "uries": 10396, + "train": 10397, + "Definition": 10398, + "============": 10399, + "zz": 10400, + "Animation": 10401, + "ĠOK": 10402, + "_menu": 10403, + ".bl": 10404, + "_score": 10405, + "Ġacad": 10406, + "(System": 10407, + "Ġrefresh": 10408, + "'=>$": 10409, + ".Graphics": 10410, + "amento": 10411, + "pid": 10412, + "tc": 10413, + "Ġtips": 10414, + "Ġhomes": 10415, + "Ġfuel": 10416, + "âĸ": 10417, + "_helper": 10418, + "ĠĠčĊ": 10419, + "ĠRoom": 10420, + ".Close": 10421, + "_attr": 10422, + "ĠMount": 10423, + "ĠEv": 10424, + "arser": 10425, + "_top": 10426, + "eah": 10427, + "ĠDelete": 10428, + "ãĢį": 10429, + "uke": 10430, + "Ġusage": 10431, + "aria": 10432, + "_dev": 10433, + "Ġtexture": 10434, + "Ġconversation": 10435, + "eper": 10436, + "Bean": 10437, + "done": 10438, + "nonatomic": 10439, + "ĠSecond": 10440, + "Ġshooting": 10441, + "_pre": 10442, + "Components": 10443, + "Ġ]ĊĊ": 10444, + "__,": 10445, + "stitution": 10446, + ".Char": 10447, + ">();ĊĊ": 10448, + "Ġpresented": 10449, + "Ġwa": 10450, + "oker": 10451, + "-ĊĊ": 10452, + "iner": 10453, + "Ġbecoming": 10454, + "Ġincident": 10455, + "Att": 10456, + "Ġrevealed": 10457, + "forc": 10458, + "Ġboot": 10459, + ".page": 10460, + "Enumerator": 10461, + "_->": 10462, + "Photo": 10463, + "Ġspring": 10464, + ".\",": 10465, + "ĠDictionary": 10466, + "BJECT": 10467, + "Ġlocations": 10468, + "Ġsamples": 10469, + "InputStream": 10470, + "ĠBrown": 10471, + "Ġstats": 10472, + "quality": 10473, + "Ñħ": 10474, + "-dis": 10475, + "Ġhelping": 10476, + "Ġped": 10477, + "(se": 10478, + "ĠWho": 10479, + "alian": 10480, + "internal": 10481, + "Ġft": 10482, + ">().": 10483, + "->{": 10484, + "Ġmine": 10485, + "Ġsector": 10486, + "Ġgro": 10487, + "Ġopportunities": 10488, + "Ġü": 10489, + "Ġmp": 10490, + "Ġalleged": 10491, + "Ġdoubt": 10492, + "Mouse": 10493, + "About": 10494, + "_part": 10495, + "Ġchair": 10496, + "Ġstopped": 10497, + "loop": 10498, + "entities": 10499, + "Ġapps": 10500, + "ansion": 10501, + "Ġmental": 10502, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 10503, + "FR": 10504, + "Ġdefend": 10505, + "care": 10506, + "Ġideal": 10507, + "/api": 10508, + "urface": 10509, + "Ġele": 10510, + "ulator": 10511, + "ĠRights": 10512, + "anguages": 10513, + "Ġfunds": 10514, + "Ġadapt": 10515, + "Attributes": 10516, + "Ġdeploy": 10517, + "opts": 10518, + "Ġvalidation": 10519, + "Ġconcerns": 10520, + "uce": 10521, + ".num": 10522, + "ulture": 10523, + "ila": 10524, + "Ġcup": 10525, + "Ġpure": 10526, + ".Fore": 10527, + "ĠHashMap": 10528, + ".valueOf": 10529, + "asm": 10530, + "MO": 10531, + "Ġcs": 10532, + "Ġstores": 10533, + "Ġ************************************************************************": 10534, + "Ġcommunication": 10535, + "mem": 10536, + ".EventHandler": 10537, + ".Status": 10538, + "_right": 10539, + ".setOn": 10540, + "Sheet": 10541, + "Ġidentify": 10542, + "enerated": 10543, + "ordered": 10544, + "Ġ\"[": 10545, + "Ġswe": 10546, + "Condition": 10547, + "ĠAccording": 10548, + "Ġprepare": 10549, + "Ġrob": 10550, + "Pool": 10551, + "Ġsport": 10552, + "rv": 10553, + "ĠRouter": 10554, + "Ġalternative": 10555, + "([]": 10556, + "ĠChicago": 10557, + "ipher": 10558, + "ische": 10559, + "ĠDirector": 10560, + "kl": 10561, + "ĠWil": 10562, + "keys": 10563, + "Ġmysql": 10564, + "Ġwelcome": 10565, + "king": 10566, + "ĠManager": 10567, + "Ġcaught": 10568, + ")}Ċ": 10569, + "Score": 10570, + "_PR": 10571, + "Ġsurvey": 10572, + "hab": 10573, + "Headers": 10574, + "ADER": 10575, + "Ġdecor": 10576, + "Ġturns": 10577, + "Ġradius": 10578, + "errupt": 10579, + "Cor": 10580, + "Ġmel": 10581, + "Ġintr": 10582, + "(q": 10583, + "ĠAC": 10584, + "amos": 10585, + "MAX": 10586, + "ĠGrid": 10587, + "ĠJesus": 10588, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 10589, + ".DE": 10590, + "Ġts": 10591, + "Ġlinked": 10592, + "free": 10593, + "ĠQt": 10594, + "Ġ/**čĊ": 10595, + "Ġfaster": 10596, + "ctr": 10597, + "_J": 10598, + "DT": 10599, + ".Check": 10600, + "Ġcombination": 10601, + "Ġintended": 10602, + "-the": 10603, + "-type": 10604, + "ectors": 10605, + "ami": 10606, + "uting": 10607, + "Ġuma": 10608, + "XML": 10609, + "UCT": 10610, + "Ap": 10611, + "ĠRandom": 10612, + "Ġran": 10613, + ".sort": 10614, + "Ġsorted": 10615, + ".Un": 10616, + "_PER": 10617, + "itory": 10618, + "Ġpriority": 10619, + "ĠGal": 10620, + "ĠOld": 10621, + "hot": 10622, + "ĠDisplay": 10623, + "(sub": 10624, + "_TH": 10625, + "_Y": 10626, + "ĠCare": 10627, + "loading": 10628, + "Kind": 10629, + "_handle": 10630, + ",,": 10631, + "rase": 10632, + "_replace": 10633, + ".addEventListener": 10634, + "ĠRT": 10635, + "Ġentered": 10636, + "gers": 10637, + "Ġich": 10638, + "(start": 10639, + "/app": 10640, + "Ġbrother": 10641, + "Memory": 10642, + "Outlet": 10643, + "Ġutf": 10644, + "prec": 10645, + "Ġnavigation": 10646, + "ORK": 10647, + "Ġdst": 10648, + "Detail": 10649, + "Ġaudience": 10650, + "Ġdur": 10651, + "Ġcluster": 10652, + "unched": 10653, + "Ġ],": 10654, + "Ġcomfortable": 10655, + ".values": 10656, + "ĠTotal": 10657, + "Ġsnap": 10658, + "Ġstandards": 10659, + "Ġperformed": 10660, + "hand": 10661, + "(\"@": 10662, + "åŃ": 10663, + "Ġphil": 10664, + "ibr": 10665, + "trim": 10666, + "Ġforget": 10667, + "Ġdoctor": 10668, + ".TextBox": 10669, + "icons": 10670, + ",s": 10671, + "ĠOp": 10672, + "Sm": 10673, + "Stop": 10674, + "ĉList": 10675, + "ĉu": 10676, + "Comment": 10677, + "_VERSION": 10678, + ".Xtra": 10679, + "Person": 10680, + "rb": 10681, + "LOB": 10682, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĊ": 10683, + "ĠCentral": 10684, + "ICK": 10685, + "raq": 10686, + "Ġputting": 10687, + "Ġmd": 10688, + "ĠLove": 10689, + "Program": 10690, + "Border": 10691, + "oor": 10692, + "Ġallowing": 10693, + "after": 10694, + "Ġentries": 10695, + "ĠMaybe": 10696, + "]).": 10697, + "ĠShort": 10698, + ")\\": 10699, + ".now": 10700, + "friend": 10701, + "Ġprefer": 10702, + "ĠGPIO": 10703, + "osis": 10704, + "ĠGameObject": 10705, + "Ġskip": 10706, + "Ġcompetition": 10707, + "_match": 10708, + "lications": 10709, + "_CONT": 10710, + ".groupBox": 10711, + "Ġals": 10712, + "\"We": 10713, + "_eq": 10714, + "lan": 10715, + "_search": 10716, + "ĠMusic": 10717, + "asis": 10718, + "Ġbind": 10719, + "ĠIsland": 10720, + "rum": 10721, + "(E": 10722, + "Ġseat": 10723, + "Video": 10724, + "Ġack": 10725, + "reek": 10726, + "={()": 10727, + "Ġrating": 10728, + "Ġrestaurant": 10729, + "DEX": 10730, + "(buf": 10731, + "pping": 10732, + "uality": 10733, + "Ġleague": 10734, + "Ġfocused": 10735, + "apon": 10736, + "$data": 10737, + "CLUD": 10738, + "CLUDING": 10739, + "Ġabsolute": 10740, + "(query": 10741, + "Ġtells": 10742, + "Ang": 10743, + "Ġcommunities": 10744, + "Ġhonest": 10745, + "oking": 10746, + "Ġapart": 10747, + "arity": 10748, + "/$": 10749, + "_module": 10750, + "ĠEnc": 10751, + ".an": 10752, + ".Config": 10753, + "Cre": 10754, + "Ġshock": 10755, + "ĠArab": 10756, + "IENT": 10757, + "/re": 10758, + "Ġretrie": 10759, + "ycler": 10760, + "isa": 10761, + "ĠOrgan": 10762, + ".graph": 10763, + "Ġí": 10764, + "ĠBAS": 10765, + "Enum": 10766, + "Ġpossibly": 10767, + "ÑĢаÐ": 10768, + "ĠJapanese": 10769, + "Ġcraft": 10770, + "ĠPlace": 10771, + "Ġtalent": 10772, + "Ġfunding": 10773, + "Ġconfirmed": 10774, + "Ġcycle": 10775, + "/x": 10776, + "GE": 10777, + "Ġhearing": 10778, + "Ġplants": 10779, + "Ġmouth": 10780, + "pages": 10781, + "oria": 10782, + "ĠRemove": 10783, + "_total": 10784, + "Ġod": 10785, + "ollapse": 10786, + "door": 10787, + "Ġbought": 10788, + "Ġaddr": 10789, + "ARCH": 10790, + "_dim": 10791, + "dden": 10792, + "Ġdecades": 10793, + "REQUEST": 10794, + "Ġversions": 10795, + "fire": 10796, + "Ġmoves": 10797, + "fb": 10798, + "Ġcoffee": 10799, + ".connect": 10800, + "ĠRow": 10801, + "Ġschema": 10802, + "Scope": 10803, + "-Type": 10804, + "Ġfighting": 10805, + "Ġretail": 10806, + "Ġmodified": 10807, + "TF": 10808, + "Files": 10809, + "nie": 10810, + "_command": 10811, + "stone": 10812, + "ĠÑĤ": 10813, + "_thread": 10814, + "Ġbond": 10815, + "ĠDevelopment": 10816, + "Ġpt": 10817, + "FORM": 10818, + "plet": 10819, + "Ġidentified": 10820, + "cpp": 10821, + "Ġcoding": 10822, + "oked": 10823, + "ĠMaster": 10824, + "IDTH": 10825, + "Ġresidents": 10826, + "redit": 10827, + "ĠPhoto": 10828, + "=-": 10829, + "unte": 10830, + "ateur": 10831, + "_STATE": 10832, + "ĠSing": 10833, + "Ġsheet": 10834, + ".val": 10835, + "orse": 10836, + "Ġhers": 10837, + "Ġdetermined": 10838, + "Common": 10839, + "Ġwed": 10840, + "_queue": 10841, + "PH": 10842, + "ĠAtl": 10843, + "cred": 10844, + "/LICENSE": 10845, + "Ġmes": 10846, + "Ġadvanced": 10847, + ".java": 10848, + ".Sh": 10849, + "Go": 10850, + "kill": 10851, + "fp": 10852, + "_settings": 10853, + "Ġpal": 10854, + "Ġtruck": 10855, + "Ġcombined": 10856, + "Ġ\"${": 10857, + "ĠCorpor": 10858, + "Ġjoined": 10859, + "ĠJose": 10860, + "ĠCup": 10861, + "uns": 10862, + "estival": 10863, + "levision": 10864, + "Ġbroken": 10865, + "Ġmarriage": 10866, + "ĠWestern": 10867, + "Ġrepresents": 10868, + "ĠTitle": 10869, + "Ġss": 10870, + ".Ass": 10871, + "ongoose": 10872, + "iento": 10873, + "<>();Ċ": 10874, + "Ġabsolutely": 10875, + "Ġsmooth": 10876, + "TERN": 10877, + "ĠUnless": 10878, + "Word": 10879, + "Ġmerge": 10880, + "igan": 10881, + "ĠVol": 10882, + "Ġnn": 10883, + ".getId": 10884, + "Ġз": 10885, + "Ġsexy": 10886, + "Ġseeking": 10887, + "Single": 10888, + ".this": 10889, + "Ġkom": 10890, + "bound": 10891, + ";\"": 10892, + "ĠfontSize": 10893, + "_df": 10894, + "Ġinjury": 10895, + "(H": 10896, + "Ġissued": 10897, + "_END": 10898, + ":self": 10899, + "Ġpatch": 10900, + "Ġleaves": 10901, + "Ġadopt": 10902, + "FileName": 10903, + "ãĢIJ": 10904, + "Ġexecutive": 10905, + "ĠByte": 10906, + "]))Ċ": 10907, + "Ġnu": 10908, + "outing": 10909, + "cluding": 10910, + "-R": 10911, + ".options": 10912, + "Ġsubstant": 10913, + "avax": 10914, + "ĠBUT": 10915, + "Ġtechnical": 10916, + "Ġtwice": 10917, + "Ġmás": 10918, + "Ġunivers": 10919, + "yr": 10920, + "Ġdrag": 10921, + "ĠDC": 10922, + "Ġsed": 10923, + "Ġbot": 10924, + "ĠPal": 10925, + "ĠHall": 10926, + "forcement": 10927, + "Ġauch": 10928, + ".mod": 10929, + "notation": 10930, + "_files": 10931, + ".line": 10932, + "_flag": 10933, + "[name": 10934, + "Ġresolution": 10935, + "Ġbott": 10936, + "(\"[": 10937, + "ende": 10938, + "(arr": 10939, + "Free": 10940, + "(@\"": 10941, + "ĠDistrict": 10942, + "PEC": 10943, + ":-": 10944, + "Picker": 10945, + "ĠJo": 10946, + "ĠĠĠĠĠĊ": 10947, + "ĠRiver": 10948, + "_rows": 10949, + "Ġhelpful": 10950, + "Ġmassive": 10951, + "---Ċ": 10952, + "Ġmeasures": 10953, + "ĠRuntime": 10954, + "Ġworry": 10955, + "ĠSpec": 10956, + "ĉD": 10957, + "ãĢij": 10958, + "Ġ){Ċ": 10959, + "Ġworse": 10960, + "(filename": 10961, + "Ġlay": 10962, + "Ġmagic": 10963, + "ĠTheir": 10964, + "oul": 10965, + "stroy": 10966, + "ĠWhere": 10967, + "Ġsudden": 10968, + "Ġdefe": 10969, + "Ġbinding": 10970, + "Ġflight": 10971, + "ĠOnInit": 10972, + "ĠWomen": 10973, + "ĠPolicy": 10974, + "Ġdrugs": 10975, + "ishing": 10976, + "('../": 10977, + "ĠMel": 10978, + "peat": 10979, + "tor": 10980, + "Ġproposed": 10981, + "Ġstated": 10982, + "_RES": 10983, + "Ġeast": 10984, + "ĠCONDITION": 10985, + "_desc": 10986, + "Ġwinning": 10987, + "folio": 10988, + "Mapper": 10989, + "ĠPan": 10990, + "ĠAnge": 10991, + ".servlet": 10992, + "Ġcopies": 10993, + "LM": 10994, + "Ġvm": 10995, + "åį": 10996, + "Ġdictionary": 10997, + "Seg": 10998, + "elines": 10999, + "ĠSend": 11000, + "Ġiron": 11001, + "ĠFort": 11002, + ".domain": 11003, + "Ġdebate": 11004, + "NotNull": 11005, + "eq": 11006, + "acher": 11007, + "lf": 11008, + "ĉfmt": 11009, + "Ġlawy": 11010, + "ÄŁ": 11011, + "ĠMen": 11012, + "Ġtrim": 11013, + "(NULL": 11014, + "Ġ!!": 11015, + "Ġpad": 11016, + "Ġfollows": 11017, + "\"][\"": 11018, + "requ": 11019, + "ĠEp": 11020, + ".github": 11021, + "(img": 11022, + "eto": 11023, + "('\\": 11024, + "Services": 11025, + "umbnail": 11026, + "_main": 11027, + "pleted": 11028, + "fortunately": 11029, + "Ġwindows": 11030, + "Ġplane": 11031, + "ĠConnection": 11032, + ".local": 11033, + "uard": 11034, + "}\\": 11035, + "==\"": 11036, + "andon": 11037, + "ĠRoy": 11038, + "west": 11039, + "iginal": 11040, + "emies": 11041, + "itz": 11042, + "'):Ċ": 11043, + "ĠPeter": 11044, + "Ġtough": 11045, + "Ġreduced": 11046, + "Ġcalculate": 11047, + "Ġrapid": 11048, + "customer": 11049, + "Ġefficient": 11050, + "Ġmedium": 11051, + "Ġfell": 11052, + ".ref": 11053, + "ĠCas": 11054, + "Ġfeedback": 11055, + "Speed": 11056, + "(output": 11057, + "aje": 11058, + "Ġcategories": 11059, + "Ġfee": 11060, + "};": 11061, + "Ġdeleted": 11062, + "reh": 11063, + "Ġproof": 11064, + "Desc": 11065, + "Build": 11066, + "Ġsides": 11067, + ".ArrayList": 11068, + "-%": 11069, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 11070, + "ر": 11071, + ".match": 11072, + "ли": 11073, + "Ġfeels": 11074, + "Ġachieve": 11075, + "Ġclim": 11076, + "_ON": 11077, + "ĠCD": 11078, + "Ġteacher": 11079, + "_current": 11080, + "bn": 11081, + "_PL": 11082, + "isting": 11083, + "Enable": 11084, + "GEN": 11085, + "Ġtv": 11086, + "Ġsock": 11087, + "Ġplays": 11088, + "Ġdiscount": 11089, + "ĠKE": 11090, + "ĠDebug": 11091, + "Fore": 11092, + "ĠIraq": 11093, + "Ġappearance": 11094, + "Mon": 11095, + "Ġstyled": 11096, + "ĠHuman": 11097, + "iot": 11098, + "ĠHistory": 11099, + "Ġsac": 11100, + "ĠCollection": 11101, + "Ġrecommended": 11102, + ".Selected": 11103, + "Ġorganizations": 11104, + "Ġdiscovered": 11105, + "cohol": 11106, + "adas": 11107, + "ĠThomas": 11108, + "May": 11109, + "Ġconserv": 11110, + "Ġdomin": 11111, + "ĠFollow": 11112, + "ĠSection": 11113, + "ĠThanks": 11114, + "Username": 11115, + "Ġrecipe": 11116, + "Ġwonderful": 11117, + ".sleep": 11118, + "_if": 11119, + "ĉĊĉĊ": 11120, + "orno": 11121, + "Ġru": 11122, + "_target": 11123, + ".\"\"": 11124, + "à¦": 11125, + "EventArgs": 11126, + "Ġinputs": 11127, + "Ġfif": 11128, + "Ġvision": 11129, + "cy": 11130, + "ĠSeries": 11131, + ")(((": 11132, + "Ġtrading": 11133, + "Ġmarker": 11134, + "Begin": 11135, + "Ġtypically": 11136, + "Ġcauses": 11137, + "dropdown": 11138, + "_DEBUG": 11139, + "Ġdetect": 11140, + "country": 11141, + "!\");Ċ": 11142, + "ĉR": 11143, + "appy": 11144, + "Ġcref": 11145, + "('<": 11146, + "\"=>": 11147, + "ĠLE": 11148, + "reader": 11149, + "Ġadministr": 11150, + "õ": 11151, + "ucket": 11152, + "Ġfashion": 11153, + ".char": 11154, + "izar": 11155, + "Ġdisable": 11156, + "Ġsuc": 11157, + "ĠLive": 11158, + "issue": 11159, + "Ġmetadata": 11160, + "flags": 11161, + "ĠðŁ": 11162, + "Ġcommitted": 11163, + "Ġva": 11164, + "Ġrough": 11165, + "Ġ'''Ċ": 11166, + "Ġhighlight": 11167, + "_vars": 11168, + "VO": 11169, + "Ġencoding": 11170, + "-Z": 11171, + "_sign": 11172, + "$(\"#": 11173, + "Ġrain": 11174, + "reatest": 11175, + "ĠEND": 11176, + "Selection": 11177, + "Ġcandidates": 11178, + "Ġsav": 11179, + ".Empty": 11180, + "Ġdecisions": 11181, + "Ġcollabor": 11182, + "ridge": 11183, + "feed": 11184, + "ression": 11185, + "Ġpersons": 11186, + "VM": 11187, + "ega": 11188, + "_BIT": 11189, + "According": 11190, + "acked": 11191, + "Ġdollars": 11192, + "_loss": 11193, + "ĠCost": 11194, + "}\"Ċ": 11195, + "Notification": 11196, + "Ġprostit": 11197, + "Ġauthority": 11198, + ".rec": 11199, + "Ġspokes": 11200, + "ĠToday": 11201, + "istant": 11202, + "ĠHead": 11203, + "âĢĿ.": 11204, + "ertainment": 11205, + "cean": 11206, + "culate": 11207, + "Ġven": 11208, + "However": 11209, + "_arr": 11210, + "Ġtokens": 11211, + "Graph": 11212, + "ĠJud": 11213, + "ĠVirgin": 11214, + "ĠSerial": 11215, + "unning": 11216, + "Mutable": 11217, + "agers": 11218, + ".csv": 11219, + "Ġdeveloping": 11220, + "Ġinstructions": 11221, + "Ġpromise": 11222, + "Ġrequested": 11223, + "_encode": 11224, + "/\"": 11225, + "ĠIcon": 11226, + "uilt": 11227, + "-day": 11228, + "Ġintelligence": 11229, + ".IS": 11230, + "ĠObservable": 11231, + "ĠHard": 11232, + "Bool": 11233, + "idential": 11234, + ".Anchor": 11235, + "Ġselling": 11236, + "CI": 11237, + "AGES": 11238, + "tle": 11239, + "bur": 11240, + "UFFER": 11241, + "RY": 11242, + "Ġbigger": 11243, + "Ġrat": 11244, + "Ġfamous": 11245, + "Ġtypename": 11246, + "Ġexplained": 11247, + "}}Ċ": 11248, + "Ġnuclear": 11249, + "-N": 11250, + "Ġcrisis": 11251, + "ĠEnter": 11252, + "Ġanswers": 11253, + "/${": 11254, + "/pl": 11255, + "Ġsequ": 11256, + "_next": 11257, + "mask": 11258, + "Ġstanding": 11259, + "Ġplenty": 11260, + "ĠCross": 11261, + "ĉret": 11262, + "dro": 11263, + "ĠCast": 11264, + "=true": 11265, + "ĠChris": 11266, + "icio": 11267, + "ĠMike": 11268, + "Decimal": 11269, + "addComponent": 11270, + "Len": 11271, + "Ġcock": 11272, + "Ġ#{": 11273, + "URN": 11274, + "": 11403, + "Ġ*=": 11404, + "ĠPS": 11405, + "Ġdangerous": 11406, + "[p": 11407, + "OME": 11408, + "Other": 11409, + "ĠStringBuilder": 11410, + "Points": 11411, + "heading": 11412, + "Ġcurrency": 11413, + "Ġpercentage": 11414, + "_API": 11415, + "Ġclassic": 11416, + "thead": 11417, + "ĠMO": 11418, + "FE": 11419, + "Idx": 11420, + "await": 11421, + "Ġè": 11422, + "Ġaccident": 11423, + "Ġvariant": 11424, + "Ġmyst": 11425, + "ĠLand": 11426, + "ĠBre": 11427, + "Ġharm": 11428, + "ĠAcc": 11429, + "Ġcharged": 11430, + "iones": 11431, + "Visibility": 11432, + "arry": 11433, + "ĠLanguage": 11434, + "Ġwalking": 11435, + "\".ĊĊ": 11436, + "ifer": 11437, + "Ġleadership": 11438, + ".From": 11439, + "ynam": 11440, + "Ġtimestamp": 11441, + "ipt": 11442, + "ĠHas": 11443, + "REFER": 11444, + "ĠIts": 11445, + "Ġlistener": 11446, + "UTE": 11447, + "_description": 11448, + "Ġexperiences": 11449, + "Ġcreates": 11450, + "RS": 11451, + "cart": 11452, + "black": 11453, + "Ġchoices": 11454, + "war": 11455, + "Ġ'''": 11456, + "Ġordered": 11457, + "Ġevening": 11458, + "Ġpil": 11459, + "Ġtun": 11460, + "ĠBad": 11461, + "(app": 11462, + "random": 11463, + "Ġexplicit": 11464, + "Ġarrived": 11465, + "Ġfly": 11466, + "Ġeconom": 11467, + "-mail": 11468, + "Ġlists": 11469, + "Ġarchitect": 11470, + "ĠPay": 11471, + "Ġds": 11472, + "ĠSol": 11473, + "Ġvehicles": 11474, + "Hz": 11475, + "-com": 11476, + "Ġking": 11477, + "_equal": 11478, + "ĠHelp": 11479, + "Ġabuse": 11480, + "--;Ċ": 11481, + "Ġextr": 11482, + "Ġchemical": 11483, + "ä¿": 11484, + "Ġorient": 11485, + "Ġbreath": 11486, + "ĠSpace": 11487, + "(element": 11488, + "wait": 11489, + "DED": 11490, + "igma": 11491, + "Ġentr": 11492, + "Ġsob": 11493, + "-name": 11494, + "Ġaffected": 11495, + "ika": 11496, + "Ġcoal": 11497, + "_work": 11498, + "Ġhundreds": 11499, + "Ġpolitics": 11500, + "subject": 11501, + "Ġconsumer": 11502, + "ANGE": 11503, + "Ġrepeated": 11504, + "Send": 11505, + "Ġ#[": 11506, + "Ġprotocol": 11507, + "Ġleads": 11508, + "useum": 11509, + "Every": 11510, + "Import": 11511, + "(count": 11512, + "Ġchallenges": 11513, + "Ġnovel": 11514, + "Ġdepart": 11515, + "bits": 11516, + ".Current": 11517, + "Ġ`${": 11518, + "oting": 11519, + "(\\": 11520, + "Ġcreative": 11521, + "Ġbuff": 11522, + "Ġintroduced": 11523, + "usic": 11524, + "modules": 11525, + "Are": 11526, + "-doc": 11527, + "language": 11528, + "_cache": 11529, + "Ġtod": 11530, + "?>": 11531, + "omething": 11532, + "Ġhun": 11533, + "åº": 11534, + "aters": 11535, + "Intent": 11536, + "Ġimplemented": 11537, + "ĠCase": 11538, + "Children": 11539, + "Ġnotification": 11540, + "Renderer": 11541, + "Wrapper": 11542, + "Objects": 11543, + "tl": 11544, + ".Contains": 11545, + "Plugin": 11546, + ".row": 11547, + "Ġforg": 11548, + "Ġpermit": 11549, + "Ġtargets": 11550, + "ĠIF": 11551, + "Ġtip": 11552, + "sex": 11553, + "Ġsupports": 11554, + "Ġfold": 11555, + "photo": 11556, + "},čĊ": 11557, + "Ġgoogle": 11558, + "$('#": 11559, + "Ġsharing": 11560, + "Ġgoods": 11561, + "vs": 11562, + "ĠDan": 11563, + "Rate": 11564, + "ĠMartin": 11565, + "Ġmanner": 11566, + "lie": 11567, + ".The": 11568, + "Internal": 11569, + "ĠCONTR": 11570, + "Mock": 11571, + "RIGHT": 11572, + "Ġ'{": 11573, + "Ġcontrols": 11574, + "Mat": 11575, + "Ġmand": 11576, + "Ġextended": 11577, + "Ok": 11578, + "Ġembed": 11579, + "Ġplanet": 11580, + "ĠNon": 11581, + "-ch": 11582, + ")\",": 11583, + "epar": 11584, + "Ġbelieved": 11585, + "ĠEnvironment": 11586, + "ĠFriend": 11587, + "-res": 11588, + "Ġhandling": 11589, + "nic": 11590, + "-level": 11591, + "scri": 11592, + "Xml": 11593, + "BE": 11594, + "ungen": 11595, + "Ġalter": 11596, + "[idx": 11597, + "Pop": 11598, + "cam": 11599, + "Ġ(((": 11600, + "Ġshipping": 11601, + "Ġbattery": 11602, + "iddleware": 11603, + "MC": 11604, + "Ġimpl": 11605, + "otation": 11606, + "ĠLab": 11607, + "