diff --git a/.gitattributes b/.gitattributes
index a6344aac8c09253b3b630fb776ae94478aa0275b..52373fe24473b1aa44333d318f578ae6bf04b49b 100644
--- a/.gitattributes
+++ b/.gitattributes
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
*.zip filter=lfs diff=lfs merge=lfs -text
*.zst filter=lfs diff=lfs merge=lfs -text
*tfevents* filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text
diff --git a/README.md b/README.md
index 7be5fc7f47d5db027d120b8024982df93db95b74..1f774e20cb5e849dcf0a63f311cd392d0d1627af 100644
--- a/README.md
+++ b/README.md
@@ -1,3 +1,11 @@
---
+language:
+- en
license: mit
+base_model: FuseAI/FuseO1-DeepSeekR1-QwQ-SkyT1-32B-Preview
+base_model_relation: quantized
+library_name: mlc-llm
+pipeline_tag: text-generation
---
+
+A 4-bit GPTQ-quantized version of [FuseAI/FuseO1-DeepSeekR1-QwQ-SkyT1-32B-Preview](https://huggingface.co/FuseAI/FuseO1-DeepSeekR1-QwQ-SkyT1-32B-Preview) for inference with the [Private LLM](http://privatellm.app) app.
diff --git a/config.json b/config.json
new file mode 100644
index 0000000000000000000000000000000000000000..d9e7e08f5c8e277065c653a7c72987d064f55208
--- /dev/null
+++ b/config.json
@@ -0,0 +1,5 @@
+{
+ "quantization_config": {
+ "bits": 4
+ }
+}
diff --git a/ndarray-cache.json b/ndarray-cache.json
new file mode 100644
index 0000000000000000000000000000000000000000..c0765fafb15b5d286b9146ff20a9da7c46dffadb
--- /dev/null
+++ b/ndarray-cache.json
@@ -0,0 +1,9687 @@
+{
+ "metadata": {
+ "ParamSize": 709,
+ "ParamBytes": 16895535104.0,
+ "BitsPerParam": 4.125405656518088
+ },
+ "records": [
+ {
+ "dataPath": "params_shard_0.bin",
+ "format": "raw-shard",
+ "nbytes": 389283840,
+ "records": [
+ {
+ "name": "lm_head.q_weight",
+ "shape": [
+ 640,
+ 152064
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 389283840,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e514aca4c682d50ee4cb08b855b1154d"
+ },
+ {
+ "dataPath": "params_shard_1.bin",
+ "format": "raw-shard",
+ "nbytes": 389283840,
+ "records": [
+ {
+ "name": "model.embed_tokens.q_weight",
+ "shape": [
+ 152064,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 389283840,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9cb18e190462c9789f0b70fbd536add8"
+ },
+ {
+ "dataPath": "params_shard_2.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.0.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "06dad7677b4ed79524a44ddbd1a6fcf9"
+ },
+ {
+ "dataPath": "params_shard_3.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.0.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9cf3a271e940b843da9ba8b06c130ebf"
+ },
+ {
+ "dataPath": "params_shard_4.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.0.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ef5c0e5c075cc868c9e78370cbd5905e"
+ },
+ {
+ "dataPath": "params_shard_5.bin",
+ "format": "raw-shard",
+ "nbytes": 31574016,
+ "records": [
+ {
+ "name": "lm_head.q_scale",
+ "shape": [
+ 40,
+ 152064
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 12165120,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.embed_tokens.q_scale",
+ "shape": [
+ 152064,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 12165120,
+ "byteOffset": 12165120
+ },
+ {
+ "name": "model.layers.0.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 24330240
+ },
+ {
+ "name": "model.layers.0.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 24340480
+ },
+ {
+ "name": "model.layers.0.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 26552320
+ },
+ {
+ "name": "model.layers.0.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 30976000
+ },
+ {
+ "name": "model.layers.0.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 30986240
+ },
+ {
+ "name": "model.layers.0.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 31000576
+ }
+ ],
+ "md5sum": "034fa3f03faa5e0862833237b4997a08"
+ },
+ {
+ "dataPath": "params_shard_6.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.1.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ffb4c1f6b544958fda42aeb7a0561d17"
+ },
+ {
+ "dataPath": "params_shard_7.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.1.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1d50d56030938741077b8c2417fd9565"
+ },
+ {
+ "dataPath": "params_shard_8.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.1.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c24aa7a97eecd8306733ef40411888a6"
+ },
+ {
+ "dataPath": "params_shard_9.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.0.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.0.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.1.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.1.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.1.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.1.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.1.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.1.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "916f5d77066a2e697479774fb5922929"
+ },
+ {
+ "dataPath": "params_shard_10.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.10.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0114f243a054ab0982b3e368fa88d4e6"
+ },
+ {
+ "dataPath": "params_shard_11.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.10.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "364bc012bc3dbbcc979546700586eaad"
+ },
+ {
+ "dataPath": "params_shard_12.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.10.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8d3d9ead6aefe403f79d2dd96be98ab9"
+ },
+ {
+ "dataPath": "params_shard_13.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.1.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.1.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.10.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.10.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.10.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.10.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.10.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.10.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "d38ddf35e432739af3c56ad915959601"
+ },
+ {
+ "dataPath": "params_shard_14.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.11.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d346237f43db034f039bf0be28eea5a6"
+ },
+ {
+ "dataPath": "params_shard_15.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.11.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ca66f1dbce88e8ee582ff28cdcd72592"
+ },
+ {
+ "dataPath": "params_shard_16.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.11.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2b259e4b1b8f61d6a7d7be074403e005"
+ },
+ {
+ "dataPath": "params_shard_17.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.10.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.10.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.11.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.11.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.11.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.11.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.11.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.11.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "e9375510bd1991be58e959f36bc674df"
+ },
+ {
+ "dataPath": "params_shard_18.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.12.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b7b0d3eb8d9f53be076e6f126c82b454"
+ },
+ {
+ "dataPath": "params_shard_19.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.12.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f072c7c988e923467fbba8e570fa8918"
+ },
+ {
+ "dataPath": "params_shard_20.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.12.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ac361295b9a492c04db5136930eaaf99"
+ },
+ {
+ "dataPath": "params_shard_21.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.11.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.11.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.12.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.12.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.12.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.12.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.12.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.12.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "92834dd74fbdafaa368be5189d48d38b"
+ },
+ {
+ "dataPath": "params_shard_22.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.13.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6f250ddb642d28d70b2d6779d26e38c1"
+ },
+ {
+ "dataPath": "params_shard_23.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.13.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a9876973d82afea1f933fba566974bdb"
+ },
+ {
+ "dataPath": "params_shard_24.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.13.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2488ac1e9ae70ea543ad63711e1350ff"
+ },
+ {
+ "dataPath": "params_shard_25.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.12.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.12.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.13.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.13.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.13.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.13.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.13.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.13.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "db0cf5718ad37539595f7b7cf55467e5"
+ },
+ {
+ "dataPath": "params_shard_26.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.14.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f66ea1fd330c1d98ede9204fd1c27f4f"
+ },
+ {
+ "dataPath": "params_shard_27.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.14.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c2d4691f83ce44f17dd6fc6b3e0b6fe1"
+ },
+ {
+ "dataPath": "params_shard_28.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.14.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d28c11a8cf83bd470b4a990726e82586"
+ },
+ {
+ "dataPath": "params_shard_29.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.13.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.13.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.14.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.14.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.14.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.14.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.14.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.14.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "a7aac5f05e15094024233386b6453d35"
+ },
+ {
+ "dataPath": "params_shard_30.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.15.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "50ff011d62eca6338f26482fca3b0b63"
+ },
+ {
+ "dataPath": "params_shard_31.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.15.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5230d3593c8fa3a1c62258f553f5033c"
+ },
+ {
+ "dataPath": "params_shard_32.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.15.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0d9f3196ec6bf1c8d6cef24ddc1bddab"
+ },
+ {
+ "dataPath": "params_shard_33.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.14.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.14.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.15.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.15.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.15.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.15.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.15.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.15.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "362bc54c797e7961742221c537a011f1"
+ },
+ {
+ "dataPath": "params_shard_34.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.16.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "51d6e8dd2adec67c7c9e09163b8d2704"
+ },
+ {
+ "dataPath": "params_shard_35.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.16.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3cf0a54ba3fb8784fa15593df890b628"
+ },
+ {
+ "dataPath": "params_shard_36.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.16.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "402801c5c379962b172b6c18bc0724b4"
+ },
+ {
+ "dataPath": "params_shard_37.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.15.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.15.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.16.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.16.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.16.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.16.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.16.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.16.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "eeb784751bda3f7472710e55ba7c98c3"
+ },
+ {
+ "dataPath": "params_shard_38.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.17.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "95c80c01c527dab61b5b932590ee350c"
+ },
+ {
+ "dataPath": "params_shard_39.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.17.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fff693a327d921b8e909e23d02eba397"
+ },
+ {
+ "dataPath": "params_shard_40.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.17.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5761436559db39f44239e420956c96f5"
+ },
+ {
+ "dataPath": "params_shard_41.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.16.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.16.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.17.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.17.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.17.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.17.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.17.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.17.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "b2672e2beb049000ad033a3d4755737a"
+ },
+ {
+ "dataPath": "params_shard_42.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.18.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7cd69ffcc9a195f6bfe807412dedbd86"
+ },
+ {
+ "dataPath": "params_shard_43.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.18.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5a9e5bf27ecf3b55faaa2a6cc5dd0518"
+ },
+ {
+ "dataPath": "params_shard_44.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.18.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ebca7cc04bcabe46320b4869482939a0"
+ },
+ {
+ "dataPath": "params_shard_45.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.17.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.17.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.18.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.18.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.18.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.18.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.18.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.18.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "92322a3d2bc91e360980f5990acfdca3"
+ },
+ {
+ "dataPath": "params_shard_46.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.19.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "bdd3e519ca2fb440ab7ff91246698022"
+ },
+ {
+ "dataPath": "params_shard_47.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.19.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "211c698c8869992ccb79bdca68a8444f"
+ },
+ {
+ "dataPath": "params_shard_48.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.19.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "815bc0f80e56793cf2e68f4d134ca462"
+ },
+ {
+ "dataPath": "params_shard_49.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.18.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.18.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.19.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.19.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.19.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.19.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.19.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.19.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "224aa969234d62e700d931ec1e21e262"
+ },
+ {
+ "dataPath": "params_shard_50.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.2.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0c4828a30434f15834be04976ce8bd43"
+ },
+ {
+ "dataPath": "params_shard_51.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.2.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "261c91c378bffef4361c596ef061a146"
+ },
+ {
+ "dataPath": "params_shard_52.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.2.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "91619426adde771e6a780cafbe0b5bdd"
+ },
+ {
+ "dataPath": "params_shard_53.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.19.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.19.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.2.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.2.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.2.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.2.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.2.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.2.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "6498639c39e6df461f75945173d611b5"
+ },
+ {
+ "dataPath": "params_shard_54.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.20.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e3f18601a71ef851af116c3793e277a8"
+ },
+ {
+ "dataPath": "params_shard_55.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.20.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "00a79e4653205ca670d06ac3f2cb03f2"
+ },
+ {
+ "dataPath": "params_shard_56.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.20.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e8bdb0261b918a6c02923c091d053873"
+ },
+ {
+ "dataPath": "params_shard_57.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.2.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.2.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.20.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.20.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.20.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.20.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.20.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.20.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "34c3163bac91ce27b1abc1aa3382e154"
+ },
+ {
+ "dataPath": "params_shard_58.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.21.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f55968be109830ee73bc5f8e68842273"
+ },
+ {
+ "dataPath": "params_shard_59.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.21.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "efe24b37b2e583d26bd82f27f87b823c"
+ },
+ {
+ "dataPath": "params_shard_60.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.21.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0f690e450a0239e5d98e228e5d746942"
+ },
+ {
+ "dataPath": "params_shard_61.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.20.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.20.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.21.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.21.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.21.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.21.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.21.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.21.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "d5a13b29e87787b217a98c1e4f291211"
+ },
+ {
+ "dataPath": "params_shard_62.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.22.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1aae928d1df22c726185ac225bab72c4"
+ },
+ {
+ "dataPath": "params_shard_63.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.22.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b8fab896a0c2e1446edaa67dbff8c66d"
+ },
+ {
+ "dataPath": "params_shard_64.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.22.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "61c349bebaca9f363b514cd0e2978313"
+ },
+ {
+ "dataPath": "params_shard_65.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.21.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.21.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.22.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.22.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.22.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.22.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.22.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.22.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "a489e93a30b8e58bd8ca5c9bdfd65d4d"
+ },
+ {
+ "dataPath": "params_shard_66.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.23.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9de5d042e528a91f9b32c57bffdd0914"
+ },
+ {
+ "dataPath": "params_shard_67.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.23.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a7faca051d2ab44cd16a8cef002643d7"
+ },
+ {
+ "dataPath": "params_shard_68.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.23.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "25fea6f9eca4e3ba9cb8d28877cf7f4d"
+ },
+ {
+ "dataPath": "params_shard_69.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.22.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.22.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.23.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.23.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.23.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.23.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.23.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.23.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "7ad512dea896dfa6d5e02325ac84f553"
+ },
+ {
+ "dataPath": "params_shard_70.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.24.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "37734868c1f5efc3c85964e1fa66360f"
+ },
+ {
+ "dataPath": "params_shard_71.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.24.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8da309bd23173475bc7ab9939a94cd37"
+ },
+ {
+ "dataPath": "params_shard_72.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.24.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3880b9c30c4c691ca444dfc7248debef"
+ },
+ {
+ "dataPath": "params_shard_73.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.23.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.23.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.24.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.24.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.24.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.24.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.24.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.24.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "90e2bdee1aaf106e38b13e30626da90d"
+ },
+ {
+ "dataPath": "params_shard_74.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.25.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "72838ca1efce265b053b38608f9f9ee1"
+ },
+ {
+ "dataPath": "params_shard_75.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.25.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "81aaac09c01cce4ee961676132a571a6"
+ },
+ {
+ "dataPath": "params_shard_76.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.25.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "74ffa5c6a5e6f92f249153c8a5ee5937"
+ },
+ {
+ "dataPath": "params_shard_77.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.24.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.24.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.25.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.25.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.25.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.25.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.25.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.25.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "4fd7e1c28c9032d19c43c79ab498ee6a"
+ },
+ {
+ "dataPath": "params_shard_78.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.26.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "13e964f04c210c6899bad7b5adfa9bad"
+ },
+ {
+ "dataPath": "params_shard_79.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.26.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7124c4fb7527915d5dd7501aa1c59546"
+ },
+ {
+ "dataPath": "params_shard_80.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.26.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e5bb5792ff8f608e50c7990a594c67d7"
+ },
+ {
+ "dataPath": "params_shard_81.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.25.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.25.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.26.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.26.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.26.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.26.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.26.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.26.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "dec04173c08cafd1d292fda5bcdf9ada"
+ },
+ {
+ "dataPath": "params_shard_82.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.27.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ac95ab90e37d02639e749e9b3ecdc6c3"
+ },
+ {
+ "dataPath": "params_shard_83.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.27.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9fb44ceac5ff535efbed085a48746926"
+ },
+ {
+ "dataPath": "params_shard_84.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.27.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6164e1bfb53c7e7b01732ca5d67da336"
+ },
+ {
+ "dataPath": "params_shard_85.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.26.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.26.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.27.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.27.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.27.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.27.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.27.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.27.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "235bfcb4baf0cb76f75aa24bad07755e"
+ },
+ {
+ "dataPath": "params_shard_86.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.28.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "828a3d5674282a737c354d2184e553a0"
+ },
+ {
+ "dataPath": "params_shard_87.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.28.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "588f7f8018065a57499ad786d0fe7550"
+ },
+ {
+ "dataPath": "params_shard_88.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.28.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1f0fec41cb8f1750cf340d1d6ed9864c"
+ },
+ {
+ "dataPath": "params_shard_89.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.27.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.27.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.28.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.28.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.28.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.28.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.28.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.28.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "a9a27a80e6d297d72aa07acb1374351d"
+ },
+ {
+ "dataPath": "params_shard_90.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.29.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2cbad330874b83655fdf1b1ccefa46ac"
+ },
+ {
+ "dataPath": "params_shard_91.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.29.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8aa7682a75eb82e724605957f9d6bb1b"
+ },
+ {
+ "dataPath": "params_shard_92.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.29.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4cd2ab52174f5858181499d8fac88037"
+ },
+ {
+ "dataPath": "params_shard_93.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.28.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.28.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.29.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.29.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.29.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.29.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.29.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.29.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "6c0a2e12ea6f16129c6c9da7bb688a70"
+ },
+ {
+ "dataPath": "params_shard_94.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.3.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f93a950bd3d28c3052a4201042f3c9b1"
+ },
+ {
+ "dataPath": "params_shard_95.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.3.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "10e1b9c0de4d179e0fd242be48edd2fc"
+ },
+ {
+ "dataPath": "params_shard_96.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.3.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c326cba0f5b41b27ed08e5f14f56ed00"
+ },
+ {
+ "dataPath": "params_shard_97.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.29.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.29.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.3.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.3.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.3.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.3.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.3.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.3.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "213c7404722fd4ab580fd2d0ae0eb0da"
+ },
+ {
+ "dataPath": "params_shard_98.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.30.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9623379071afb5a56bd91c14900cee71"
+ },
+ {
+ "dataPath": "params_shard_99.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.30.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5a6eb73d85213850540eeb0b5e77f97e"
+ },
+ {
+ "dataPath": "params_shard_100.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.30.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ed0dc87251271e54ebb05b0ed8a105ae"
+ },
+ {
+ "dataPath": "params_shard_101.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.3.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.3.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.30.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.30.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.30.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.30.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.30.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.30.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "a6425cc0df64e234022874f007b5d3b2"
+ },
+ {
+ "dataPath": "params_shard_102.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.31.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3dfcb0e3e6040f05dd1c12f1430d73bd"
+ },
+ {
+ "dataPath": "params_shard_103.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.31.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fff26b50e7e18d7ef210008d5f37b581"
+ },
+ {
+ "dataPath": "params_shard_104.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.31.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6c3f3dade283c306c6228528b5a6c422"
+ },
+ {
+ "dataPath": "params_shard_105.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.30.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.30.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.31.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.31.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.31.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.31.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.31.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.31.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "3435690b788647cf7a22a8c897addacf"
+ },
+ {
+ "dataPath": "params_shard_106.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.32.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "55d0453e4bf2dc2ad9e613b261df176a"
+ },
+ {
+ "dataPath": "params_shard_107.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.32.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fffd74b7bb7f2af5859d3707c76a1acd"
+ },
+ {
+ "dataPath": "params_shard_108.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.32.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "53d778a64a1d4806f27b2e25f8cf52e9"
+ },
+ {
+ "dataPath": "params_shard_109.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.31.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.31.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.32.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.32.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.32.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.32.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.32.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.32.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "c5d01e9ad249b3e2400c635500323b28"
+ },
+ {
+ "dataPath": "params_shard_110.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.33.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "633fe2e4dd7b2cc3ba3104f7d693120a"
+ },
+ {
+ "dataPath": "params_shard_111.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.33.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "dadaf5b4f17b21ff01803894df64c3e6"
+ },
+ {
+ "dataPath": "params_shard_112.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.33.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6d1ecff8bfc7d59ee842ae591c8ca39c"
+ },
+ {
+ "dataPath": "params_shard_113.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.32.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.32.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.33.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.33.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.33.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.33.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.33.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.33.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "fd70fc08fd9a7c36a1f842ceecae2292"
+ },
+ {
+ "dataPath": "params_shard_114.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.34.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9cc9190cd4517b5d727e59c977ae1671"
+ },
+ {
+ "dataPath": "params_shard_115.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.34.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "33b96f0a90e7de7cb3cee8136875df1b"
+ },
+ {
+ "dataPath": "params_shard_116.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.34.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "70e87a6886a9a179983c450e4b3d34f2"
+ },
+ {
+ "dataPath": "params_shard_117.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.33.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.33.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.34.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.34.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.34.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.34.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.34.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.34.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "8662e0442fe6709eda1068cc35feb61a"
+ },
+ {
+ "dataPath": "params_shard_118.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.35.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d8dbc267b2361240dbffae9cf0c98df6"
+ },
+ {
+ "dataPath": "params_shard_119.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.35.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f4575e2d9703230e49041ecfae0c1ece"
+ },
+ {
+ "dataPath": "params_shard_120.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.35.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d1e631142200c317045dc54fb8eb1098"
+ },
+ {
+ "dataPath": "params_shard_121.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.34.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.34.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.35.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.35.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.35.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.35.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.35.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.35.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "8a3a7e469f4f9706cff4c3f8d9054762"
+ },
+ {
+ "dataPath": "params_shard_122.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.36.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "dbd979dc01ae0116100d677927d494fd"
+ },
+ {
+ "dataPath": "params_shard_123.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.36.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a105a417c96646f092b09ad13f66c5c0"
+ },
+ {
+ "dataPath": "params_shard_124.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.36.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "987861d2cd9a76a340fd6d84071b30c8"
+ },
+ {
+ "dataPath": "params_shard_125.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.35.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.35.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.36.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.36.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.36.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.36.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.36.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.36.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "b6cef9ea47a7d5a2aea87a24d9969eec"
+ },
+ {
+ "dataPath": "params_shard_126.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.37.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "43c54d0acdbd9f90f2ca5d676ef75227"
+ },
+ {
+ "dataPath": "params_shard_127.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.37.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6dcb27eb9c4c47eddb26d11152b8c6f3"
+ },
+ {
+ "dataPath": "params_shard_128.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.37.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "31e6db4b7d2ed24a5ff5ed08f7026c49"
+ },
+ {
+ "dataPath": "params_shard_129.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.36.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.36.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.37.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.37.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.37.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.37.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.37.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.37.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "46e8c4ca3e7b53fbe4d340c5901252c1"
+ },
+ {
+ "dataPath": "params_shard_130.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.38.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f195698dc3dbb4a0a5df03aaf6015ee8"
+ },
+ {
+ "dataPath": "params_shard_131.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.38.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e556fbdfe6fa39b5576ee6757bf8ee5c"
+ },
+ {
+ "dataPath": "params_shard_132.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.38.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "615061220e62d67d9dc5d3f6bc854830"
+ },
+ {
+ "dataPath": "params_shard_133.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.37.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.37.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.38.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.38.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.38.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.38.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.38.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.38.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "6fa78a645efba4983e8e931e54428b51"
+ },
+ {
+ "dataPath": "params_shard_134.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.39.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5a84c2ea31d886315d80ead7fa37684d"
+ },
+ {
+ "dataPath": "params_shard_135.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.39.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0c86d27835c962054b0ea13a54e29f44"
+ },
+ {
+ "dataPath": "params_shard_136.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.39.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8dca2d313911170c1b03bd3905c77869"
+ },
+ {
+ "dataPath": "params_shard_137.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.38.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.38.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.39.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.39.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.39.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.39.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.39.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.39.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "6afdbbbf395fa105cd3105ab42bfec33"
+ },
+ {
+ "dataPath": "params_shard_138.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.4.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "12e8229e94b6ea632832bc5e01052a33"
+ },
+ {
+ "dataPath": "params_shard_139.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.4.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9c64e4be3b125d4b68bd2d7a2621d4ba"
+ },
+ {
+ "dataPath": "params_shard_140.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.4.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "77f5469b3e85a109f8ed6293fe2f98b0"
+ },
+ {
+ "dataPath": "params_shard_141.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.39.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.39.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.4.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.4.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.4.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.4.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.4.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.4.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "9b2fed524429a21074aaa65d47b4f029"
+ },
+ {
+ "dataPath": "params_shard_142.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.40.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "dc0f1d7b326608c9c5c0accc057ba7f5"
+ },
+ {
+ "dataPath": "params_shard_143.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.40.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8bd11a566294007f5a47aa69066ae8c5"
+ },
+ {
+ "dataPath": "params_shard_144.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.40.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0e9424e9f2e585a8c78527f4f46da032"
+ },
+ {
+ "dataPath": "params_shard_145.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.4.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.4.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.40.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.40.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.40.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.40.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.40.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.40.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "49d59055fa03c6720b17235aa4cd1341"
+ },
+ {
+ "dataPath": "params_shard_146.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.41.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ce6cb548ab5d65c1d05d208a7c1a8562"
+ },
+ {
+ "dataPath": "params_shard_147.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.41.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "431a0c935a1c838656d0d360abaf87c8"
+ },
+ {
+ "dataPath": "params_shard_148.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.41.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c0345d1f97de80d6880d0255f742db7a"
+ },
+ {
+ "dataPath": "params_shard_149.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.40.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.40.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.41.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.41.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.41.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.41.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.41.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.41.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "c5c702d10795154ebf6c5d69203f6cc7"
+ },
+ {
+ "dataPath": "params_shard_150.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.42.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "599412788af765dee563f897941219a5"
+ },
+ {
+ "dataPath": "params_shard_151.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.42.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3d5b8027dba42fede295c2641904b230"
+ },
+ {
+ "dataPath": "params_shard_152.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.42.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7ddea37b42a84bd48c244fe9107b6623"
+ },
+ {
+ "dataPath": "params_shard_153.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.41.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.41.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.42.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.42.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.42.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.42.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.42.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.42.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "806ef2c337c7833db9c7d042bc20bf95"
+ },
+ {
+ "dataPath": "params_shard_154.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.43.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "19d802b134d75061059d26195083793f"
+ },
+ {
+ "dataPath": "params_shard_155.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.43.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b1bcb7c6f6c29ea7f091dfdf317187b0"
+ },
+ {
+ "dataPath": "params_shard_156.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.43.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9807ab49bdccdd6953d8d0635832150c"
+ },
+ {
+ "dataPath": "params_shard_157.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.42.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.42.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.43.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.43.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.43.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.43.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.43.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.43.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "02cc7d5baee3ac110fe0c29736a1eb9a"
+ },
+ {
+ "dataPath": "params_shard_158.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.44.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "50ee534f865bcde45f309baa1c201d05"
+ },
+ {
+ "dataPath": "params_shard_159.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.44.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fb851f8fa85e6f54ce8757dd20677e33"
+ },
+ {
+ "dataPath": "params_shard_160.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.44.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "359951516bb3f550113a8b6ed986a128"
+ },
+ {
+ "dataPath": "params_shard_161.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.43.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.43.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.44.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.44.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.44.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.44.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.44.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.44.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "b7bdbc15c70ae333411056e5f66389e0"
+ },
+ {
+ "dataPath": "params_shard_162.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.45.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5526d31d0140de9c501187345ef85b5f"
+ },
+ {
+ "dataPath": "params_shard_163.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.45.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8806ede0ccfcd419ecd854d717b63d84"
+ },
+ {
+ "dataPath": "params_shard_164.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.45.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c946cb01bf428d17ff5ab70017d03b8f"
+ },
+ {
+ "dataPath": "params_shard_165.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.44.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.44.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.45.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.45.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.45.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.45.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.45.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.45.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "f16f7248d3669b07d918662885a23f8b"
+ },
+ {
+ "dataPath": "params_shard_166.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.46.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cb61d7cff6cd74cf5798a42d5b79c7eb"
+ },
+ {
+ "dataPath": "params_shard_167.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.46.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1d89dfce6a7b922786d239bdc34ef1b7"
+ },
+ {
+ "dataPath": "params_shard_168.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.46.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c182aec014c9302c79a8c286dcb9354b"
+ },
+ {
+ "dataPath": "params_shard_169.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.45.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.45.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.46.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.46.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.46.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.46.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.46.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.46.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "75ef3548cb6cf46fb1e021e92815002b"
+ },
+ {
+ "dataPath": "params_shard_170.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.47.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "eee68bcdccca20f727515612b5f143dd"
+ },
+ {
+ "dataPath": "params_shard_171.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.47.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c10ee56c9482ac631e0c049b80802af2"
+ },
+ {
+ "dataPath": "params_shard_172.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.47.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "862b2afa6eadff71c2ecd682b9b8969b"
+ },
+ {
+ "dataPath": "params_shard_173.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.46.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.46.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.47.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.47.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.47.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.47.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.47.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.47.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "00adb009a237138dc72b9ff3e62aa1f7"
+ },
+ {
+ "dataPath": "params_shard_174.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.48.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7b45b1f271c8a13cc0d355c8dd589cc0"
+ },
+ {
+ "dataPath": "params_shard_175.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.48.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f916cee980962dbe0cf51e79d73c900d"
+ },
+ {
+ "dataPath": "params_shard_176.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.48.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "045ce4c39b12a8f24bf65e5c0b7ae3af"
+ },
+ {
+ "dataPath": "params_shard_177.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.47.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.47.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.48.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.48.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.48.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.48.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.48.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.48.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "0c71d311a8ee6d9e2c257692ea5dcf12"
+ },
+ {
+ "dataPath": "params_shard_178.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.49.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b23fc22e29c37f64bf4b9499a89413b8"
+ },
+ {
+ "dataPath": "params_shard_179.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.49.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "04662b979a713f05b50419f2f49fdff7"
+ },
+ {
+ "dataPath": "params_shard_180.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.49.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ace809b959a5c997118d1311ad18b379"
+ },
+ {
+ "dataPath": "params_shard_181.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.48.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.48.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.49.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.49.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.49.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.49.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.49.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.49.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "ba0c89f1f3d2452f1c7ff09fe7f82889"
+ },
+ {
+ "dataPath": "params_shard_182.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.5.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "09da40d803df8f54b101b099389e760d"
+ },
+ {
+ "dataPath": "params_shard_183.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.5.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5bc9d4f6b0d5ed95450b387e693631fe"
+ },
+ {
+ "dataPath": "params_shard_184.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.5.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b891c12458722f2cc4a685b309466170"
+ },
+ {
+ "dataPath": "params_shard_185.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.49.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.49.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.5.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.5.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.5.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.5.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.5.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.5.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "d7c6363c45ece7eea1469cb45dccbd23"
+ },
+ {
+ "dataPath": "params_shard_186.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.50.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4ee5d6495635f48349e165545a209ee2"
+ },
+ {
+ "dataPath": "params_shard_187.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.50.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ee8f2d76b32964b4dc2da2a44a6d7fc8"
+ },
+ {
+ "dataPath": "params_shard_188.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.50.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "eeb4c680c8a58c346b00ed57761972b8"
+ },
+ {
+ "dataPath": "params_shard_189.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.5.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.5.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.50.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.50.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.50.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.50.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.50.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.50.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "52434c08787f2c83e7cabde2574c8538"
+ },
+ {
+ "dataPath": "params_shard_190.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.51.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "20756e3ce960846d21e2432aee3587dc"
+ },
+ {
+ "dataPath": "params_shard_191.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.51.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b926c78a1d37ca2a46daec17f36748ff"
+ },
+ {
+ "dataPath": "params_shard_192.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.51.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f55a8c78ad798072c1051a2aacd45e0a"
+ },
+ {
+ "dataPath": "params_shard_193.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.50.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.50.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.51.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.51.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.51.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.51.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.51.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.51.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "4c386cf1333fc61c960da93e564fbaa0"
+ },
+ {
+ "dataPath": "params_shard_194.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.52.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1d306303a25e1191baa3c1d78cf575a8"
+ },
+ {
+ "dataPath": "params_shard_195.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.52.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5b641e3859382fd2fc5088a537a06d1f"
+ },
+ {
+ "dataPath": "params_shard_196.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.52.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f7368b3e411b445433d1ef9489d6e55f"
+ },
+ {
+ "dataPath": "params_shard_197.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.51.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.51.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.52.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.52.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.52.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.52.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.52.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.52.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "c1aeb519a2e3e1dfdc894b355c8aaa6e"
+ },
+ {
+ "dataPath": "params_shard_198.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.53.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4fc3d783504b165cc7055462ff6e587f"
+ },
+ {
+ "dataPath": "params_shard_199.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.53.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f0fba927f9e8a03c455c5b2fae1d0f16"
+ },
+ {
+ "dataPath": "params_shard_200.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.53.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "30e70dab5c13562bf2f8b9cdbd3e0cda"
+ },
+ {
+ "dataPath": "params_shard_201.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.52.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.52.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.53.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.53.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.53.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.53.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.53.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.53.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "d17ae76071b741bbbe655cfc4670b057"
+ },
+ {
+ "dataPath": "params_shard_202.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.54.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ebce8236d32cfee5ae4d7ec6eb80c35f"
+ },
+ {
+ "dataPath": "params_shard_203.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.54.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "064ee6cd2552d54f45623850da28ef17"
+ },
+ {
+ "dataPath": "params_shard_204.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.54.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0688d5f50da1b03c8a25256707e1e164"
+ },
+ {
+ "dataPath": "params_shard_205.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.53.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.53.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.54.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.54.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.54.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.54.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.54.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.54.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "37390a00a29408430d26c235380cbc3a"
+ },
+ {
+ "dataPath": "params_shard_206.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.55.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8a3b63861b992488063ccf314b93ceab"
+ },
+ {
+ "dataPath": "params_shard_207.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.55.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d6f5696f2f23aea879441e51ef5905fc"
+ },
+ {
+ "dataPath": "params_shard_208.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.55.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cd2d34ab39509bab7cece90490069d70"
+ },
+ {
+ "dataPath": "params_shard_209.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.54.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.54.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.55.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.55.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.55.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.55.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.55.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.55.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "f48e5931bf5c52d0d2ec1fa97e68b071"
+ },
+ {
+ "dataPath": "params_shard_210.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.56.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e2289b575146ec5892dbc9b9e3e2bcb4"
+ },
+ {
+ "dataPath": "params_shard_211.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.56.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "632801adfa2f42376a05d3dcb1ae591b"
+ },
+ {
+ "dataPath": "params_shard_212.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.56.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7019450869b27bffd264f012e0e4f7a6"
+ },
+ {
+ "dataPath": "params_shard_213.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.55.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.55.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.56.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.56.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.56.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.56.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.56.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.56.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "a43a889872faa60671a623150ee2cb31"
+ },
+ {
+ "dataPath": "params_shard_214.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.57.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8052cbd948e6333825c67494356f6f6a"
+ },
+ {
+ "dataPath": "params_shard_215.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.57.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f428916e79cdea1c5a05770782a532be"
+ },
+ {
+ "dataPath": "params_shard_216.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.57.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "41a9d9dd2b461e87fc1dfc99df416f67"
+ },
+ {
+ "dataPath": "params_shard_217.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.56.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.56.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.57.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.57.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.57.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.57.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.57.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.57.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "72c4f9fb3f5fa146404b7ace5a47a667"
+ },
+ {
+ "dataPath": "params_shard_218.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.58.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b9939fff6aa0e4eac26f7c38b0fc1391"
+ },
+ {
+ "dataPath": "params_shard_219.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.58.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "115e4ca8a8d367d30369455afa28eb57"
+ },
+ {
+ "dataPath": "params_shard_220.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.58.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "66e5c5d64654e198345797af054ec119"
+ },
+ {
+ "dataPath": "params_shard_221.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.57.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.57.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.58.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.58.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.58.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.58.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.58.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.58.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "68f38229593a7817f8bc06bba0c9f5c6"
+ },
+ {
+ "dataPath": "params_shard_222.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.59.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4f9acb2337bd126fa0c893f94ce0a745"
+ },
+ {
+ "dataPath": "params_shard_223.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.59.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "43c1c0da3c36d0005d80962299394dd0"
+ },
+ {
+ "dataPath": "params_shard_224.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.59.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "62f230c958e25a4ed90413affca41d72"
+ },
+ {
+ "dataPath": "params_shard_225.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.58.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.58.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.59.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.59.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.59.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.59.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.59.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.59.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "80da5196abf5d6060cda97bb08438abc"
+ },
+ {
+ "dataPath": "params_shard_226.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.6.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c147afb13b4d00a922d7c835a09a8c49"
+ },
+ {
+ "dataPath": "params_shard_227.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.6.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f2e972074c113d65b6e84972300bc14e"
+ },
+ {
+ "dataPath": "params_shard_228.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.6.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3011fbca4c282a1b698e882da230c4da"
+ },
+ {
+ "dataPath": "params_shard_229.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.59.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.59.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.6.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.6.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.6.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.6.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.6.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.6.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "429d637ec66f0000d675c7e93a0f64df"
+ },
+ {
+ "dataPath": "params_shard_230.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.60.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f09a8fb57115ce2ef0ee8b52aca69401"
+ },
+ {
+ "dataPath": "params_shard_231.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.60.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e79cf5927aa78b4a58f558562c627f69"
+ },
+ {
+ "dataPath": "params_shard_232.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.60.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6600da09bbcdd9e03ab8eee2eaec9f6d"
+ },
+ {
+ "dataPath": "params_shard_233.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.6.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.6.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.60.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.60.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.60.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.60.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.60.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.60.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "5dc508b2f74f02360e536e24700863cf"
+ },
+ {
+ "dataPath": "params_shard_234.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.61.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "224484ac6fa25f5d529b314995b913a3"
+ },
+ {
+ "dataPath": "params_shard_235.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.61.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f0b0268f6e4f311eaac7211c8c3e2756"
+ },
+ {
+ "dataPath": "params_shard_236.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.61.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a97dbfa6a3294a7f85736ebdaf6e4a19"
+ },
+ {
+ "dataPath": "params_shard_237.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.60.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.60.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.61.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.61.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.61.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.61.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.61.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.61.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "489f688276e5e7751cee2288d4f02a25"
+ },
+ {
+ "dataPath": "params_shard_238.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.62.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3222e6f9405ee0717a05e1a9cd22f6e8"
+ },
+ {
+ "dataPath": "params_shard_239.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.62.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b38d17d3162c14631de219e0d6f36ed5"
+ },
+ {
+ "dataPath": "params_shard_240.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.62.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cf8e6f72723b4c60ad25ae84a6489b70"
+ },
+ {
+ "dataPath": "params_shard_241.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.61.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.61.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.62.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.62.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.62.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.62.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.62.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.62.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "e7a409ef6716b3dfc2d118acc2b9852b"
+ },
+ {
+ "dataPath": "params_shard_242.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.63.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ecc407247e8ea6fc0999195aaff060d7"
+ },
+ {
+ "dataPath": "params_shard_243.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.63.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d99e70926ab570954322da7965bdfbb0"
+ },
+ {
+ "dataPath": "params_shard_244.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.63.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7a788f9f21e8f8f12aaf6f5ad1b64152"
+ },
+ {
+ "dataPath": "params_shard_245.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.62.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.62.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.63.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.63.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.63.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.63.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.63.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.63.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "7c05d6157ed5292c7f7d11ba79e99c45"
+ },
+ {
+ "dataPath": "params_shard_246.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.7.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f608ffd2f30678a4cc7754b6503f0a32"
+ },
+ {
+ "dataPath": "params_shard_247.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.7.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ce65e55d2eb19cbfa5f8274039493698"
+ },
+ {
+ "dataPath": "params_shard_248.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.7.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "19d4d93de13892f83a826649199a3e52"
+ },
+ {
+ "dataPath": "params_shard_249.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.63.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.63.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.7.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.7.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.7.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.7.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.7.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.7.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "5097b3dda17322d492bcf138a5c76755"
+ },
+ {
+ "dataPath": "params_shard_250.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.8.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cdf1d32e815807d32c10ff6879d9e01e"
+ },
+ {
+ "dataPath": "params_shard_251.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.8.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6fab47a5c535a74d81e51912cac5ed88"
+ },
+ {
+ "dataPath": "params_shard_252.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.8.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "587ca97d5182d02d5234709509f810c6"
+ },
+ {
+ "dataPath": "params_shard_253.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.7.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.7.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.8.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.8.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.8.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.8.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.8.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.8.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "4b16da2148ddb4013727bb1f2153e79f"
+ },
+ {
+ "dataPath": "params_shard_254.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.9.mlp.down_proj.q_weight",
+ "shape": [
+ 3456,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "97e4e1600c287f6f986ecbcc3e05c45c"
+ },
+ {
+ "dataPath": "params_shard_255.bin",
+ "format": "raw-shard",
+ "nbytes": 141557760,
+ "records": [
+ {
+ "name": "model.layers.9.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 640,
+ 55296
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 141557760,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "617f3891306e9b788cc367415ef711b5"
+ },
+ {
+ "dataPath": "params_shard_256.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.9.self_attn.c_attn.q_weight",
+ "shape": [
+ 640,
+ 7168
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5eefe89c5b5bb196400f60fd381b6dbf"
+ },
+ {
+ "dataPath": "params_shard_257.bin",
+ "format": "raw-shard",
+ "nbytes": 20760576,
+ "records": [
+ {
+ "name": "model.layers.8.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.8.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.9.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "model.layers.9.mlp.down_proj.q_scale",
+ "shape": [
+ 216,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 2211840,
+ "byteOffset": 13527040
+ },
+ {
+ "name": "model.layers.9.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 40,
+ 55296
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 15738880
+ },
+ {
+ "name": "model.layers.9.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 20162560
+ },
+ {
+ "name": "model.layers.9.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 20172800
+ },
+ {
+ "name": "model.layers.9.self_attn.c_attn.q_scale",
+ "shape": [
+ 40,
+ 7168
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 573440,
+ "byteOffset": 20187136
+ }
+ ],
+ "md5sum": "5a623715713a91e8d78e482cc1dc1fb4"
+ },
+ {
+ "dataPath": "params_shard_258.bin",
+ "format": "raw-shard",
+ "nbytes": 13527040,
+ "records": [
+ {
+ "name": "model.layers.9.self_attn.o_proj.q_weight",
+ "shape": [
+ 640,
+ 5120
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.9.self_attn.o_proj.q_scale",
+ "shape": [
+ 40,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.norm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 13516800
+ }
+ ],
+ "md5sum": "afa707485eecce27b71c4baba9711db8"
+ }
+ ]
+}
\ No newline at end of file
diff --git a/params_shard_0.bin b/params_shard_0.bin
new file mode 100644
index 0000000000000000000000000000000000000000..70bd8383e37bd063ba0fa32234fb933da098c34e
--- /dev/null
+++ b/params_shard_0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:39e743f5dcfe2da60f2a4b486c3da35c721d061d0ed7823b9b938123e7d7eee4
+size 389283840
diff --git a/params_shard_1.bin b/params_shard_1.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a91cdbaae4403ffb9ff4fe03b9b3ca6387bd25f9
--- /dev/null
+++ b/params_shard_1.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:658fef5580dfd37f147b369b4d83369c103d4eadfde04bb7aaa80b8fec38da8a
+size 389283840
diff --git a/params_shard_10.bin b/params_shard_10.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9e2544a68f010f7f3eebb146db68d4848443d272
--- /dev/null
+++ b/params_shard_10.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b31d5f4118fb11e4fb9a33bb55155f0ada2424d79a2fc9833285a23c39b4f652
+size 70778880
diff --git a/params_shard_100.bin b/params_shard_100.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7266b156041a2eb97877d129885846c0f9950d7e
--- /dev/null
+++ b/params_shard_100.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2c633ff71e46ffc0d0cde1cf4dbf01b4250553ab10bebf0ec01a4e77de18ad26
+size 18350080
diff --git a/params_shard_101.bin b/params_shard_101.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a5b91d5f16be499c4b5c5acd3ba62e7bfa9bf99c
--- /dev/null
+++ b/params_shard_101.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c96b1165bcf5a1dd4caa9e63ef3a825be72542782cf4b12c6d71a2b96557a985
+size 20760576
diff --git a/params_shard_102.bin b/params_shard_102.bin
new file mode 100644
index 0000000000000000000000000000000000000000..46273db8a7d7fa80c4191140cafc66492e935602
--- /dev/null
+++ b/params_shard_102.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b727fef73d783ae2a5e49b3dbde0041e4f2ecc6e954a459b25a74ee2ad7465ca
+size 70778880
diff --git a/params_shard_103.bin b/params_shard_103.bin
new file mode 100644
index 0000000000000000000000000000000000000000..514fd47def59c8c8b5259222619aef2fe2007450
--- /dev/null
+++ b/params_shard_103.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f6427e51e9bf61472e730978c27ca8c917d1241ba8a4d4d1936ad8aa4a00f3cc
+size 141557760
diff --git a/params_shard_104.bin b/params_shard_104.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dfdf20bc2e1f66e1105c4eaa0891c2cac2717552
--- /dev/null
+++ b/params_shard_104.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:019bbce717c3ea4d965be316e0c35d55af1ed2c222c0035d930bc8ddac73a456
+size 18350080
diff --git a/params_shard_105.bin b/params_shard_105.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e5863cc9ff195db0822c4f5306bb0b1a34651f84
--- /dev/null
+++ b/params_shard_105.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:01a8a9d06533a6fb059c14fe426684a64e94879e4050e02af02d9262696da3b8
+size 20760576
diff --git a/params_shard_106.bin b/params_shard_106.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f4581d21ea1c2adf4a9bb3db109751cd510d92b1
--- /dev/null
+++ b/params_shard_106.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1f635544d7961522cad188b0e9f67fe03068008ba1121eaddfa33583e8a3fd8a
+size 70778880
diff --git a/params_shard_107.bin b/params_shard_107.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e7395907cdf99d36110b79e555fdc40fe83459c2
--- /dev/null
+++ b/params_shard_107.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fef49a94940086b14bef0be6f767ba95808aebfec1355acde7d1b2434d88a341
+size 141557760
diff --git a/params_shard_108.bin b/params_shard_108.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cad2299f65aea9024bacc322aea44a75ee328b7e
--- /dev/null
+++ b/params_shard_108.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e311d90ef4bcbfbdb14ab2123644c5fba3c3090cec61c638866412a59d55f747
+size 18350080
diff --git a/params_shard_109.bin b/params_shard_109.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7aa5d6fcfa24974a9846c0b117c2a0639b6e2992
--- /dev/null
+++ b/params_shard_109.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:974cc922a6d37c974d12ae09f40fbe5d0eef19f1bf227bc3a7e7722d28cec03a
+size 20760576
diff --git a/params_shard_11.bin b/params_shard_11.bin
new file mode 100644
index 0000000000000000000000000000000000000000..71db948cde0b2593a7dbe3593af2c3bb54c11b72
--- /dev/null
+++ b/params_shard_11.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ea7afc991cae91f377d2a6cf1434bc656814df1c8e9364ac947b4c0fe346208f
+size 141557760
diff --git a/params_shard_110.bin b/params_shard_110.bin
new file mode 100644
index 0000000000000000000000000000000000000000..10ede37deec9e26abfa5ad56c7d735556f22fa9c
--- /dev/null
+++ b/params_shard_110.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2b1425c0f50bc4aa8cbaaf952cf38834ad21aa59598fb3f3c8f7a45882f76485
+size 70778880
diff --git a/params_shard_111.bin b/params_shard_111.bin
new file mode 100644
index 0000000000000000000000000000000000000000..34def1841f5bd532c146ff41fa8d78218e61ffbb
--- /dev/null
+++ b/params_shard_111.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2116c1d730bd59fae407b52462ad22d8374a45a5383953a29d847fa82f736a6c
+size 141557760
diff --git a/params_shard_112.bin b/params_shard_112.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a44b261f48af27bc8b008ee7981e3205dc8ada71
--- /dev/null
+++ b/params_shard_112.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b9c5261be009c358d8c3fc1cef5e5533bcdf9e4d1c67846bfbe86fc2b57892fa
+size 18350080
diff --git a/params_shard_113.bin b/params_shard_113.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1970ba8198038f2051b93ac5b764c477f3f63248
--- /dev/null
+++ b/params_shard_113.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0ade505688c931fb4acae2b7744f9487466f36e0ae70232cc3c852bddfec57f7
+size 20760576
diff --git a/params_shard_114.bin b/params_shard_114.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0c23a1d496418c59eb3402d255a55663795d2782
--- /dev/null
+++ b/params_shard_114.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5dfd53d3b1150c633d45fcdab8235e4e2f89afc13bc01345e249d8d37ecc99a0
+size 70778880
diff --git a/params_shard_115.bin b/params_shard_115.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f832ef05afe159044d7acd5d1c4ea88a8b5090c8
--- /dev/null
+++ b/params_shard_115.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3743a961f3543e3f971c734ede9253aaebd99d46973c3507419a25fcef4dd7d0
+size 141557760
diff --git a/params_shard_116.bin b/params_shard_116.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2ff75707f96087d6dd2fb88e4446e4f94d2fcf33
--- /dev/null
+++ b/params_shard_116.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:420c659e124b6086f16f95e67944499b472609999dcb2d7202b34fe8ed1f2639
+size 18350080
diff --git a/params_shard_117.bin b/params_shard_117.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8fa79d9be0938a450ca9c5e313d3da76ca13bee5
--- /dev/null
+++ b/params_shard_117.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:74dbcab0a6c82eb85541895abacffc70e9a7dc2051096eb014141db791282392
+size 20760576
diff --git a/params_shard_118.bin b/params_shard_118.bin
new file mode 100644
index 0000000000000000000000000000000000000000..016d329e4a87d50617ee0e10299cd08a8ae3343b
--- /dev/null
+++ b/params_shard_118.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:37a8958a80d596017c95678b05ca1df43bdcb8a73ab321e7192093497d0ba4b0
+size 70778880
diff --git a/params_shard_119.bin b/params_shard_119.bin
new file mode 100644
index 0000000000000000000000000000000000000000..03a3e8f0836ddb95e9d855f028554683a11a2795
--- /dev/null
+++ b/params_shard_119.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e5795c8f0c3af7824573f5d4a3ce1d244fb4f3739bf67f7bd2eaf2f18655f85a
+size 141557760
diff --git a/params_shard_12.bin b/params_shard_12.bin
new file mode 100644
index 0000000000000000000000000000000000000000..364ff86c0d4ea1872778e81e302e4911c25a1827
--- /dev/null
+++ b/params_shard_12.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:afba589beb2cea6ab7557b292cf0240f7402ab83b3185dbc9e0dac53be23c219
+size 18350080
diff --git a/params_shard_120.bin b/params_shard_120.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0f54a30ab9c878b0f748e60d51aef7456cc3912e
--- /dev/null
+++ b/params_shard_120.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:adc2b7253a32e7cfa65d2df57088f2492c30228d3b66a228c448ff9176547d61
+size 18350080
diff --git a/params_shard_121.bin b/params_shard_121.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f0cda91672c6fab278407b94db888fa0d055fb0a
--- /dev/null
+++ b/params_shard_121.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f6083bd16b78466a510d87dc2aa3816b5707f5d68d9d1d71047f8c0aea52b17d
+size 20760576
diff --git a/params_shard_122.bin b/params_shard_122.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2baa06265fab413600462c6ce0f945dd3978f269
--- /dev/null
+++ b/params_shard_122.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ab5184eae1e5e1442c0351059df68a4f9b97763f400807765d685bfbd1183729
+size 70778880
diff --git a/params_shard_123.bin b/params_shard_123.bin
new file mode 100644
index 0000000000000000000000000000000000000000..618a870dfca6e4645ef7ffb6debd5272c18b3367
--- /dev/null
+++ b/params_shard_123.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:74783eda47e6fd357676acec0c42e3ac045ed41570881cfe21fd7eca41a035b2
+size 141557760
diff --git a/params_shard_124.bin b/params_shard_124.bin
new file mode 100644
index 0000000000000000000000000000000000000000..21400314272fd2eab07387c6122e43d6a751e62a
--- /dev/null
+++ b/params_shard_124.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fe2c6f89173bf2c4e3145f818f60b87acc9661aa5231c188a770205b9583c7cc
+size 18350080
diff --git a/params_shard_125.bin b/params_shard_125.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9b58bdcdd5741045a846a7548452e7362c07c254
--- /dev/null
+++ b/params_shard_125.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8dbb9c28ad67cbbefd5726de662ae7998e8589ed456fff19d7842922cd5544e7
+size 20760576
diff --git a/params_shard_126.bin b/params_shard_126.bin
new file mode 100644
index 0000000000000000000000000000000000000000..31c63d8b3bde7aa5ae6f9698cd9a52bb25613642
--- /dev/null
+++ b/params_shard_126.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:acf8028744a64b0e2f9e1497eb1e102957c8584db9c77a811933727e717c6cb9
+size 70778880
diff --git a/params_shard_127.bin b/params_shard_127.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fe584f369eac663785c4a6adcd7c48321641fabb
--- /dev/null
+++ b/params_shard_127.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:582d387a5e496283183c03a7c0bfc46abf29b0ca61041e35e5f376a20c97a849
+size 141557760
diff --git a/params_shard_128.bin b/params_shard_128.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7d7b9faca3e213edc9a77610c2e540e479cbdbc5
--- /dev/null
+++ b/params_shard_128.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3a48d186b57502ca8895cbd65d562ebad2db2d013fc5a24e0c846cb29e1a2420
+size 18350080
diff --git a/params_shard_129.bin b/params_shard_129.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bad158f6ff809d387531c2eb30fb0556cb00d56b
--- /dev/null
+++ b/params_shard_129.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:574e0798e980a08beabbe5070f5d33460331d0cf513f94480309bb159ed80659
+size 20760576
diff --git a/params_shard_13.bin b/params_shard_13.bin
new file mode 100644
index 0000000000000000000000000000000000000000..642a5aa466d3feddb409922196610250b10b9fa3
--- /dev/null
+++ b/params_shard_13.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:78d09d4727f338f9f42a6711cefcd5890ac1e5d50916d88927b5d5cb273bb217
+size 20760576
diff --git a/params_shard_130.bin b/params_shard_130.bin
new file mode 100644
index 0000000000000000000000000000000000000000..30c40584814009d1076d43842dfac48f74be67ec
--- /dev/null
+++ b/params_shard_130.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6da33a575a06f32fb9f7351353c7d1ce18756b51d2f6b5c91727abb40ef1d233
+size 70778880
diff --git a/params_shard_131.bin b/params_shard_131.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e2714d1735b28eacffc77828bb1cb77f17d4370b
--- /dev/null
+++ b/params_shard_131.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:970dd008b2d9e8e37a8a4f45d4d783911f781d03d74cd9826bffe286ff956235
+size 141557760
diff --git a/params_shard_132.bin b/params_shard_132.bin
new file mode 100644
index 0000000000000000000000000000000000000000..757b1a0d094d34c0a5c5eb9602e9dd2398596b29
--- /dev/null
+++ b/params_shard_132.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9f01950f0374165d03c5b6e0cc26914fe4ec2b47ad1ef1b73848113994d73c56
+size 18350080
diff --git a/params_shard_133.bin b/params_shard_133.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4e222a59bfdfad16611bc178f3ebbafed208bb6e
--- /dev/null
+++ b/params_shard_133.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:453a88a1fb5708dcc701491fe62df4e8289ae44d63003b261b82b50b5b3b3497
+size 20760576
diff --git a/params_shard_134.bin b/params_shard_134.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ca020a18ad6a349ed31e7121fc0f300bb98b1591
--- /dev/null
+++ b/params_shard_134.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:982177897c5e1fb500eaed0b3e88c11bc3bf7ac3ce05b2c5fe2dd9712daeb3bb
+size 70778880
diff --git a/params_shard_135.bin b/params_shard_135.bin
new file mode 100644
index 0000000000000000000000000000000000000000..58635675110acda45eb1d9fc792a22ee8a4e9979
--- /dev/null
+++ b/params_shard_135.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7bab6532f1f272b2072a61c1b80920b48a49d4479c247ec50f55e9183dcb6bd9
+size 141557760
diff --git a/params_shard_136.bin b/params_shard_136.bin
new file mode 100644
index 0000000000000000000000000000000000000000..92605756ff9d1399cdf760bee253b2b2c47b5eff
--- /dev/null
+++ b/params_shard_136.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:95bdb44864aa3dde8c62a51257fd4b5e6599e7c2beaae48e0efa61a9969c1f3b
+size 18350080
diff --git a/params_shard_137.bin b/params_shard_137.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e6df40a1b5905e32311f8346c23069a40d65c97b
--- /dev/null
+++ b/params_shard_137.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fee64b3f0f6727a8c891a169f78407789823d3e7cf84bad2dfa9bc038bc91224
+size 20760576
diff --git a/params_shard_138.bin b/params_shard_138.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9800dc57848df2540196d0424b0413a7fa937253
--- /dev/null
+++ b/params_shard_138.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b5e74667a5dc8e600c18c4b11fd795fef9f07006324befd14eb8f94a69fbd32a
+size 70778880
diff --git a/params_shard_139.bin b/params_shard_139.bin
new file mode 100644
index 0000000000000000000000000000000000000000..62fe2e8308964b36644e8a0681fcf7f29ab2ef90
--- /dev/null
+++ b/params_shard_139.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8fbce1ffddcec85f47d19bd78353a035610f0570956d57828bf9cbe82e5e43da
+size 141557760
diff --git a/params_shard_14.bin b/params_shard_14.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4862f6c5bdb310637ec337ce5e9701f484ef3ce0
--- /dev/null
+++ b/params_shard_14.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a7961b0c594503692b59421ba51ad5acebf50d54b4c5e5c9ee4771618692cc1d
+size 70778880
diff --git a/params_shard_140.bin b/params_shard_140.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4d50d30f070d3f2cdf1749024b768877799d77ce
--- /dev/null
+++ b/params_shard_140.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4aca500d93bcd1c2feedc63ae48ec90dd12eba26c2db2c12bb710b55d6914ed6
+size 18350080
diff --git a/params_shard_141.bin b/params_shard_141.bin
new file mode 100644
index 0000000000000000000000000000000000000000..eb36025c5367b121740298e5b52c93228556f758
--- /dev/null
+++ b/params_shard_141.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ae3e8873d13c1659a87c772e8ce6892beabd887ad84de4557d63e03c7f552ad8
+size 20760576
diff --git a/params_shard_142.bin b/params_shard_142.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0b303bd33e06d6a50b5b9a1a25fe213bb9ad0230
--- /dev/null
+++ b/params_shard_142.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2db529f1073bfda76aa3ee8f0b2e6d873bbb4d7989250cc7124bdd7d45471484
+size 70778880
diff --git a/params_shard_143.bin b/params_shard_143.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3bec86bb56e028d029358e87c2528abe1863af71
--- /dev/null
+++ b/params_shard_143.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f9be767ef31503698ff138d14e6b9cd31b2d835a48bd2cae9196d188c5cfd7dd
+size 141557760
diff --git a/params_shard_144.bin b/params_shard_144.bin
new file mode 100644
index 0000000000000000000000000000000000000000..96234cb354cbeccb56eb6fa13cdefd3819d08b7c
--- /dev/null
+++ b/params_shard_144.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:040dc5957ff1d5569c1d4c28b85fab149a21cdab93e61a78316d862e289925b5
+size 18350080
diff --git a/params_shard_145.bin b/params_shard_145.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7d677b9eac019a8f83c9b836a098e50bc7ea35a3
--- /dev/null
+++ b/params_shard_145.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c2d09d9f223b024bd7bb6f873f890a13b79b19617312dd0dc298b171de59da6f
+size 20760576
diff --git a/params_shard_146.bin b/params_shard_146.bin
new file mode 100644
index 0000000000000000000000000000000000000000..671f8c1b54466862283f53429a9c3aafaa1f44cf
--- /dev/null
+++ b/params_shard_146.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d05155b18e9a4deb2190284aac7b96a72c73e219cf132f81fe370c58fc734fcc
+size 70778880
diff --git a/params_shard_147.bin b/params_shard_147.bin
new file mode 100644
index 0000000000000000000000000000000000000000..021c0789644e85a9469fba4ec575aadc31f3c831
--- /dev/null
+++ b/params_shard_147.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ca3a231fd5f450646186bf97d3958359889f30a169de1d004f52ce5188b6c6b0
+size 141557760
diff --git a/params_shard_148.bin b/params_shard_148.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6acd53396f272a0f1142adfb7cda4f79c5d73205
--- /dev/null
+++ b/params_shard_148.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cb8a9b58113588515aa760b8fe322eb7153563015330a4c6a95bd6115e6ba2c1
+size 18350080
diff --git a/params_shard_149.bin b/params_shard_149.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2cd00a22d42e748377e89ff71a5efe57c7840df9
--- /dev/null
+++ b/params_shard_149.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c797ec47f5c8d8b003511e3b0bd477ade8de6f92f04283f06c49622057f49fc8
+size 20760576
diff --git a/params_shard_15.bin b/params_shard_15.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0df65864f56625b61dc5f9c9519222556dd39c0f
--- /dev/null
+++ b/params_shard_15.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1bfd7ae61292f3bb60286cb0c53465db2ae0184e9ecf22de150361d3f810dc8d
+size 141557760
diff --git a/params_shard_150.bin b/params_shard_150.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d78caeca63ec55974ae4ac5a41fc11eb8de885e8
--- /dev/null
+++ b/params_shard_150.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:47033b654e63de325be133ec6eec5379378bc1ac638ceaa633928d3ab7237a23
+size 70778880
diff --git a/params_shard_151.bin b/params_shard_151.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2614a12f6a91b4a84f37cca3c0c340ab66e20d3e
--- /dev/null
+++ b/params_shard_151.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5431f8536f518fd17db670e6ce6f8ff118a50601653a925c58455811c0886a76
+size 141557760
diff --git a/params_shard_152.bin b/params_shard_152.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cc91570c023994d206b4dd0db8d89dccf82d1423
--- /dev/null
+++ b/params_shard_152.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:63efea61dd03e07519ce5463a50c1f7890bb5eaf82e1e26d7560e9e11ac6e1dc
+size 18350080
diff --git a/params_shard_153.bin b/params_shard_153.bin
new file mode 100644
index 0000000000000000000000000000000000000000..73ea81f22d66e5ec7d964fcd0c313b69d767914c
--- /dev/null
+++ b/params_shard_153.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a9fe5fb9284550e514c43c2a9a9f6bf312fb47a9bef5da7346c32ac2ec0a3ea6
+size 20760576
diff --git a/params_shard_154.bin b/params_shard_154.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d6fc7b5c9b59c5cd011e60298bb4ef0814fbff36
--- /dev/null
+++ b/params_shard_154.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ec6e469eb92fd723803d0f537ac2323ca34b6a1be2b6b565318cb09b417e1ef1
+size 70778880
diff --git a/params_shard_155.bin b/params_shard_155.bin
new file mode 100644
index 0000000000000000000000000000000000000000..99c5381f3225bc71291d5e2280fbeb511597fbfb
--- /dev/null
+++ b/params_shard_155.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:05f28e6b2def8d7e1a5726faa1d28ed6648b26a1da83b2f2f5c2637f2df06ad5
+size 141557760
diff --git a/params_shard_156.bin b/params_shard_156.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5aae8ed227a94f436c880cbb5d248a9dcfde45f5
--- /dev/null
+++ b/params_shard_156.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3cee910988fa2e300d1228812cf883d4de41a5c3c275a638014b426f558fcf95
+size 18350080
diff --git a/params_shard_157.bin b/params_shard_157.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cb0ea753788722f2044c7f8d8892c5e78958dc1a
--- /dev/null
+++ b/params_shard_157.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:aa2afc6d697769c5f6898d97b6ec9153b9a173316ccd3b83e43bc569cf89a3f5
+size 20760576
diff --git a/params_shard_158.bin b/params_shard_158.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6bffeefb92302f313d62111d8d57930cda3b0bd5
--- /dev/null
+++ b/params_shard_158.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3c6525c8183323324ed98899fed8a47d6c575b8df92b5c1ffee4ec498d3913cc
+size 70778880
diff --git a/params_shard_159.bin b/params_shard_159.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e99c3f522a284fd2a59999fc74a2f4ff2c0c577b
--- /dev/null
+++ b/params_shard_159.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ae90bb647dfcff82cdcf67fb78caf0ee66732c39287ff6ae3ec42bebff78d783
+size 141557760
diff --git a/params_shard_16.bin b/params_shard_16.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9109310b8070701027c6bf4f2ca2802271342a0c
--- /dev/null
+++ b/params_shard_16.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:75751c81c4d3c94285cbac439103db099dc6fad04e45fc2b10a32990ee699177
+size 18350080
diff --git a/params_shard_160.bin b/params_shard_160.bin
new file mode 100644
index 0000000000000000000000000000000000000000..608140817919a7c3e2981d369f1845a2c4a93383
--- /dev/null
+++ b/params_shard_160.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6d3ee0c3f68b232048f69bbecce2f9a3a75b31c038b6c8fa59e6754ee74a21f6
+size 18350080
diff --git a/params_shard_161.bin b/params_shard_161.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d58b02c34ff02137b0c98ce55cd183b6879cc24f
--- /dev/null
+++ b/params_shard_161.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:365e7dfe0e04c7e83ebe90652b87b560d62a6e583ec5f513a701f92d853b7c18
+size 20760576
diff --git a/params_shard_162.bin b/params_shard_162.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9bca89ac1cb49b0e17077cce78890d3d063b22ed
--- /dev/null
+++ b/params_shard_162.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:40c295707da8ce2aba4e5aa765fa3c4f819d542db84e75a81b8020c5eb1aa6ca
+size 70778880
diff --git a/params_shard_163.bin b/params_shard_163.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2e641c4064f7ca0925f28be5d518eed532572e1d
--- /dev/null
+++ b/params_shard_163.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f8af4488f9fd648221e9a75c61520b9c5fedb7bb78f19b11494c3953668158ce
+size 141557760
diff --git a/params_shard_164.bin b/params_shard_164.bin
new file mode 100644
index 0000000000000000000000000000000000000000..aa718a815d7f2cd4d1d609ebcd0685ff465b68f4
--- /dev/null
+++ b/params_shard_164.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5fb562c0ad5916cb50309868f6b8f3f0f35dc3fdc20c52df93f4ddb40fa53d8d
+size 18350080
diff --git a/params_shard_165.bin b/params_shard_165.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b9092a9d786b0658c110b52cddb98ef2ae124b73
--- /dev/null
+++ b/params_shard_165.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1420cd3939d4260d97d53c2479f3dea3bdc8dc86a1605ff77e09bf8cecaa3126
+size 20760576
diff --git a/params_shard_166.bin b/params_shard_166.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c657e2baabc14c99b749584d84bc0d756b0068d6
--- /dev/null
+++ b/params_shard_166.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d1c5543e220fc2af3c3b73cd030e5f3077b770eec8b68857e5bd5497c87ac0fb
+size 70778880
diff --git a/params_shard_167.bin b/params_shard_167.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d4aa0691f31d93a2ba052db129da1b8c93832818
--- /dev/null
+++ b/params_shard_167.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3a8cdfb215a41e20ac0be13763570fce4d82e36f2772597e586e1bc73df99dbc
+size 141557760
diff --git a/params_shard_168.bin b/params_shard_168.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2ff119d1e6de5a5449c94b701f34b636d81ad26b
--- /dev/null
+++ b/params_shard_168.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:90d9626bacf8e33f3a4bf87ed44175c6a83f05dfb067086d7e5513e93ac10ffb
+size 18350080
diff --git a/params_shard_169.bin b/params_shard_169.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e95fa64c1d20ad1fcf8c62fa795736772e4fb287
--- /dev/null
+++ b/params_shard_169.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:92f041cc8edf4a2cf96e3b7807482c0c37ed29262a6332bf8ce40951650efe14
+size 20760576
diff --git a/params_shard_17.bin b/params_shard_17.bin
new file mode 100644
index 0000000000000000000000000000000000000000..624d703f98f07de4791275d69f0f8513ac920b05
--- /dev/null
+++ b/params_shard_17.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a87ac6a1608a834eccdb7101b7da5f0d7e4279116fba6d06d6028adc939e8ce8
+size 20760576
diff --git a/params_shard_170.bin b/params_shard_170.bin
new file mode 100644
index 0000000000000000000000000000000000000000..49875d5a3779d035ebb8e0ec6b6359e5db5f78dd
--- /dev/null
+++ b/params_shard_170.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f995a9b34c775dba95c3c0805a5ae58f1dfdf0a40c8423fc1c0cfa83e172c278
+size 70778880
diff --git a/params_shard_171.bin b/params_shard_171.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4b8c44962abf9d4c322e37c7dd2ab9b4d03406f3
--- /dev/null
+++ b/params_shard_171.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ae38b21a1bc1d70a326307040a4cc4a216559f9af99138f7cde94721487049f5
+size 141557760
diff --git a/params_shard_172.bin b/params_shard_172.bin
new file mode 100644
index 0000000000000000000000000000000000000000..81c1eb2dcbd6ab8bc3c31aeaa98f36478a84742d
--- /dev/null
+++ b/params_shard_172.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ea00357f2126eac825c7f495757d875e47925379b5dce32dbe1e13abc7d9cbed
+size 18350080
diff --git a/params_shard_173.bin b/params_shard_173.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c159f95ed929f88429404e270aa38762c64c5fa1
--- /dev/null
+++ b/params_shard_173.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9a8540bc86dab897ce909ada436fb656ff291ed31c1f498afe21fa92be009c3e
+size 20760576
diff --git a/params_shard_174.bin b/params_shard_174.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ceec81125ccc68ae1255deba82a80cb57eb349e2
--- /dev/null
+++ b/params_shard_174.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:221df73ea1be3bf4292b2fd505fac1af6eb0e3383a531059a915439458adce02
+size 70778880
diff --git a/params_shard_175.bin b/params_shard_175.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6bd3cf3c47d45a41d92ffb76d0f79658915fcc73
--- /dev/null
+++ b/params_shard_175.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c66cfc706cd482ec95aafb6e59fc7821735c0d248f53792a4fd645c7f69b1205
+size 141557760
diff --git a/params_shard_176.bin b/params_shard_176.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1e1cadd9a219b079c5179ffb628331583527a046
--- /dev/null
+++ b/params_shard_176.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b7316a69bc2ec04d245584242a986a251f5bdd8f96ec4378e049ad91f227dd4b
+size 18350080
diff --git a/params_shard_177.bin b/params_shard_177.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4a297d49ef5dc7d77a9c3f14b9f00c9cbfc7e54b
--- /dev/null
+++ b/params_shard_177.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5a8e6a74b79bf0dcad8fa342da999d96239f0d9a7a7240f626e7bb746354c493
+size 20760576
diff --git a/params_shard_178.bin b/params_shard_178.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b88174278fec8ea324cc8beb95b3cacd09868be9
--- /dev/null
+++ b/params_shard_178.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:930994f69befa700cd26a3762325abd8372e960f0ad7b0c0d8830a8559bece62
+size 70778880
diff --git a/params_shard_179.bin b/params_shard_179.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2c03904584014fc4be52f13fd361aa56c41f416b
--- /dev/null
+++ b/params_shard_179.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:be019c1f9c9b1b73f3cb511c7bc58dc9d5e09985b2dee79cb00cf820af3a42bd
+size 141557760
diff --git a/params_shard_18.bin b/params_shard_18.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9298105f5f5818d892e1dc0c73a83dabfe9ddb8a
--- /dev/null
+++ b/params_shard_18.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0088891c621bf8529fe30f6ce7a648be0f537c8c2bb459b5b298827c952b98fa
+size 70778880
diff --git a/params_shard_180.bin b/params_shard_180.bin
new file mode 100644
index 0000000000000000000000000000000000000000..151cf38c21924143669d494314849557758245a7
--- /dev/null
+++ b/params_shard_180.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4e74b2f4e5f3f9ba34ac900072a0cf001f5799e5188a96b91c17aa1ecf090cd2
+size 18350080
diff --git a/params_shard_181.bin b/params_shard_181.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9eabda6e38276f5a70c679c6738885e80e3895b9
--- /dev/null
+++ b/params_shard_181.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6b6d020af63074d36162d6ee52aa94481be429ed5d0399bc4e95b6f7649b8760
+size 20760576
diff --git a/params_shard_182.bin b/params_shard_182.bin
new file mode 100644
index 0000000000000000000000000000000000000000..816ebe276193177a7d6c81886b52bdf43ae7ebb1
--- /dev/null
+++ b/params_shard_182.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7d1bf4bf88cc8df79c44e8988ff7c5546ceb3477b0575ca8d5d87f51bc933fe3
+size 70778880
diff --git a/params_shard_183.bin b/params_shard_183.bin
new file mode 100644
index 0000000000000000000000000000000000000000..71415f14d20e380dff94509a75456d85b0673039
--- /dev/null
+++ b/params_shard_183.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fd3137adc77f5d5cfbd9f2ac886e61b60f62a013570bd168396689c20e26518d
+size 141557760
diff --git a/params_shard_184.bin b/params_shard_184.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1c9f757a2f8420ec532535faa6727ae5ff6f05d9
--- /dev/null
+++ b/params_shard_184.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a58b379f4a56dd027c9e557673e8174f29773d793598718f4034a5ff71a74116
+size 18350080
diff --git a/params_shard_185.bin b/params_shard_185.bin
new file mode 100644
index 0000000000000000000000000000000000000000..790c5cabc203b4ded4f247dd0b3a7a5efb730301
--- /dev/null
+++ b/params_shard_185.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5f94caa5e73873c0f0b6be2d247d41bad28aa4d4955f03bd2addbc7f674e40d6
+size 20760576
diff --git a/params_shard_186.bin b/params_shard_186.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9ac6125122f709e3141cf4864a8ced6e8f4af395
--- /dev/null
+++ b/params_shard_186.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5e35b6dbad9f029065976358f41bfedad4a623d653ba9911901c55fb3f3f6b42
+size 70778880
diff --git a/params_shard_187.bin b/params_shard_187.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f9884e6922b133a09ebf4d6bd6a05bddeea81eeb
--- /dev/null
+++ b/params_shard_187.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:802f443afc5e56275674e0bf4c21b6ad9870bb7e32ffa85ed564a0a8f36d9175
+size 141557760
diff --git a/params_shard_188.bin b/params_shard_188.bin
new file mode 100644
index 0000000000000000000000000000000000000000..54c3e7f4a50f3e888f03d4e6ada04f0dd8f1a460
--- /dev/null
+++ b/params_shard_188.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4123f666916bccb7c3868a2265898412a0c0cb720779d7804d2d236ac66537ab
+size 18350080
diff --git a/params_shard_189.bin b/params_shard_189.bin
new file mode 100644
index 0000000000000000000000000000000000000000..216d4482e3d5c7a9bb4f449aad1662aaabf042a4
--- /dev/null
+++ b/params_shard_189.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ae2c2e81e1fd57683972d5c0921e2855dca54131e7ead1903dfffcb2d0511cc2
+size 20760576
diff --git a/params_shard_19.bin b/params_shard_19.bin
new file mode 100644
index 0000000000000000000000000000000000000000..838f203aefecbd8f98764198799fbee9972c3448
--- /dev/null
+++ b/params_shard_19.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c6f294ad733cc83dc0aa34490d4ac7412bd2d0a99c2fea3fa620879f46779461
+size 141557760
diff --git a/params_shard_190.bin b/params_shard_190.bin
new file mode 100644
index 0000000000000000000000000000000000000000..901f5a671303df26ee5c101c3f7bea7200fb3886
--- /dev/null
+++ b/params_shard_190.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:23c71c0b546cce480762185958a4e1af407584111211d50830ce730a6f9ffc68
+size 70778880
diff --git a/params_shard_191.bin b/params_shard_191.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a78ba2884ab6e34d716b522100cb670923a4d5b9
--- /dev/null
+++ b/params_shard_191.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:13d547fac3ede3e66c127c26a74db7b81f922e04ae91eadcc32ae23fd1e01585
+size 141557760
diff --git a/params_shard_192.bin b/params_shard_192.bin
new file mode 100644
index 0000000000000000000000000000000000000000..55ada7a13b02daedd7ba5a9e1b69afb832cdd267
--- /dev/null
+++ b/params_shard_192.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:14c566ee26997fcd8950ba21b9bcf11f6007094f21c7310b2c63f543e17fc9c0
+size 18350080
diff --git a/params_shard_193.bin b/params_shard_193.bin
new file mode 100644
index 0000000000000000000000000000000000000000..776e089aa2d6f7a793e1d69bed1055abbc56ea9b
--- /dev/null
+++ b/params_shard_193.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:abdd0fea3d14e71de5e898cec36605cdae5c4da0e84493cb5050ee4325d5b4f5
+size 20760576
diff --git a/params_shard_194.bin b/params_shard_194.bin
new file mode 100644
index 0000000000000000000000000000000000000000..453ccb2e25737d78f4950a42445ebc0b54c80abc
--- /dev/null
+++ b/params_shard_194.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d3de0f2efdc257e19acedb2e508931565a984d3cc52197f0f83b4fd395019be2
+size 70778880
diff --git a/params_shard_195.bin b/params_shard_195.bin
new file mode 100644
index 0000000000000000000000000000000000000000..adcdcd3eae04db9bcf5cb6ae577d010c3b5463b6
--- /dev/null
+++ b/params_shard_195.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:320176c51f6af9093a3d73aa3d38b40e707fd1b2eda371669d27448598980867
+size 141557760
diff --git a/params_shard_196.bin b/params_shard_196.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ce10f313f986b764d16736c2386adf890b2e2481
--- /dev/null
+++ b/params_shard_196.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cc9210222c12e8fe517ed2f890ba5199ef1e219b42c2384328bbf852a5a30624
+size 18350080
diff --git a/params_shard_197.bin b/params_shard_197.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e017af2dadc9a1524c997d52dd9ea3df14a24c92
--- /dev/null
+++ b/params_shard_197.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c1ce2e6ffa7237e50f83dec91cdaabfa20d4dfbd995e75cf1a0d45101456ffe4
+size 20760576
diff --git a/params_shard_198.bin b/params_shard_198.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c9b17cf6c49b26c415efb8f8fd1e2b60e420e7ab
--- /dev/null
+++ b/params_shard_198.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:da31deb937ded44384f4dc904a03753af0282bc13b238ec3c484d791debb0b0a
+size 70778880
diff --git a/params_shard_199.bin b/params_shard_199.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b655eabc581222a02caa7b77482e07fd677ed871
--- /dev/null
+++ b/params_shard_199.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:265368d36db05479c060c41e9ca3a27b1af407a221159ae6f67dde1221aef3b6
+size 141557760
diff --git a/params_shard_2.bin b/params_shard_2.bin
new file mode 100644
index 0000000000000000000000000000000000000000..20278e63ee4804516fc216f4ef2ac3f617ed5aab
--- /dev/null
+++ b/params_shard_2.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3cab0ec94b230354ce5accc91c275ea0b6f8778c731efcc06a29608d56022331
+size 70778880
diff --git a/params_shard_20.bin b/params_shard_20.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0412c4344aa6b6fe2cbac331f8525bbfda53a2e5
--- /dev/null
+++ b/params_shard_20.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ddf235ba2450f1744d2ab4056795acd0189e3143b69fa19702a0b2f2a81df432
+size 18350080
diff --git a/params_shard_200.bin b/params_shard_200.bin
new file mode 100644
index 0000000000000000000000000000000000000000..14c1382552dc9264d85f172727749ddd6fb6e998
--- /dev/null
+++ b/params_shard_200.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cfd73125d8d20331fa6fa0142f4aa8c1b39addb736b872d9b471e98a991e70fc
+size 18350080
diff --git a/params_shard_201.bin b/params_shard_201.bin
new file mode 100644
index 0000000000000000000000000000000000000000..520782668b21d3bf37765c25af6cc69e1940533b
--- /dev/null
+++ b/params_shard_201.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3df6ca0b7d7c1bd4e7eb2796847cf60ff72a9ded1deba41e1408b56892b0360d
+size 20760576
diff --git a/params_shard_202.bin b/params_shard_202.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d07f8bbf59b3bf9885905c04cd423c662b065e8c
--- /dev/null
+++ b/params_shard_202.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9544364c0a768c5fa66ac40d235cdc4a68de1141d6a0da703a17a52b818e15f0
+size 70778880
diff --git a/params_shard_203.bin b/params_shard_203.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0759ddafa53477b981a242be8862a9b9554e0864
--- /dev/null
+++ b/params_shard_203.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f8d88d86c10d1be82e559c0dd08fae495f7ba6d04a83c77218fa2e708efa846b
+size 141557760
diff --git a/params_shard_204.bin b/params_shard_204.bin
new file mode 100644
index 0000000000000000000000000000000000000000..11c615b6626bd3f781c404ff78ddb32d2d55c99d
--- /dev/null
+++ b/params_shard_204.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bf8572e9d23bc57554c6b616457fe4562eb82327241620e85dfd6c5e5f9f32e0
+size 18350080
diff --git a/params_shard_205.bin b/params_shard_205.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5328140790ab1b2a796a52045c94cffd34bf74e9
--- /dev/null
+++ b/params_shard_205.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3a223d5a6c4a444987baeda0bba31603a20312f6e5d69315d5fb206f71a6bfeb
+size 20760576
diff --git a/params_shard_206.bin b/params_shard_206.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6bf9fed418721a7e9f94ad1561bb43ef4311d8dc
--- /dev/null
+++ b/params_shard_206.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0082a455cc2ad8a1f1c92b4c89fa818aecf53e436467daa7e5616345ea451702
+size 70778880
diff --git a/params_shard_207.bin b/params_shard_207.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fcb789755c53cfc1bc4ab1b59a770adaa0ccc199
--- /dev/null
+++ b/params_shard_207.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e9991ab7cab0af4cc7bc462e2cbf8a8a1dce3b6a09143e32182aa73feef90ea1
+size 141557760
diff --git a/params_shard_208.bin b/params_shard_208.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4f7da789a464c7f93616153b7dfb39c92d69e2e9
--- /dev/null
+++ b/params_shard_208.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6d8213b05c937488b756aeba80f2227115a5efaecac611a8d9df6e82c9b4a97c
+size 18350080
diff --git a/params_shard_209.bin b/params_shard_209.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1b1a5264eb6fee017213c1493d5f791671558365
--- /dev/null
+++ b/params_shard_209.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9931043ae3b2dfa47cbe7e825d4b90100349391ca561b033c01c7a4eb090bedc
+size 20760576
diff --git a/params_shard_21.bin b/params_shard_21.bin
new file mode 100644
index 0000000000000000000000000000000000000000..77b4e96a7c55e092e6cc798f699316c6a1caa53d
--- /dev/null
+++ b/params_shard_21.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:98595d8d1cd0715bb6244ab072bcbec03697193fcae546d134efd8252643e28d
+size 20760576
diff --git a/params_shard_210.bin b/params_shard_210.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e35b7456171a0f3c8fb3647f5f47ccbcee84153e
--- /dev/null
+++ b/params_shard_210.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:11e41a98d864a0bc7008aebf87116b031b21d08f0b3f34677f5826537b3b24ae
+size 70778880
diff --git a/params_shard_211.bin b/params_shard_211.bin
new file mode 100644
index 0000000000000000000000000000000000000000..13b3c43836c661a869321520035bbe180b4e47ac
--- /dev/null
+++ b/params_shard_211.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:41b55371ce208a55a7f0fe0902e46e9fd10c95d47b956b13c8bb1f9d54981526
+size 141557760
diff --git a/params_shard_212.bin b/params_shard_212.bin
new file mode 100644
index 0000000000000000000000000000000000000000..00ccc0a97f858ee7981a6653201a8e55018eb710
--- /dev/null
+++ b/params_shard_212.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:93867d0614401089d74129881ec3f620912f2586487d1442556fb495fdb33ae8
+size 18350080
diff --git a/params_shard_213.bin b/params_shard_213.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0c20579c356c8a55c9653fa4297d4390d187c5a0
--- /dev/null
+++ b/params_shard_213.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5321b8987f9cc40d9041e1685746dd247efe1a5f4ed86bbf4cd872f09307d550
+size 20760576
diff --git a/params_shard_214.bin b/params_shard_214.bin
new file mode 100644
index 0000000000000000000000000000000000000000..199112b8864a1a9809bd1349d0f3056d97510dcb
--- /dev/null
+++ b/params_shard_214.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:49c93fe009071ae00d979daebcd3f8b2208b52acfcbc4816b5225deaef810c4d
+size 70778880
diff --git a/params_shard_215.bin b/params_shard_215.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ef8e7a2126e6f7c85e56bed4290a35ac21f2c743
--- /dev/null
+++ b/params_shard_215.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c10b4afdc13ec3bf3e05c1bcd97d4f604c0a7bef4f3a29c06aba1aa4017c0deb
+size 141557760
diff --git a/params_shard_216.bin b/params_shard_216.bin
new file mode 100644
index 0000000000000000000000000000000000000000..146df2d881f3e737a421b555e2c5d33dba0e05dd
--- /dev/null
+++ b/params_shard_216.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:68e079207e0655fcd20e5da6a94fe6b96bb0118de02567e10121459e0858bf25
+size 18350080
diff --git a/params_shard_217.bin b/params_shard_217.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6e0a7edbd01b38750758cd4c1b832527d2e45ced
--- /dev/null
+++ b/params_shard_217.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fd1316264e07cd17e554eab763591ae676a57a2bf3d7fbfff0f87a9989fd0d9e
+size 20760576
diff --git a/params_shard_218.bin b/params_shard_218.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c6229fb6cc352ff83a3d53b657482552f1ce341e
--- /dev/null
+++ b/params_shard_218.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:44205b9b9879a48af932100b7eb012b8809402251d67244fe5452ae7d71e290e
+size 70778880
diff --git a/params_shard_219.bin b/params_shard_219.bin
new file mode 100644
index 0000000000000000000000000000000000000000..414af2d0377574e9285183308cb099d3f51e4682
--- /dev/null
+++ b/params_shard_219.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0d908d040949292644896dd958df2bfb3fc3da150f82029f15fcaea9a2dbb7b2
+size 141557760
diff --git a/params_shard_22.bin b/params_shard_22.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1b78d96478fca3339e30d88fef7571fa4c55de52
--- /dev/null
+++ b/params_shard_22.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:20b0aa14358169bedc6a14ea30fb1c18b509aee663f8efce6fcf233ffe80a94a
+size 70778880
diff --git a/params_shard_220.bin b/params_shard_220.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0523ef4fddb99a38f035c861980e54359f0732cd
--- /dev/null
+++ b/params_shard_220.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3a6d3561705142648da710406206b8c8b6294e41a45fb1d1a6ca4b990e82ad19
+size 18350080
diff --git a/params_shard_221.bin b/params_shard_221.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3462a18b4fb98876f770c18862f374b0d5ca0f17
--- /dev/null
+++ b/params_shard_221.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:96cb538cd1ba2df869d11891b0ecd63f68ae0a395af744dd86faaab1396ab4c9
+size 20760576
diff --git a/params_shard_222.bin b/params_shard_222.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3e311340633d85fc8b22aa612a561226afdc8fc6
--- /dev/null
+++ b/params_shard_222.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2edaa238ccb6fe3f0099cf8f3048e4b57ee9dd34b6676391418b0d734a610c51
+size 70778880
diff --git a/params_shard_223.bin b/params_shard_223.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9fa9a311df21453d7bd3b121f8ee45d5e050875c
--- /dev/null
+++ b/params_shard_223.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b7ccd993a005a68f19e1637761914744354959abbebd5f30d7ab755676fa9baf
+size 141557760
diff --git a/params_shard_224.bin b/params_shard_224.bin
new file mode 100644
index 0000000000000000000000000000000000000000..eda974327b969f81cf52739e5e8ee97b2baf2488
--- /dev/null
+++ b/params_shard_224.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c1520239e046b1bafc850da4ec752e63535ecc0eaa765faf9d9118d668d542db
+size 18350080
diff --git a/params_shard_225.bin b/params_shard_225.bin
new file mode 100644
index 0000000000000000000000000000000000000000..06bc3997cb0a7a544ca9c3e3555643cebbd8f2ff
--- /dev/null
+++ b/params_shard_225.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e4aa444bf3d4655903c4c6ed53bbab97393c777207e8bccd3cfdb918e3f3dafd
+size 20760576
diff --git a/params_shard_226.bin b/params_shard_226.bin
new file mode 100644
index 0000000000000000000000000000000000000000..397d04e4f92756b27542f1cf59a00d9b02e11d02
--- /dev/null
+++ b/params_shard_226.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:09703e8cf6974ea1245ea5ba164619cd05564cd49e34ecad686dedc61396f8c9
+size 70778880
diff --git a/params_shard_227.bin b/params_shard_227.bin
new file mode 100644
index 0000000000000000000000000000000000000000..36f114d48a38a6b4e61a49d63a93c2b756cbe89a
--- /dev/null
+++ b/params_shard_227.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e60aebb27a31bc4d574b46a0fa6d65beb43ea2a907a7aada2ee1f43308120822
+size 141557760
diff --git a/params_shard_228.bin b/params_shard_228.bin
new file mode 100644
index 0000000000000000000000000000000000000000..34fcc57e557f4fd7a08ab3c4ad170755cc4ac582
--- /dev/null
+++ b/params_shard_228.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4657bfa8e0e729699f092f7dbe5a1f54caecaec52666eea10a55a1987ad37766
+size 18350080
diff --git a/params_shard_229.bin b/params_shard_229.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5aa196b93bd985050079a1b424ce1b7f5fdf1edd
--- /dev/null
+++ b/params_shard_229.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e7a34c6da30a6c9b805b96f2548060ad8736de3068a207adb03821be45b994a0
+size 20760576
diff --git a/params_shard_23.bin b/params_shard_23.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b21131fccdbf95e5238cfbc20d3b84201d9ce63e
--- /dev/null
+++ b/params_shard_23.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:431feff9fc3096dd17103ee2d9f8da31240402520b261dadd8fd7d7357689513
+size 141557760
diff --git a/params_shard_230.bin b/params_shard_230.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2c299a08e3501aef74f3a0964c4755efc02ce957
--- /dev/null
+++ b/params_shard_230.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d5f8d93355ed8536baac9631e8a881f84b751a6524196100050451a250fc3309
+size 70778880
diff --git a/params_shard_231.bin b/params_shard_231.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3b7205bfa5abd7ec432ceb8b38ff56361e5b77a6
--- /dev/null
+++ b/params_shard_231.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bede31f53c0b8c93a8a115c4a4a18635669f0b11ddcc0049780df49e6cf5122e
+size 141557760
diff --git a/params_shard_232.bin b/params_shard_232.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f986dd8eb9ba011adf05b213b74a1a6c0e65d08c
--- /dev/null
+++ b/params_shard_232.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d6021f5a4429e988983153137d7005aaace07c4dc6b4bab96bac1326eea39978
+size 18350080
diff --git a/params_shard_233.bin b/params_shard_233.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d41954c91a872ec1e6e21710067f60a58973e76c
--- /dev/null
+++ b/params_shard_233.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1d46aba745adc66d0abaf00e0b0981641cd044e766a92753a133847b04afd547
+size 20760576
diff --git a/params_shard_234.bin b/params_shard_234.bin
new file mode 100644
index 0000000000000000000000000000000000000000..24001677bd2b329021a5ba7ef08f0d3613ceb174
--- /dev/null
+++ b/params_shard_234.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3a4d35131ab678a083dc78bb6308767108783f8c9737831f1cf81d56a966f929
+size 70778880
diff --git a/params_shard_235.bin b/params_shard_235.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2863f6c94ad7d1665391226aeae72cb650d95bdb
--- /dev/null
+++ b/params_shard_235.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d8232c19d20cb0d5772bbc0d2d2e57ef28b46fbbd84057ba8ce780c917a35724
+size 141557760
diff --git a/params_shard_236.bin b/params_shard_236.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d522f5f7fe7c6764c1fbf2af1595c41a9a818c67
--- /dev/null
+++ b/params_shard_236.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f8e63bd6c7ca6a6fdf84327bf84bfb41202a63b389ceb03516ee3ea0c13a124c
+size 18350080
diff --git a/params_shard_237.bin b/params_shard_237.bin
new file mode 100644
index 0000000000000000000000000000000000000000..74d7d6524d621bd45ea53ddecec6a0a37deffd9e
--- /dev/null
+++ b/params_shard_237.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:960039c8239042dba581367273acbdb797d7d07fee9546cc74347313e428e290
+size 20760576
diff --git a/params_shard_238.bin b/params_shard_238.bin
new file mode 100644
index 0000000000000000000000000000000000000000..90208d7730267440e93371393faf0ed2b23625d5
--- /dev/null
+++ b/params_shard_238.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a3b4b3233392efaec584f02ba6a86777d4849533f37531a234beb94b549a7459
+size 70778880
diff --git a/params_shard_239.bin b/params_shard_239.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a24488508c324970e09a0f4f9014cb26d868b2c4
--- /dev/null
+++ b/params_shard_239.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d0a961e72723cb4f2989b380f0991308b7316064d94e3dedea345ff5f72506b0
+size 141557760
diff --git a/params_shard_24.bin b/params_shard_24.bin
new file mode 100644
index 0000000000000000000000000000000000000000..08553b9863b6e27dba05ff424d6613d9a3ec1808
--- /dev/null
+++ b/params_shard_24.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ee6cb6e124835792ec1d7660fc9dae52bedb19c47a342fdd27d811bc12239c8a
+size 18350080
diff --git a/params_shard_240.bin b/params_shard_240.bin
new file mode 100644
index 0000000000000000000000000000000000000000..757c30f4dd438889cf7ea038b3409e6e6e7de7c8
--- /dev/null
+++ b/params_shard_240.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:996eb0f69b47abd940fd2a0f56983fdb66679c923193fd931e74211d1757ae19
+size 18350080
diff --git a/params_shard_241.bin b/params_shard_241.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9181fff62b2ea19f8dfd75117a09efb1d5e77007
--- /dev/null
+++ b/params_shard_241.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5d9800a39b9a124525fd572db7888ac7876d037587dc59e95287686efdc4c0f3
+size 20760576
diff --git a/params_shard_242.bin b/params_shard_242.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a3e76e961a46743a93255a320c92977e9087a352
--- /dev/null
+++ b/params_shard_242.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:755973b9ec2d010a5966b8453f398097d34859a58c92ce425251b7bc9b0b85d1
+size 70778880
diff --git a/params_shard_243.bin b/params_shard_243.bin
new file mode 100644
index 0000000000000000000000000000000000000000..618847eb0fa4bd6fcb3a193f7d100112bb476b60
--- /dev/null
+++ b/params_shard_243.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9e9f9a4be940a80e9d4f434099626179039e40f0e1ca2b8d3e61439d68515cec
+size 141557760
diff --git a/params_shard_244.bin b/params_shard_244.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0f4b6a98d3bebd2f49a205ff578c3e18fe150eff
--- /dev/null
+++ b/params_shard_244.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5c5a9abc8569f9d6c2f034f0d65af809f2e11baea7c86d66579798ef6dae45de
+size 18350080
diff --git a/params_shard_245.bin b/params_shard_245.bin
new file mode 100644
index 0000000000000000000000000000000000000000..03ed25d94ae51e6736a81d7f3f0273a3da0a208d
--- /dev/null
+++ b/params_shard_245.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:048ad358044ce5de2f39bffdfdb2087eeba454f84d137897b037fa9d7d69e4f2
+size 20760576
diff --git a/params_shard_246.bin b/params_shard_246.bin
new file mode 100644
index 0000000000000000000000000000000000000000..feb80f13786424d597fd25929c3092227d9dba7b
--- /dev/null
+++ b/params_shard_246.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3a367fe3acedc623869f2ed1c037af779c34c9b55785da8a8fcb19109504fdaf
+size 70778880
diff --git a/params_shard_247.bin b/params_shard_247.bin
new file mode 100644
index 0000000000000000000000000000000000000000..05546a9b1a0f92d227472e4451cbc6b7efeabe1f
--- /dev/null
+++ b/params_shard_247.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:58c32da04c75a34225bf462b14e0bfa7bbe01b2e25a12a9f2cbc392b9bdc95f5
+size 141557760
diff --git a/params_shard_248.bin b/params_shard_248.bin
new file mode 100644
index 0000000000000000000000000000000000000000..35772d28c3e4e18e3ac0e20b5e8da3bc5da31718
--- /dev/null
+++ b/params_shard_248.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:682f4254ce31e06a706f18b6d277107829dedb2c39a5ffc65894aecfee87fb18
+size 18350080
diff --git a/params_shard_249.bin b/params_shard_249.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a43a89e79526781dea77b6de84c8c616b348de46
--- /dev/null
+++ b/params_shard_249.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:33c3d3b0aa11e428bdbfccfd160462c3fd02dc0b4eedbb6e9653e24df1240be7
+size 20760576
diff --git a/params_shard_25.bin b/params_shard_25.bin
new file mode 100644
index 0000000000000000000000000000000000000000..487e21f5976b0459eba01bdfced1fba5d9014531
--- /dev/null
+++ b/params_shard_25.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:722559265002e87ef2b2eba43960f0c933845ab39a79c9d576898c0d9a1dbad5
+size 20760576
diff --git a/params_shard_250.bin b/params_shard_250.bin
new file mode 100644
index 0000000000000000000000000000000000000000..eadd7dbebf169cdd230ddbfe2105f955326b0c66
--- /dev/null
+++ b/params_shard_250.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0783970b8cb98ce2af51d38da3151125b9d475246298fecae631116d6ba6ee5a
+size 70778880
diff --git a/params_shard_251.bin b/params_shard_251.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f30be2daf8482b6b464c4917cc86a5fe713f7da9
--- /dev/null
+++ b/params_shard_251.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e851e1606d36c51be89b5e144f6134a8bdda5eeedae6ff40d4a9c753e7dd2b6b
+size 141557760
diff --git a/params_shard_252.bin b/params_shard_252.bin
new file mode 100644
index 0000000000000000000000000000000000000000..323dd5c57fa3e17b756bbd3ed581043bbe2e30a7
--- /dev/null
+++ b/params_shard_252.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c4b75edd81e191f9852b61a4a3e0f61a9b08764d16cada46d2bb176623b02648
+size 18350080
diff --git a/params_shard_253.bin b/params_shard_253.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9a1c98733348cc2a51311ce72987f513cfab3a7e
--- /dev/null
+++ b/params_shard_253.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:148e0ad56c61fa61ad47c212c8b40d255ed701492ccf2690c03cdcdeb6ea7f76
+size 20760576
diff --git a/params_shard_254.bin b/params_shard_254.bin
new file mode 100644
index 0000000000000000000000000000000000000000..37746417d453d375450f78900d0a1bc47368d206
--- /dev/null
+++ b/params_shard_254.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1d00f5ff8a190df705e3736c47c4c1805ea731a679bea8654bf21339c53c30d8
+size 70778880
diff --git a/params_shard_255.bin b/params_shard_255.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b10f09295984e60b036751f569c8b1df24a9da86
--- /dev/null
+++ b/params_shard_255.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2ced1b41a32ab877687c260627c5ee21ebe9a8f81bad4c6026f2d81b235983e3
+size 141557760
diff --git a/params_shard_256.bin b/params_shard_256.bin
new file mode 100644
index 0000000000000000000000000000000000000000..414939564dba291de62e05dbb3f823ea642bcfa5
--- /dev/null
+++ b/params_shard_256.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a42c845ef5daac5f2eb65d379afd543b1406173fc5cbc92bc859dc321ae0e5fe
+size 18350080
diff --git a/params_shard_257.bin b/params_shard_257.bin
new file mode 100644
index 0000000000000000000000000000000000000000..29b765e84c95a99c923d406948b8fe4565e8670a
--- /dev/null
+++ b/params_shard_257.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:71c5ed1d5530c21c9932dfa44df572d51c5c84810f0c703f5945779c7fe7d5f8
+size 20760576
diff --git a/params_shard_258.bin b/params_shard_258.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6c35505590257246fed08f1ba311b065081a499c
--- /dev/null
+++ b/params_shard_258.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:adb0a1bf4f464bbfca1a05c7511c785d3352dcd8459aa14f6262bffa1132168d
+size 13527040
diff --git a/params_shard_26.bin b/params_shard_26.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bf2254ecff847925cb5c0a9186b49e2d43420ff6
--- /dev/null
+++ b/params_shard_26.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ab028c2669a18dd208ba948f10c46dfa1e83906d6f7fc5f7954c285f7ace3bcd
+size 70778880
diff --git a/params_shard_27.bin b/params_shard_27.bin
new file mode 100644
index 0000000000000000000000000000000000000000..132c05970eb794060c898793a6dca4b2aba196cf
--- /dev/null
+++ b/params_shard_27.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9e102aa0fa4916d43687287033aa75f69cb4811cbcd542bf0230b634890a5ddd
+size 141557760
diff --git a/params_shard_28.bin b/params_shard_28.bin
new file mode 100644
index 0000000000000000000000000000000000000000..729bb60fd88e4432319625bc2f6019925f01d18d
--- /dev/null
+++ b/params_shard_28.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9ee70bcb0bed96f754649ed5069fcbfbec3471b2289484459385d9413368165f
+size 18350080
diff --git a/params_shard_29.bin b/params_shard_29.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2cfa8ecd0530f6a7ee1fb5261c8e08bf22b640b1
--- /dev/null
+++ b/params_shard_29.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5523929d7f5bf4cd6844e8f48c0cad3dedb4a13a5c0cd3abe53275d81bf200fe
+size 20760576
diff --git a/params_shard_3.bin b/params_shard_3.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d45514125776c78d6a05087a4bb035abd0cd5667
--- /dev/null
+++ b/params_shard_3.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b8f4d9848631d25e0afb33626025233c383977b4797eb41fa0fca6a670cb0598
+size 141557760
diff --git a/params_shard_30.bin b/params_shard_30.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1c8253c592cebcb12dc404fc4a268affcce4b566
--- /dev/null
+++ b/params_shard_30.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:77cb15abc31f2e877a30ee7dd5f65adb304c1307503b082ec5b39364629e5adb
+size 70778880
diff --git a/params_shard_31.bin b/params_shard_31.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dcb15a960dc7157bd3d9566158923b86fdba5eb0
--- /dev/null
+++ b/params_shard_31.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3478fd99aee8bc0b6386c8e018879d17f6abab8fb54e254c3cd3a9ae8567214d
+size 141557760
diff --git a/params_shard_32.bin b/params_shard_32.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a4b8c9a96510a307be2901c1a8bb7bebb6b4ab8d
--- /dev/null
+++ b/params_shard_32.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:29461bb10f3c5eed26fce76df8a5a7eb052a4b04d563e3fa135d384120a4fe30
+size 18350080
diff --git a/params_shard_33.bin b/params_shard_33.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2f4071e752ebf55b3d48fedbc6a19798deab33d6
--- /dev/null
+++ b/params_shard_33.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:61b81eeb33abc7f790c294146155f179eda6ea16081658e32123c00aa8e027ee
+size 20760576
diff --git a/params_shard_34.bin b/params_shard_34.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ea3a2f607b2382ea8a4d2b08f4558377f1b45177
--- /dev/null
+++ b/params_shard_34.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cd0e47b1f34175d2bd6219b5019033e6a87c2f52f9dfde16aea4b0140dde8196
+size 70778880
diff --git a/params_shard_35.bin b/params_shard_35.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9ab17eda6fac581af8aa17df88f85438088426b2
--- /dev/null
+++ b/params_shard_35.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8d4bb3eabd6c36c03072cc9c0917c4432735b6115b6b6b82886c9bb1365894f9
+size 141557760
diff --git a/params_shard_36.bin b/params_shard_36.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f0da54fb75917625d82d5334ad15852bfb4de9df
--- /dev/null
+++ b/params_shard_36.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:60a7bdeb18b4894acc66d982d1f89a810464bd31ca9e9f0f5c7857542c307125
+size 18350080
diff --git a/params_shard_37.bin b/params_shard_37.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7c4434a0fb123c211a39c40e119c530fc17e2cd2
--- /dev/null
+++ b/params_shard_37.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c4ea8aad3aaee2501303c5b1fe130ffab32af631f079e6e7137cdf31fc95e627
+size 20760576
diff --git a/params_shard_38.bin b/params_shard_38.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fc7fc1c599c7a5cfbcb8ad67a935fe072a84e4c4
--- /dev/null
+++ b/params_shard_38.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:036fa2093a5cc067dabf8e42ab29b17244343957dd56bf77786ae73c279f831b
+size 70778880
diff --git a/params_shard_39.bin b/params_shard_39.bin
new file mode 100644
index 0000000000000000000000000000000000000000..283085547be5df5d2c2ef51e9166ada636ea3b99
--- /dev/null
+++ b/params_shard_39.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fee0106a96382fb4df37383c8142eb64a7caef4c8526da7a82f339f488b91864
+size 141557760
diff --git a/params_shard_4.bin b/params_shard_4.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4d247702633e3d511a1c92cf116dad39ecab0079
--- /dev/null
+++ b/params_shard_4.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f2cfc19c099d052176334ccd09bced255c7bc6280b17bf915a0bc12e0f93bf2d
+size 18350080
diff --git a/params_shard_40.bin b/params_shard_40.bin
new file mode 100644
index 0000000000000000000000000000000000000000..697860ad6c049399f0f3530e29b9d877614b38b0
--- /dev/null
+++ b/params_shard_40.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:340b98107522384c198ebc10e2017ae02a9f0b0d65e578500d9560cdfd77735e
+size 18350080
diff --git a/params_shard_41.bin b/params_shard_41.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3b49fafaa94b7f8249877af6778c4a4ca961e4df
--- /dev/null
+++ b/params_shard_41.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5c98a8aa4c10c587dfa557d4c95d7f6a9b1a3f6851e2a542de324e1980666f90
+size 20760576
diff --git a/params_shard_42.bin b/params_shard_42.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b74719ac6cc8f75b06e4c71d18fe390f49fdd94b
--- /dev/null
+++ b/params_shard_42.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:da2c905f4703f85f426b45012eb15221b058dcdc1177e2771396da560b5f4c9f
+size 70778880
diff --git a/params_shard_43.bin b/params_shard_43.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a476f82152eaae54fd9dc3611a1d9199e67a6619
--- /dev/null
+++ b/params_shard_43.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:78e603ff3c5a72560fc0f975d80d5fd217d5f40e7d91eeda89b6326c6b6d9ddb
+size 141557760
diff --git a/params_shard_44.bin b/params_shard_44.bin
new file mode 100644
index 0000000000000000000000000000000000000000..87c2a2ac388b0d4b4b40497fe79f401b75916eb8
--- /dev/null
+++ b/params_shard_44.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dee26afee257c266bb643f89b2dc8478db7652da361a0519dc68db008b297224
+size 18350080
diff --git a/params_shard_45.bin b/params_shard_45.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6b2f62a1373f0c0e8d26bc233d0d1366c91a9e32
--- /dev/null
+++ b/params_shard_45.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:58325e414cac5636bf8ee539c6ba894b0dd96537799b4f0e0ac3034892c355a1
+size 20760576
diff --git a/params_shard_46.bin b/params_shard_46.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9877e7d6c91ae1df09ab81a35e1ead995b1647be
--- /dev/null
+++ b/params_shard_46.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fc19a9c01bbe8365bf79c8a6447379b92d7aa677ad0cc25d2953a6fa27283c5c
+size 70778880
diff --git a/params_shard_47.bin b/params_shard_47.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8729e53d307a8398218b093f72045f269f101f67
--- /dev/null
+++ b/params_shard_47.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5a45ff72ee4f0bc9c891a2edf0f45374f27df3631d42f30baa8a2d34b0b3b1ac
+size 141557760
diff --git a/params_shard_48.bin b/params_shard_48.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f618785310c5afbadbea416a0ce85b3a57ef5e07
--- /dev/null
+++ b/params_shard_48.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:da0741f036eec9cc27654741c4f22d293dd736749763be4e359026a668fd756d
+size 18350080
diff --git a/params_shard_49.bin b/params_shard_49.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e45df6bacf840eb25f343b05b7be9193597a414f
--- /dev/null
+++ b/params_shard_49.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b8cb0cd754f1fd7044a51a938f0163c1d7203fc9399d683c7373b0b25b30dd59
+size 20760576
diff --git a/params_shard_5.bin b/params_shard_5.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1f412b28ae699540d9577abc39fca3aaf047cd70
--- /dev/null
+++ b/params_shard_5.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:464d3ce4c6ff4e4e667c7c8f1c7310b0c5a50c9d23b3751e0442ae00db2c6605
+size 31574016
diff --git a/params_shard_50.bin b/params_shard_50.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e174c50fdcbac057b2b53fa7a3e9b4f3cca5a91e
--- /dev/null
+++ b/params_shard_50.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1e404cd0b49c932a240813e6edc9651d453d71c8eecd4661383b9352f8dc1664
+size 70778880
diff --git a/params_shard_51.bin b/params_shard_51.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fd7f61cc604b6445d60eebcae4dd2611dc6a3bff
--- /dev/null
+++ b/params_shard_51.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7aad7969b5740ae371430ffc2e51f0faa910cc81fb8345e04ea4e54d0d002222
+size 141557760
diff --git a/params_shard_52.bin b/params_shard_52.bin
new file mode 100644
index 0000000000000000000000000000000000000000..474f4a370260af5259623ad7e0be93bb4a9ae32e
--- /dev/null
+++ b/params_shard_52.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:15c74c38d32aa87ba13d5ae85527e2515ab79fc91fb9c7db229eefb0cf06837c
+size 18350080
diff --git a/params_shard_53.bin b/params_shard_53.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d01153f2655f393f2b60162796f28363c9a3c6de
--- /dev/null
+++ b/params_shard_53.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e0e798cb4a43a86762b65643e2b82614dacad5f9ebf7e352419bdd635273a69e
+size 20760576
diff --git a/params_shard_54.bin b/params_shard_54.bin
new file mode 100644
index 0000000000000000000000000000000000000000..13de3ea0ef038dadc2a1061e6df1f13089a0ae73
--- /dev/null
+++ b/params_shard_54.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3e8dc4d8d845e5b13aec3918fbaacc0e6b4f4bf084e04a96b00503a746c46fd8
+size 70778880
diff --git a/params_shard_55.bin b/params_shard_55.bin
new file mode 100644
index 0000000000000000000000000000000000000000..efa12cdcaa833637c26861eb3104a20080b7161f
--- /dev/null
+++ b/params_shard_55.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:740966cc1a8f79aa94707b1c932f402a0fb7af9059b5762dab2c11a55f60d8a0
+size 141557760
diff --git a/params_shard_56.bin b/params_shard_56.bin
new file mode 100644
index 0000000000000000000000000000000000000000..23b8373fa1be75bb6841519ec0042d5ccf559537
--- /dev/null
+++ b/params_shard_56.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:17bde064e17f837372ec44b73f76af93fefb24e12bb97895824de44100029ca7
+size 18350080
diff --git a/params_shard_57.bin b/params_shard_57.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ed72b96fe0a89c8aa97703af6df97927c375f7be
--- /dev/null
+++ b/params_shard_57.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c7890508fe6222e5e78f3a5bef322f1dfb7918a61cc9ecf41290f44689b41184
+size 20760576
diff --git a/params_shard_58.bin b/params_shard_58.bin
new file mode 100644
index 0000000000000000000000000000000000000000..277f3d080cc857000141df9881374c8d4860fbe1
--- /dev/null
+++ b/params_shard_58.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:794948f010b05f1fd9593efc9f0b2f47521fa95ad4ae28710ab700129fc952ce
+size 70778880
diff --git a/params_shard_59.bin b/params_shard_59.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c61ff7d1f199497fc5fd651700ebd4d02c417217
--- /dev/null
+++ b/params_shard_59.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:32e2a9c19afcc36324afa29c244cba19516a6c5bbb4d8bb7180996cc68a43ae1
+size 141557760
diff --git a/params_shard_6.bin b/params_shard_6.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a22335fee7e7497742017e62714c8d2069376c3d
--- /dev/null
+++ b/params_shard_6.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5137b679327a6bb5dabf3629e0b1571b8cf11aedb22bbd11e1bb55467e0240a5
+size 70778880
diff --git a/params_shard_60.bin b/params_shard_60.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b14a9a2571397351963207220340681ff7adb001
--- /dev/null
+++ b/params_shard_60.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c40b30a2755c0f25cd217ede10d5aa8ec06c58f011017f17144f9db324cc296a
+size 18350080
diff --git a/params_shard_61.bin b/params_shard_61.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e7ed0a0b9a7e28ecfbc0e5cf7bbb7c4f381b0ab7
--- /dev/null
+++ b/params_shard_61.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:65fc96a9f3a6e4cd456c6c53a46eca1759f22fe6e20640482ebfd7cdc146741d
+size 20760576
diff --git a/params_shard_62.bin b/params_shard_62.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c2c8bd07e7006f0c41e32819714443aa64f4a28a
--- /dev/null
+++ b/params_shard_62.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4c7afe0f9009468a57c4fdd5b92eaa928503184965e4d16df91978ef646e2f5f
+size 70778880
diff --git a/params_shard_63.bin b/params_shard_63.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e2208ae0ff09737b1e33812a32023bb8aa44ea56
--- /dev/null
+++ b/params_shard_63.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1e7b774210d1e3a16f78a48025e3e69808d028bc10dfc266bf13ed0f2b0cc307
+size 141557760
diff --git a/params_shard_64.bin b/params_shard_64.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2a3f32735f7d368e23fe2e04c24848af0e5733ba
--- /dev/null
+++ b/params_shard_64.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:777ad8bd8310984083f9c4cf4548598f6d100deae59986c5bb50947bd662c052
+size 18350080
diff --git a/params_shard_65.bin b/params_shard_65.bin
new file mode 100644
index 0000000000000000000000000000000000000000..33a8d0e7ffd5d1895ea135549c25fe34cfa68bcb
--- /dev/null
+++ b/params_shard_65.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0cfb419f569cd9ccb072ca9cf6c42c99683b6bdb6f95938cadda867cdd59e4bd
+size 20760576
diff --git a/params_shard_66.bin b/params_shard_66.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a9768ccdfa8a131d3c9322d5c0125220ec39818e
--- /dev/null
+++ b/params_shard_66.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8f68203f4e6d6ac9bd92eb843a02b7f38d48d4c8bfd520e6aeb2c3a40cd83375
+size 70778880
diff --git a/params_shard_67.bin b/params_shard_67.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9f30db301d4e721b836d05d12db11ebb9b919c60
--- /dev/null
+++ b/params_shard_67.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d976588a174a3ade8b9d19df01a82c41f2f0a6e4499260762f82ad171057ae25
+size 141557760
diff --git a/params_shard_68.bin b/params_shard_68.bin
new file mode 100644
index 0000000000000000000000000000000000000000..79d816740525731b2395f48b9f38e230ee4cdaa6
--- /dev/null
+++ b/params_shard_68.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:20abd246838c063cf27d99b0fa082b60f5f9782514b9b3fe9e5fc4f1c9dc52be
+size 18350080
diff --git a/params_shard_69.bin b/params_shard_69.bin
new file mode 100644
index 0000000000000000000000000000000000000000..06ff07a3e58fdf2a4175e08984ab461733be6e1b
--- /dev/null
+++ b/params_shard_69.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5515ad0096a8d43795077a0572a9463d29ecee92c89d418f785d4180942b10f9
+size 20760576
diff --git a/params_shard_7.bin b/params_shard_7.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8ff85f168985f19027eaa352233c404a7a0934ab
--- /dev/null
+++ b/params_shard_7.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6b4996117e4badf49127aae3a1671c20cb899a22d65527cbc67176ac3cde06e4
+size 141557760
diff --git a/params_shard_70.bin b/params_shard_70.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8a35d1770bb1cdb85fb61d660821d9533459b047
--- /dev/null
+++ b/params_shard_70.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4cfda48c1032d502ae31caa0d89073206e5462901f7965dd831b59b29abd0e93
+size 70778880
diff --git a/params_shard_71.bin b/params_shard_71.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8a503ad14fb4af879d7a0431a57e4f1d9e62601e
--- /dev/null
+++ b/params_shard_71.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:90cc838a9bd7825e4a659b563d5807acebf641520d7cd5662907ddc83239d0ea
+size 141557760
diff --git a/params_shard_72.bin b/params_shard_72.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c0cb8f236e990d2ed527a9529ddde6892e877542
--- /dev/null
+++ b/params_shard_72.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:062a28d6a03bf5eaaa61f933a9ef6cfa1432c9cf2a1146facdf6ad14846ad495
+size 18350080
diff --git a/params_shard_73.bin b/params_shard_73.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1d28e79960ed6ce33b97205472986e4eb9a877d7
--- /dev/null
+++ b/params_shard_73.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:998ca392b99b16ba0b20742ce19e35c3b4aabdc91a3af5106c9d59daf67329b9
+size 20760576
diff --git a/params_shard_74.bin b/params_shard_74.bin
new file mode 100644
index 0000000000000000000000000000000000000000..55e054225db4781b7669c14d2f8209cd3ae9d9c4
--- /dev/null
+++ b/params_shard_74.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3353de49a9fab3c276ebc19cac63ea39c0ae103bddc4bcd72e1cd7f438903808
+size 70778880
diff --git a/params_shard_75.bin b/params_shard_75.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a3066f3f05df0709a4e0eacf1a3e31a6aa3ecba9
--- /dev/null
+++ b/params_shard_75.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f717db8f13a5c8fb1d69e62c48ea50cb3bf29de6ce55c2ed0f1cfbf1216d65ee
+size 141557760
diff --git a/params_shard_76.bin b/params_shard_76.bin
new file mode 100644
index 0000000000000000000000000000000000000000..aac0e43ab1863af3dc62a68ee5aab4dc2e245bfe
--- /dev/null
+++ b/params_shard_76.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4b1bbe7bd3cea9dc3bf0e2747e98461c9e2a6e60c1cb419c7fe803e2921b4728
+size 18350080
diff --git a/params_shard_77.bin b/params_shard_77.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d12b4f2bc8da09fb484752640a8fae0acaa12a7b
--- /dev/null
+++ b/params_shard_77.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:67a192e74f36c57cb066738463b0a3d45b243d2f95a424337545152ee255ee2d
+size 20760576
diff --git a/params_shard_78.bin b/params_shard_78.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e9e8bbe7417c5243611de7d0d1b09b96bb059b24
--- /dev/null
+++ b/params_shard_78.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b2cdb73a57466bdc24e444468314a8740c4bd4a4620c0c7472ab613e63be4be1
+size 70778880
diff --git a/params_shard_79.bin b/params_shard_79.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e44d02d23017d3f2ffe3934f9f8e78208eb2be41
--- /dev/null
+++ b/params_shard_79.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f1ae0472a180f5d96f13befd84b28e8dc2f0a0ff130a30de759a4d6d974752de
+size 141557760
diff --git a/params_shard_8.bin b/params_shard_8.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6541c65b3a91d61d8a302d8bcb8e1ae5ff8666dd
--- /dev/null
+++ b/params_shard_8.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4942e5788ff93f4d7b6ff6c8cd12ca9af7f877577862ba581098a8dc38ca7d1e
+size 18350080
diff --git a/params_shard_80.bin b/params_shard_80.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e430bc6eaa8a25eae4932e4072665ebfdf7cabe4
--- /dev/null
+++ b/params_shard_80.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d1f6d1adbd54750859b9688ef6a9aee09d3eaee77307c5df88a45ec08ef4b883
+size 18350080
diff --git a/params_shard_81.bin b/params_shard_81.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bda2a01dfbbefa77da9a282f914db1c41789413a
--- /dev/null
+++ b/params_shard_81.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d0cba324d8f8d08165ae0d77867fe2e5a14358da016a1ef4b6635c1e58a28af0
+size 20760576
diff --git a/params_shard_82.bin b/params_shard_82.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3149395f72d3350d585084800bc80021d65c3665
--- /dev/null
+++ b/params_shard_82.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8a1a8577f602ba52b8b6a4a64b0f2f33fbd9bd350d496fd6fd03fd8341823b15
+size 70778880
diff --git a/params_shard_83.bin b/params_shard_83.bin
new file mode 100644
index 0000000000000000000000000000000000000000..34b82d44e9d63a5931f4b7a1681d66ea2a5d04e3
--- /dev/null
+++ b/params_shard_83.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:321a53731b8d097db72285465822dfbc367939d8ff8ef84b1137b97d4e062453
+size 141557760
diff --git a/params_shard_84.bin b/params_shard_84.bin
new file mode 100644
index 0000000000000000000000000000000000000000..399e079d3a553d02c6da5fc3f30579edcfc0d5d0
--- /dev/null
+++ b/params_shard_84.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1382307676a45cad8fbeabffaf33d02b00c55baed9cbbc71cd1a8c63506b565a
+size 18350080
diff --git a/params_shard_85.bin b/params_shard_85.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a814789b80cff08cbe26eb286a5bfd6a14f69b6b
--- /dev/null
+++ b/params_shard_85.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:57dab7ceed011b514dc23469486ebb0fb29f070fcfbf4a1f4f9972892bf76f74
+size 20760576
diff --git a/params_shard_86.bin b/params_shard_86.bin
new file mode 100644
index 0000000000000000000000000000000000000000..92e4a73c116a1fd34fde18720060460527949fb6
--- /dev/null
+++ b/params_shard_86.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5a8688ea946c3b6d4117916b8bb3a07805bfe372ac000bf0862f4260ed29f10c
+size 70778880
diff --git a/params_shard_87.bin b/params_shard_87.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ae70ff29c2be9e53aefd6d45cc5ec6fbd5f35b12
--- /dev/null
+++ b/params_shard_87.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:500e8f6ea4ecd280100c7b5aa32019d37653056e4f995154c7a947ed4dca69c1
+size 141557760
diff --git a/params_shard_88.bin b/params_shard_88.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a03941d09075a8e615b4a170017c1216de77d11b
--- /dev/null
+++ b/params_shard_88.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:feac65ff06b521fe1be3efb5033d3c0e4cf3f0f05c0792db2342f1e2b7b0f60f
+size 18350080
diff --git a/params_shard_89.bin b/params_shard_89.bin
new file mode 100644
index 0000000000000000000000000000000000000000..75f2fa1ca57d58b8ea484ce92f9e78ea08572e14
--- /dev/null
+++ b/params_shard_89.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:52f920b6c99438d47959fe517be87a5887b5f60fc42e0d5d51edc77111efe997
+size 20760576
diff --git a/params_shard_9.bin b/params_shard_9.bin
new file mode 100644
index 0000000000000000000000000000000000000000..593ba30629cc79b0dba38e5b3ecaad3797a62c8f
--- /dev/null
+++ b/params_shard_9.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8f4ba7b1734e3c120110818a7adc861ec116f8f489a45b432efa817666050e32
+size 20760576
diff --git a/params_shard_90.bin b/params_shard_90.bin
new file mode 100644
index 0000000000000000000000000000000000000000..78e43c2fa3382763d1b54a1a16779bbfd6612b22
--- /dev/null
+++ b/params_shard_90.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f5afdf1fdde36aebc4e8182771afedc855f269a570d1b2a2aa2f1cf148be4ec9
+size 70778880
diff --git a/params_shard_91.bin b/params_shard_91.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0d40d2a3f4807c005dba154d9736785658ff64e4
--- /dev/null
+++ b/params_shard_91.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:059ff1755bb4434bddf05a9997866ad11100492885d03b39f2a4e065640ee4a1
+size 141557760
diff --git a/params_shard_92.bin b/params_shard_92.bin
new file mode 100644
index 0000000000000000000000000000000000000000..81ffc86e62773da3188983c5490ce333c514ad22
--- /dev/null
+++ b/params_shard_92.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:25e7a1871b90eb415fd924fa6efa757767389412eddacd56881426bd892d3513
+size 18350080
diff --git a/params_shard_93.bin b/params_shard_93.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e219f03f398dd4cc28f97dfd4ea463aeb4000439
--- /dev/null
+++ b/params_shard_93.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6d03496e85a535cc5164eae50a28e2e838889d0551052df2126291a6f134cdf9
+size 20760576
diff --git a/params_shard_94.bin b/params_shard_94.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bd1935eeab82a0eff1628fda1c80f94c7465ea1d
--- /dev/null
+++ b/params_shard_94.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:09c2cd40820a778f9278ea653e1fee541c0754fd3073566be0e012942dad9650
+size 70778880
diff --git a/params_shard_95.bin b/params_shard_95.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8ad9fac17cdc35f383cbae53a22ca470f2ed9c15
--- /dev/null
+++ b/params_shard_95.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:162d5a8afe946672e7e6f8b6ae248b523f6a3465ddba7a70596c8f72c5e5eea7
+size 141557760
diff --git a/params_shard_96.bin b/params_shard_96.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0f672d57671ddf13f56bb15778f9cba1cfd5fd22
--- /dev/null
+++ b/params_shard_96.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f5bc7529688cc009184d1846aa5651bde236d8d0707e1a5a61a20005370be272
+size 18350080
diff --git a/params_shard_97.bin b/params_shard_97.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2cc4376604094afe36e4b0b83f43ecbd4c177b96
--- /dev/null
+++ b/params_shard_97.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f89b06721a465336f5d766327a1925ff8a21dfd3ebd2208d154b4ba17a99fb70
+size 20760576
diff --git a/params_shard_98.bin b/params_shard_98.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ef1c15ea15214ee75d35cc65aee4c940b50c003a
--- /dev/null
+++ b/params_shard_98.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:339400e6ba05585a072724f56d7a7a87aa3c3f045613e7eaa198be163770acd3
+size 70778880
diff --git a/params_shard_99.bin b/params_shard_99.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4f6f92f6b319f7f0131aba04cfd0b4a9e8bb4093
--- /dev/null
+++ b/params_shard_99.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:191e7662de4ae6aaa7089fb0cbfcd6f5188c80feb3e8839a5b06e36007bd8151
+size 141557760
diff --git a/private-llm-config.json b/private-llm-config.json
new file mode 100644
index 0000000000000000000000000000000000000000..1e81ae0cb4c157444b450dfeb3798d019c2ce900
--- /dev/null
+++ b/private-llm-config.json
@@ -0,0 +1,45 @@
+{
+ "model_type": "qwen2",
+ "quantization": "GPTQ-Int4",
+ "model_config": {
+ "hidden_act": "silu",
+ "hidden_size": 5120,
+ "intermediate_size": 27648,
+ "num_attention_heads": 40,
+ "num_hidden_layers": 64,
+ "num_key_value_heads": 8,
+ "rms_norm_eps": 1e-05,
+ "rope_theta": 1000000.0,
+ "vocab_size": 152064,
+ "tie_word_embeddings": false,
+ "context_window_size": 8192,
+ "prefill_chunk_size": 128,
+ "tensor_parallel_shards": 1,
+ "head_dim": 128,
+ "dtype": "float32",
+ "max_batch_size": 80
+ },
+ "vocab_size": 152064,
+ "context_window_size": 8192,
+ "sliding_window_size": -1,
+ "prefill_chunk_size": 128,
+ "attention_sink_size": -1,
+ "tensor_parallel_shards": 1,
+ "mean_gen_len": 512,
+ "max_gen_len": 4096,
+ "shift_fill_factor": 0.3,
+ "temperature": 0.7,
+ "presence_penalty": 0.0,
+ "frequency_penalty": 0.0,
+ "repetition_penalty": 1.2,
+ "top_p": 0.95,
+ "conv_template": "deepseek-r1-qwen",
+ "pad_token_id": 0,
+ "bos_token_id": 151643,
+ "eos_token_id": 151643,
+ "tokenizer_files": [
+ "tokenizer.json",
+ "tokenizer_config.json"
+ ],
+ "version": "0.1.0"
+}
diff --git a/tokenizer.json b/tokenizer.json
new file mode 100644
index 0000000000000000000000000000000000000000..a34650995da6939a945c330eadb0687147ac3ef8
--- /dev/null
+++ b/tokenizer.json
@@ -0,0 +1,303282 @@
+{
+ "version": "1.0",
+ "truncation": null,
+ "padding": null,
+ "added_tokens": [
+ {
+ "id": 151643,
+ "content": "<|end▁of▁sentence|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 151644,
+ "content": "<|User|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": false
+ },
+ {
+ "id": 151645,
+ "content": "<|Assistant|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": false
+ },
+ {
+ "id": 151646,
+ "content": "<|begin▁of▁sentence|>",
+ "normalized": false,
+ "lstrip": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ {
+ "id": 151647,
+ "content": "<|EOT|>",
+ "normalized": false,
+ "lstrip": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ {
+ "id": 151648,
+ "content": "
&": 5789, + "CON": 5790, + "Ġrepl": 5791, + "Ġregular": 5792, + "Storage": 5793, + "ramework": 5794, + "Ġgoal": 5795, + "Ġtouch": 5796, + ".widget": 5797, + "Ġbuilt": 5798, + "des": 5799, + "Part": 5800, + "(re": 5801, + "Ġworth": 5802, + "hib": 5803, + "game": 5804, + "Ġв": 5805, + "acion": 5806, + "ĠWhite": 5807, + "(type": 5808, + "(`": 5809, + "Ġnatural": 5810, + "Ġinj": 5811, + "Ġcalcul": 5812, + "ĠApril": 5813, + ".List": 5814, + "Ġassociated": 5815, + "ĉSystem": 5816, + "~~": 5817, + "=[": 5818, + "Ġstorage": 5819, + "Ġbytes": 5820, + "Ġtravel": 5821, + "Ġsou": 5822, + "Ġpassed": 5823, + "!=": 5824, + "ascript": 5825, + ".open": 5826, + "Ġgrid": 5827, + "Ġbus": 5828, + "Ġrecogn": 5829, + "Ab": 5830, + "Ġhon": 5831, + "ĠCenter": 5832, + "Ġprec": 5833, + "build": 5834, + "HTML": 5835, + "ĠSan": 5836, + "Ġcountries": 5837, + "aled": 5838, + "token": 5839, + "kt": 5840, + "Ġqual": 5841, + "Last": 5842, + "adow": 5843, + "Ġmanufact": 5844, + "idad": 5845, + "jango": 5846, + "Next": 5847, + "xf": 5848, + ".a": 5849, + "Ġporno": 5850, + "ĠPM": 5851, + "erve": 5852, + "iting": 5853, + "_th": 5854, + "ci": 5855, + "=None": 5856, + "gs": 5857, + "Ġlogin": 5858, + "atives": 5859, + "']);Ċ": 5860, + "Äħ": 5861, + "Ġill": 5862, + "IA": 5863, + "children": 5864, + "DO": 5865, + "Ġlevels": 5866, + "Ġ{{": 5867, + "Ġlooks": 5868, + "Ġ\"#": 5869, + "ToString": 5870, + "Ġnecessary": 5871, + "ĠĠĠĊ": 5872, + "cell": 5873, + "Entry": 5874, + "Ġ'#": 5875, + "Ġextrem": 5876, + "Selector": 5877, + "Ġplaceholder": 5878, + "Load": 5879, + "Ġreleased": 5880, + "ORE": 5881, + "Enumer": 5882, + "ĠTV": 5883, + "SET": 5884, + "inq": 5885, + "Press": 5886, + "ĠDepartment": 5887, + "Ġproperties": 5888, + "Ġrespond": 5889, + "Search": 5890, + "ael": 5891, + "Ġrequ": 5892, + "ĠBook": 5893, + "/Ċ": 5894, + "(st": 5895, + "Ġfinancial": 5896, + "icket": 5897, + "_input": 5898, + "Ġthreat": 5899, + "(in": 5900, + "Strip": 5901, + "ìĿ": 5902, + "ção": 5903, + "Ġevidence": 5904, + "));": 5905, + 
"ĠBro": 5906, + "Ġ[];Ċ": 5907, + "Ġou": 5908, + "buf": 5909, + "Script": 5910, + "dat": 5911, + "Ġrule": 5912, + "#import": 5913, + "=\"/": 5914, + "Serial": 5915, + "Ġstarting": 5916, + "[index": 5917, + "ae": 5918, + "Ġcontrib": 5919, + "session": 5920, + "_new": 5921, + "utable": 5922, + "ober": 5923, + "Ġ\"./": 5924, + "Ġlogger": 5925, + "Ġrecently": 5926, + "Ġreturned": 5927, + "ččĊ": 5928, + ")))Ċ": 5929, + "itions": 5930, + "Ġseek": 5931, + "Ġcommunic": 5932, + "Ġ\".": 5933, + "Ġusername": 5934, + "ECT": 5935, + "DS": 5936, + "Ġotherwise": 5937, + "ĠGerman": 5938, + ".aw": 5939, + "Adapter": 5940, + "ixel": 5941, + "Ġsystems": 5942, + "Ġdrop": 5943, + "Ġstructure": 5944, + "Ġ$(\"#": 5945, + "encies": 5946, + "anning": 5947, + "ĠLink": 5948, + "ĠResponse": 5949, + "Ġstri": 5950, + "ż": 5951, + "ĠDB": 5952, + "æĹ": 5953, + "android": 5954, + "submit": 5955, + "otion": 5956, + "(@": 5957, + ".test": 5958, + "ĊĊĊĊĊĊĊĊ": 5959, + "];čĊ": 5960, + "Ġdirectly": 5961, + "Ġ\"%": 5962, + "ris": 5963, + "elta": 5964, + "AIL": 5965, + "){čĊ": 5966, + "mine": 5967, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 5968, + "(k": 5969, + "bon": 5970, + "asic": 5971, + "pite": 5972, + "___": 5973, + "Max": 5974, + "Ġerrors": 5975, + "ĠWhile": 5976, + "Ġarguments": 5977, + "Ġensure": 5978, + "Right": 5979, + "-based": 5980, + "Web": 5981, + "Ġ-=": 5982, + "Ġintrodu": 5983, + "ĠInst": 5984, + "ĠWash": 5985, + "ordin": 5986, + "join": 5987, + "Database": 5988, + "Ġgrad": 5989, + "Ġusually": 5990, + "ITE": 5991, + "Props": 5992, + "?>Ċ": 5993, + "ĠGo": 5994, + "@Override": 5995, + "REF": 5996, + "Ġip": 5997, + "ĠAustral": 5998, + "Ġist": 5999, + "ViewById": 6000, + "Ġserious": 6001, + "Ġcustomer": 6002, + ".prototype": 6003, + "odo": 6004, + "cor": 6005, + "Ġdoor": 6006, + "ĠWITHOUT": 6007, + "Ġplant": 6008, + "Ġbegan": 6009, + "Ġdistance": 6010, + "()).": 6011, + "Ġchance": 6012, + "Ġord": 6013, + "came": 6014, + "pragma": 6015, + "Ġprotect": 6016, + "ragment": 6017, + "ĠNode": 6018, + "ening": 
6019, + "Ñĩ": 6020, + "Ġroute": 6021, + "ĠSchool": 6022, + "hi": 6023, + "Ġneighb": 6024, + "After": 6025, + "licit": 6026, + "Ġcontr": 6027, + "Ġprimary": 6028, + "AA": 6029, + ".WriteLine": 6030, + "utils": 6031, + "Ġbi": 6032, + "Red": 6033, + ".Linq": 6034, + ".object": 6035, + "Ġleaders": 6036, + "unities": 6037, + "Ġgun": 6038, + "onth": 6039, + "ĠDev": 6040, + "FILE": 6041, + "Ġcomments": 6042, + "_len": 6043, + "arrow": 6044, + "amount": 6045, + "Range": 6046, + "sert": 6047, + "GridView": 6048, + "Ġupdated": 6049, + "ĠMo": 6050, + "Ġinform": 6051, + "ociety": 6052, + "ala": 6053, + "Access": 6054, + "Ġhab": 6055, + "Ġcreat": 6056, + "_arg": 6057, + "ĠJanuary": 6058, + "ĠDay": 6059, + "\")čĊ": 6060, + "uple": 6061, + "document": 6062, + "gorith": 6063, + "menu": 6064, + "ĠOver": 6065, + "bb": 6066, + ".title": 6067, + "_out": 6068, + "Ġled": 6069, + "uri": 6070, + "Ġ?>": 6071, + "gl": 6072, + "Ġbank": 6073, + "ayment": 6074, + "ĉprintf": 6075, + "MD": 6076, + "Ġsample": 6077, + "Ġhands": 6078, + "ĠVersion": 6079, + "uario": 6080, + "Ġoffers": 6081, + "ityEngine": 6082, + "Ġshape": 6083, + "Ġsleep": 6084, + "_point": 6085, + "Settings": 6086, + "Ġachie": 6087, + "Ġsold": 6088, + "ota": 6089, + ".bind": 6090, + "Am": 6091, + "Ġsafe": 6092, + "Store": 6093, + "Ġshared": 6094, + "Ġpriv": 6095, + "_VAL": 6096, + "Ġsens": 6097, + "){": 6098, + "Ġremember": 6099, + "shared": 6100, + "element": 6101, + "Ġshoot": 6102, + "Vert": 6103, + "cout": 6104, + "Ġenv": 6105, + "_label": 6106, + "Ġ>Ċ": 6107, + "run": 6108, + "Ġscene": 6109, + "(array": 6110, + "device": 6111, + "_title": 6112, + "agon": 6113, + "]čĊ": 6114, + "aby": 6115, + "Ġbecame": 6116, + "boolean": 6117, + "Ġpark": 6118, + "ĠCode": 6119, + "upload": 6120, + "riday": 6121, + "ĠSeptember": 6122, + "Fe": 6123, + "Ġsen": 6124, + "cing": 6125, + "FL": 6126, + "Col": 6127, + "uts": 6128, + "_page": 6129, + "inn": 6130, + "Ġimplied": 6131, + "aling": 6132, + "Ġyourself": 6133, + ".Count": 6134, + "conf": 6135, 
+ "Ġaud": 6136, + "_init": 6137, + ".)": 6138, + "Ġwrote": 6139, + "NG": 6140, + ".Error": 6141, + "ä»": 6142, + ".for": 6143, + "Ġequal": 6144, + "ĠRequest": 6145, + "Ġserial": 6146, + "Ġallows": 6147, + "XX": 6148, + "Ġmiddle": 6149, + "chor": 6150, + "ø": 6151, + "erval": 6152, + ".Column": 6153, + "reading": 6154, + "Ġescort": 6155, + "ĠAugust": 6156, + "Ġquickly": 6157, + "Ġweap": 6158, + "ĠCG": 6159, + "ropri": 6160, + "ho": 6161, + "Ġcop": 6162, + "(struct": 6163, + "ĠBig": 6164, + "Ġvs": 6165, + "Ġfrequ": 6166, + ".Value": 6167, + "Ġactions": 6168, + "Ġproper": 6169, + "Ġinn": 6170, + "Ġobjects": 6171, + "Ġmatrix": 6172, + "avascript": 6173, + "Ġones": 6174, + ".group": 6175, + "Ġgreen": 6176, + "Ġpaint": 6177, + "ools": 6178, + "ycl": 6179, + "encode": 6180, + "olt": 6181, + "comment": 6182, + ".api": 6183, + "Dir": 6184, + "Ġune": 6185, + "izont": 6186, + ".position": 6187, + "Ġdesigned": 6188, + "_val": 6189, + "avi": 6190, + "iring": 6191, + "tab": 6192, + "Ġlayer": 6193, + "Ġviews": 6194, + "Ġreve": 6195, + "rael": 6196, + "ĠON": 6197, + "rics": 6198, + "np": 6199, + "Ġcore": 6200, + "());čĊ": 6201, + "Main": 6202, + "Ġexpert": 6203, + "ĉĉčĊ": 6204, + "_en": 6205, + "Ġ/>": 6206, + "utter": 6207, + "IAL": 6208, + "ails": 6209, + "ĠKing": 6210, + "*/ĊĊ": 6211, + "ĠMet": 6212, + "_end": 6213, + "addr": 6214, + "ora": 6215, + "Ġir": 6216, + "Min": 6217, + "Ġsurpr": 6218, + "Ġrepe": 6219, + "Ġdirectory": 6220, + "PUT": 6221, + "-S": 6222, + "Ġelection": 6223, + "haps": 6224, + ".pre": 6225, + "cm": 6226, + "Values": 6227, + "Ġ\"Ċ": 6228, + "column": 6229, + "ivil": 6230, + "Login": 6231, + "inue": 6232, + "Ġbeautiful": 6233, + "Ġsecret": 6234, + "(event": 6235, + "Ġchat": 6236, + "ums": 6237, + "Ġorigin": 6238, + "Ġeffects": 6239, + "Ġmanagement": 6240, + "illa": 6241, + "tk": 6242, + "Ġsetting": 6243, + "ĠCour": 6244, + "Ġmassage": 6245, + "ĉend": 6246, + "Ġhappy": 6247, + "Ġfinish": 6248, + "Ġcamera": 6249, + "ĠVer": 6250, + "ĠDemocr": 6251, + "ĠHer": 
6252, + "(Q": 6253, + "cons": 6254, + "ita": 6255, + "Ġ'.": 6256, + "{}": 6257, + "ĉC": 6258, + "Ġstuff": 6259, + "Ġ:Ċ": 6260, + "ĠAR": 6261, + "Task": 6262, + "hidden": 6263, + "eros": 6264, + "IGN": 6265, + "atio": 6266, + "ĠHealth": 6267, + "olute": 6268, + "Enter": 6269, + "'>": 6270, + "ĠTwitter": 6271, + "ĠCounty": 6272, + "scribe": 6273, + "Ġ=>Ċ": 6274, + "Ġhy": 6275, + "fit": 6276, + "Ġmilitary": 6277, + "Ġsale": 6278, + "required": 6279, + "non": 6280, + "bootstrap": 6281, + "hold": 6282, + "rim": 6283, + "-old": 6284, + "ĠDown": 6285, + "Ġmention": 6286, + "contact": 6287, + "_group": 6288, + "oday": 6289, + "Ġtown": 6290, + "Ġsolution": 6291, + "uate": 6292, + "elling": 6293, + "]->": 6294, + "otes": 6295, + "ental": 6296, + "omen": 6297, + "ospital": 6298, + "ĠSup": 6299, + "_EN": 6300, + "Ġslow": 6301, + "SESSION": 6302, + "Ġblue": 6303, + "ago": 6304, + "Ġlives": 6305, + "Ġ^": 6306, + ".un": 6307, + "inst": 6308, + "enge": 6309, + "Ġcustomers": 6310, + "Ġcast": 6311, + "udget": 6312, + "ï¼ģ": 6313, + "icens": 6314, + "Ġdetermin": 6315, + "Selected": 6316, + "_pl": 6317, + "ueue": 6318, + "Ġdark": 6319, + "//ĊĊ": 6320, + "si": 6321, + "thern": 6322, + "ĠJapan": 6323, + "/w": 6324, + "PU": 6325, + "ĠEast": 6326, + "ovie": 6327, + "Ġpackage": 6328, + "Ġnor": 6329, + "Ġapi": 6330, + "bot": 6331, + "\"];Ċ": 6332, + "_post": 6333, + "ulate": 6334, + "Ġclub": 6335, + "'));Ċ": 6336, + "Ġloop": 6337, + "PIO": 6338, + "ione": 6339, + "shot": 6340, + "Initial": 6341, + "Ġplayed": 6342, + "register": 6343, + "rought": 6344, + "_max": 6345, + "acement": 6346, + "match": 6347, + "raphics": 6348, + "AST": 6349, + "Ġexisting": 6350, + "Ġcomplex": 6351, + "DA": 6352, + ".Ch": 6353, + ".common": 6354, + "mo": 6355, + "Ġ'../../": 6356, + "ito": 6357, + "Ġanalysis": 6358, + "Ġdeliver": 6359, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĊ": 6360, + "idx": 6361, + "Ãł": 6362, + "ongo": 6363, + "ĠEnglish": 6364, + "Ċ": 9992, + "_default": 9993, + "ĠDatabase": 9994, + "rep": 9995, + "ESS": 9996, + 
"nergy": 9997, + ".Find": 9998, + "_mask": 9999, + "Ġrise": 10000, + "Ġkernel": 10001, + "::$": 10002, + ".Q": 10003, + "Ġoffering": 10004, + "decl": 10005, + "ĠCS": 10006, + "Ġlisted": 10007, + "Ġmostly": 10008, + "enger": 10009, + "Ġblocks": 10010, + "olo": 10011, + "Ġgoverning": 10012, + "\\F": 10013, + "Ġconcent": 10014, + ".getText": 10015, + "Ġmb": 10016, + "Ġoccurred": 10017, + "Ġchanging": 10018, + "Scene": 10019, + "_CODE": 10020, + "Beh": 10021, + "\"The": 10022, + "Ġtile": 10023, + "ĠAssociation": 10024, + "ĉP": 10025, + "alty": 10026, + "_ad": 10027, + "odies": 10028, + "iated": 10029, + "Ġprepared": 10030, + "possible": 10031, + "Ġmort": 10032, + "TEST": 10033, + "Ġignore": 10034, + "Ġcalc": 10035, + "Ġrs": 10036, + "ĠassertEquals": 10037, + "Ġsz": 10038, + "ĠTHIS": 10039, + ".\"Ċ": 10040, + "Ġcanvas": 10041, + "java": 10042, + "Ġdut": 10043, + "VALID": 10044, + ".sql": 10045, + ".input": 10046, + "Ġaux": 10047, + "Sup": 10048, + "Ġartist": 10049, + "Vec": 10050, + "_TIME": 10051, + ".stringify": 10052, + "etween": 10053, + "ĠCategory": 10054, + "Ġ[-": 10055, + "ĠDevExpress": 10056, + "ĠJul": 10057, + "Ġring": 10058, + ".ed": 10059, + "YY": 10060, + "Let": 10061, + "TextField": 10062, + "Ġflat": 10063, + "_print": 10064, + "ĠOTHER": 10065, + "adian": 10066, + "Ġchecked": 10067, + "ele": 10068, + "Align": 10069, + "standing": 10070, + "Ġ[],": 10071, + "Ġlab": 10072, + "ucky": 10073, + "ĠChristmas": 10074, + "(image": 10075, + ".module": 10076, + "Ġlots": 10077, + "Ġslightly": 10078, + "(final": 10079, + "erge": 10080, + "è¿": 10081, + "ĠPolice": 10082, + "ĠRight": 10083, + "Ġaward": 10084, + "ĠOS": 10085, + "Ġ{}ĊĊ": 10086, + "Ġptr": 10087, + "oves": 10088, + "icated": 10089, + "ем": 10090, + "Ġmanage": 10091, + "oliday": 10092, + "Amount": 10093, + "oolStrip": 10094, + "tbody": 10095, + "Nav": 10096, + "wrap": 10097, + "BB": 10098, + "Ġwatching": 10099, + "arios": 10100, + "Ġoptional": 10101, + "_K": 10102, + "ĠLicensed": 10103, + ".Map": 10104, + 
"Timer": 10105, + "ĠAP": 10106, + "ĠRev": 10107, + "(o": 10108, + ",c": 10109, + "umin": 10110, + "etailed": 10111, + "ĠHy": 10112, + "Ġblank": 10113, + "agger": 10114, + "ĠSelf": 10115, + "()[": 10116, + ".make": 10117, + "earn": 10118, + "channel": 10119, + ";Ċ": 10133, + "World": 10134, + "Ġpython": 10135, + "Ġlif": 10136, + "Ġtrav": 10137, + "Ġconven": 10138, + "company": 10139, + "ĠClub": 10140, + "Ver": 10141, + "Btn": 10142, + "Ġzone": 10143, + "products": 10144, + "ĠEduc": 10145, + "Ġverify": 10146, + "ĠMil": 10147, + "ono": 10148, + "]);ĊĊ": 10149, + "ENCE": 10150, + "Ġpacket": 10151, + "Ġcer": 10152, + "Ġenumer": 10153, + "Ġpars": 10154, + "formed": 10155, + "Ġoccup": 10156, + "tre": 10157, + "Ġexercise": 10158, + "Day": 10159, + "_sum": 10160, + "Ġasking": 10161, + "aption": 10162, + "Ġorders": 10163, + "Ġspending": 10164, + "ĠERR": 10165, + ".Dis": 10166, + "ĠUtil": 10167, + "âĢľI": 10168, + "\\'": 10169, + "?)": 10170, + "/>Ċ": 10171, + "Ġemot": 10172, + "Ġinfluence": 10173, + "ĠAfrica": 10174, + "atters": 10175, + "Ùħ": 10176, + ".session": 10177, + "Ġchief": 10178, + "ĉĉĉĉĉĉĉĉĉĉĉ": 10179, + "Ġtom": 10180, + "cluded": 10181, + "serial": 10182, + "_handler": 10183, + ".Type": 10184, + "aped": 10185, + "Ġpolicies": 10186, + "-ex": 10187, + "-tr": 10188, + "blank": 10189, + "merce": 10190, + "Ġcoverage": 10191, + "Ġrc": 10192, + "_matrix": 10193, + "_box": 10194, + "Ġcharges": 10195, + "ĠBoston": 10196, + "Pe": 10197, + "Ġcircum": 10198, + "Ġfilled": 10199, + "Ġnorth": 10200, + "ictureBox": 10201, + "ĉres": 10202, + "è®": 10203, + "Ġtermin": 10204, + "Ġ[âĢ¦": 10205, + "IRECT": 10206, + "Ġber": 10207, + "Ġ\"../../": 10208, + "retch": 10209, + ".code": 10210, + "_col": 10211, + "ĠGovernment": 10212, + "Ġargv": 10213, + "ĠLord": 10214, + "asi": 10215, + "Exec": 10216, + "ĉlet": 10217, + "vertis": 10218, + "Ġdiscussion": 10219, + "enance": 10220, + "outube": 10221, + "typeof": 10222, + "Ġserved": 10223, + "ĠPut": 10224, + "ĉx": 10225, + "Ġsweet": 10226, + 
"Before": 10227, + "ategy": 10228, + ".of": 10229, + "ĠMaterial": 10230, + "Sort": 10231, + "ONT": 10232, + "igital": 10233, + "Why": 10234, + "Ġsust": 10235, + "Ġç": 10236, + "abet": 10237, + "Ġsegment": 10238, + "Ġ[],Ċ": 10239, + "ĠMuslim": 10240, + "ĠfindViewById": 10241, + "cut": 10242, + "_TEXT": 10243, + "ĠMary": 10244, + "Ġloved": 10245, + "Ġlie": 10246, + "ĠJO": 10247, + "Ġisset": 10248, + "month": 10249, + "Ġprime": 10250, + "ti": 10251, + "ĠCarol": 10252, + "Use": 10253, + "ĠPop": 10254, + "ĠSave": 10255, + "Interval": 10256, + "execute": 10257, + "dy": 10258, + "ĠIran": 10259, + "_cont": 10260, + "ĉT": 10261, + "Ġphase": 10262, + "checkbox": 10263, + "week": 10264, + "Ġhide": 10265, + "Ġtil": 10266, + "Ġju": 10267, + "Custom": 10268, + "burg": 10269, + "/M": 10270, + "TON": 10271, + "Ġquant": 10272, + "Ġrub": 10273, + "ixels": 10274, + "Ġinstalled": 10275, + "Ġdump": 10276, + "Ġproperly": 10277, + "(List": 10278, + "Ġdecide": 10279, + "apply": 10280, + "Has": 10281, + "Ġkeeping": 10282, + "Ġcitizens": 10283, + "Ġjoint": 10284, + "pool": 10285, + "Socket": 10286, + "_op": 10287, + "Ġweapon": 10288, + "gnore": 10289, + "ĠExec": 10290, + "otten": 10291, + "ĠMS": 10292, + "Ġ(-": 10293, + "ĠReview": 10294, + "Ġexamples": 10295, + "Ġtight": 10296, + "!(": 10297, + "DP": 10298, + "ĠMessageBox": 10299, + "Ġphotograph": 10300, + "URI": 10301, + "ét": 10302, + "low": 10303, + "ĠGrand": 10304, + ".persistence": 10305, + "Ġmaintain": 10306, + "Ġnums": 10307, + "Ġzip": 10308, + "ials": 10309, + "ĠGets": 10310, + "peg": 10311, + "ĠBuffer": 10312, + "~~~~": 10313, + "rastructure": 10314, + "ĠPL": 10315, + "uen": 10316, + "obby": 10317, + "sizeof": 10318, + "Ġpic": 10319, + "Ġseed": 10320, + "Ġexperienced": 10321, + "Ġodd": 10322, + "Ġkick": 10323, + "Ġprocedure": 10324, + "avigator": 10325, + "-on": 10326, + ",j": 10327, + "ĠAlthough": 10328, + "ĠuserId": 10329, + "accept": 10330, + "Blue": 10331, + "IColor": 10332, + "layer": 10333, + "available": 10334, + "Ġends": 
10335, + ".table": 10336, + "Ġdataset": 10337, + "bus": 10338, + "Ġexplain": 10339, + "(pro": 10340, + "ĠCommittee": 10341, + "Ġnoted": 10342, + "]:Ċ": 10343, + "Dim": 10344, + "stdio": 10345, + ".\",Ċ": 10346, + "_source": 10347, + "ĠWeek": 10348, + "ĠEdge": 10349, + "Ġoperating": 10350, + "Ġeste": 10351, + "ipl": 10352, + "agination": 10353, + "Ġproceed": 10354, + "Ġanimation": 10355, + ".Models": 10356, + "ĠWatch": 10357, + "iat": 10358, + "Ġoppon": 10359, + "/A": 10360, + "Report": 10361, + "Ġsounds": 10362, + "_buf": 10363, + "IELD": 10364, + "Ġbund": 10365, + "ĉget": 10366, + ".pr": 10367, + "(tmp": 10368, + "Ġkid": 10369, + ">ĊĊĊ": 10370, + "Ġyang": 10371, + "NotFound": 10372, + "ÑĨ": 10373, + "math": 10374, + "@gmail": 10375, + "ĠLIMIT": 10376, + "redients": 10377, + "Ġvent": 10378, + "avigate": 10379, + "Look": 10380, + "Ġreligious": 10381, + "Ġrand": 10382, + "rio": 10383, + "(GL": 10384, + "_ip": 10385, + "uan": 10386, + "iciency": 10387, + "ĠChange": 10388, + ">čĊčĊ": 10389, + "ĠEntity": 10390, + "Ġrencontre": 10391, + "ĠRet": 10392, + "plan": 10393, + "én": 10394, + "BOOL": 10395, + "uries": 10396, + "train": 10397, + "Definition": 10398, + "============": 10399, + "zz": 10400, + "Animation": 10401, + "ĠOK": 10402, + "_menu": 10403, + ".bl": 10404, + "_score": 10405, + "Ġacad": 10406, + "(System": 10407, + "Ġrefresh": 10408, + "'=>$": 10409, + ".Graphics": 10410, + "amento": 10411, + "pid": 10412, + "tc": 10413, + "Ġtips": 10414, + "Ġhomes": 10415, + "Ġfuel": 10416, + "âĸ": 10417, + "_helper": 10418, + "ĠĠčĊ": 10419, + "ĠRoom": 10420, + ".Close": 10421, + "_attr": 10422, + "ĠMount": 10423, + "ĠEv": 10424, + "arser": 10425, + "_top": 10426, + "eah": 10427, + "ĠDelete": 10428, + "ãĢį": 10429, + "uke": 10430, + "Ġusage": 10431, + "aria": 10432, + "_dev": 10433, + "Ġtexture": 10434, + "Ġconversation": 10435, + "eper": 10436, + "Bean": 10437, + "done": 10438, + "nonatomic": 10439, + "ĠSecond": 10440, + "Ġshooting": 10441, + "_pre": 10442, + "Components": 
10443, + "Ġ]ĊĊ": 10444, + "__,": 10445, + "stitution": 10446, + ".Char": 10447, + ">();ĊĊ": 10448, + "Ġpresented": 10449, + "Ġwa": 10450, + "oker": 10451, + "-ĊĊ": 10452, + "iner": 10453, + "Ġbecoming": 10454, + "Ġincident": 10455, + "Att": 10456, + "Ġrevealed": 10457, + "forc": 10458, + "Ġboot": 10459, + ".page": 10460, + "Enumerator": 10461, + "_->": 10462, + "Photo": 10463, + "Ġspring": 10464, + ".\",": 10465, + "ĠDictionary": 10466, + "BJECT": 10467, + "Ġlocations": 10468, + "Ġsamples": 10469, + "InputStream": 10470, + "ĠBrown": 10471, + "Ġstats": 10472, + "quality": 10473, + "Ñħ": 10474, + "-dis": 10475, + "Ġhelping": 10476, + "Ġped": 10477, + "(se": 10478, + "ĠWho": 10479, + "alian": 10480, + "internal": 10481, + "Ġft": 10482, + ">().": 10483, + "->{": 10484, + "Ġmine": 10485, + "Ġsector": 10486, + "Ġgro": 10487, + "Ġopportunities": 10488, + "Ġü": 10489, + "Ġmp": 10490, + "Ġalleged": 10491, + "Ġdoubt": 10492, + "Mouse": 10493, + "About": 10494, + "_part": 10495, + "Ġchair": 10496, + "Ġstopped": 10497, + "loop": 10498, + "entities": 10499, + "Ġapps": 10500, + "ansion": 10501, + "Ġmental": 10502, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 10503, + "FR": 10504, + "Ġdefend": 10505, + "care": 10506, + "Ġideal": 10507, + "/api": 10508, + "urface": 10509, + "Ġele": 10510, + "ulator": 10511, + "ĠRights": 10512, + "anguages": 10513, + "Ġfunds": 10514, + "Ġadapt": 10515, + "Attributes": 10516, + "Ġdeploy": 10517, + "opts": 10518, + "Ġvalidation": 10519, + "Ġconcerns": 10520, + "uce": 10521, + ".num": 10522, + "ulture": 10523, + "ila": 10524, + "Ġcup": 10525, + "Ġpure": 10526, + ".Fore": 10527, + "ĠHashMap": 10528, + ".valueOf": 10529, + "asm": 10530, + "MO": 10531, + "Ġcs": 10532, + "Ġstores": 10533, + "Ġ************************************************************************": 10534, + "Ġcommunication": 10535, + "mem": 10536, + ".EventHandler": 10537, + ".Status": 10538, + "_right": 10539, + ".setOn": 10540, + "Sheet": 10541, + "Ġidentify": 10542, + "enerated": 
10543, + "ordered": 10544, + "Ġ\"[": 10545, + "Ġswe": 10546, + "Condition": 10547, + "ĠAccording": 10548, + "Ġprepare": 10549, + "Ġrob": 10550, + "Pool": 10551, + "Ġsport": 10552, + "rv": 10553, + "ĠRouter": 10554, + "Ġalternative": 10555, + "([]": 10556, + "ĠChicago": 10557, + "ipher": 10558, + "ische": 10559, + "ĠDirector": 10560, + "kl": 10561, + "ĠWil": 10562, + "keys": 10563, + "Ġmysql": 10564, + "Ġwelcome": 10565, + "king": 10566, + "ĠManager": 10567, + "Ġcaught": 10568, + ")}Ċ": 10569, + "Score": 10570, + "_PR": 10571, + "Ġsurvey": 10572, + "hab": 10573, + "Headers": 10574, + "ADER": 10575, + "Ġdecor": 10576, + "Ġturns": 10577, + "Ġradius": 10578, + "errupt": 10579, + "Cor": 10580, + "Ġmel": 10581, + "Ġintr": 10582, + "(q": 10583, + "ĠAC": 10584, + "amos": 10585, + "MAX": 10586, + "ĠGrid": 10587, + "ĠJesus": 10588, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 10589, + ".DE": 10590, + "Ġts": 10591, + "Ġlinked": 10592, + "free": 10593, + "ĠQt": 10594, + "Ġ/**čĊ": 10595, + "Ġfaster": 10596, + "ctr": 10597, + "_J": 10598, + "DT": 10599, + ".Check": 10600, + "Ġcombination": 10601, + "Ġintended": 10602, + "-the": 10603, + "-type": 10604, + "ectors": 10605, + "ami": 10606, + "uting": 10607, + "Ġuma": 10608, + "XML": 10609, + "UCT": 10610, + "Ap": 10611, + "ĠRandom": 10612, + "Ġran": 10613, + ".sort": 10614, + "Ġsorted": 10615, + ".Un": 10616, + "_PER": 10617, + "itory": 10618, + "Ġpriority": 10619, + "ĠGal": 10620, + "ĠOld": 10621, + "hot": 10622, + "ĠDisplay": 10623, + "(sub": 10624, + "_TH": 10625, + "_Y": 10626, + "ĠCare": 10627, + "loading": 10628, + "Kind": 10629, + "_handle": 10630, + ",,": 10631, + "rase": 10632, + "_replace": 10633, + ".addEventListener": 10634, + "ĠRT": 10635, + "Ġentered": 10636, + "gers": 10637, + "Ġich": 10638, + "(start": 10639, + "/app": 10640, + "Ġbrother": 10641, + "Memory": 10642, + "Outlet": 10643, + "Ġutf": 10644, + "prec": 10645, + "Ġnavigation": 10646, + "ORK": 10647, + "Ġdst": 10648, + "Detail": 10649, + "Ġaudience": 10650, + 
"Ġdur": 10651, + "Ġcluster": 10652, + "unched": 10653, + "Ġ],": 10654, + "Ġcomfortable": 10655, + ".values": 10656, + "ĠTotal": 10657, + "Ġsnap": 10658, + "Ġstandards": 10659, + "Ġperformed": 10660, + "hand": 10661, + "(\"@": 10662, + "åŃ": 10663, + "Ġphil": 10664, + "ibr": 10665, + "trim": 10666, + "Ġforget": 10667, + "Ġdoctor": 10668, + ".TextBox": 10669, + "icons": 10670, + ",s": 10671, + "ĠOp": 10672, + "Sm": 10673, + "Stop": 10674, + "ĉList": 10675, + "ĉu": 10676, + "Comment": 10677, + "_VERSION": 10678, + ".Xtra": 10679, + "Person": 10680, + "rb": 10681, + "LOB": 10682, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĊ": 10683, + "ĠCentral": 10684, + "ICK": 10685, + "raq": 10686, + "Ġputting": 10687, + "Ġmd": 10688, + "ĠLove": 10689, + "Program": 10690, + "Border": 10691, + "oor": 10692, + "Ġallowing": 10693, + "after": 10694, + "Ġentries": 10695, + "ĠMaybe": 10696, + "]).": 10697, + "ĠShort": 10698, + ")\\": 10699, + ".now": 10700, + "friend": 10701, + "Ġprefer": 10702, + "ĠGPIO": 10703, + "osis": 10704, + "ĠGameObject": 10705, + "Ġskip": 10706, + "Ġcompetition": 10707, + "_match": 10708, + "lications": 10709, + "_CONT": 10710, + ".groupBox": 10711, + "Ġals": 10712, + "\"We": 10713, + "_eq": 10714, + "lan": 10715, + "_search": 10716, + "ĠMusic": 10717, + "asis": 10718, + "Ġbind": 10719, + "ĠIsland": 10720, + "rum": 10721, + "(E": 10722, + "Ġseat": 10723, + "Video": 10724, + "Ġack": 10725, + "reek": 10726, + "={()": 10727, + "Ġrating": 10728, + "Ġrestaurant": 10729, + "DEX": 10730, + "(buf": 10731, + "pping": 10732, + "uality": 10733, + "Ġleague": 10734, + "Ġfocused": 10735, + "apon": 10736, + "$data": 10737, + "CLUD": 10738, + "CLUDING": 10739, + "Ġabsolute": 10740, + "(query": 10741, + "Ġtells": 10742, + "Ang": 10743, + "Ġcommunities": 10744, + "Ġhonest": 10745, + "oking": 10746, + "Ġapart": 10747, + "arity": 10748, + "/$": 10749, + "_module": 10750, + "ĠEnc": 10751, + ".an": 10752, + ".Config": 10753, + "Cre": 10754, + "Ġshock": 10755, + "ĠArab": 10756, + "IENT": 10757, + "/re": 
10758, + "Ġretrie": 10759, + "ycler": 10760, + "isa": 10761, + "ĠOrgan": 10762, + ".graph": 10763, + "Ġí": 10764, + "ĠBAS": 10765, + "Enum": 10766, + "Ġpossibly": 10767, + "ÑĢаÐ": 10768, + "ĠJapanese": 10769, + "Ġcraft": 10770, + "ĠPlace": 10771, + "Ġtalent": 10772, + "Ġfunding": 10773, + "Ġconfirmed": 10774, + "Ġcycle": 10775, + "/x": 10776, + "GE": 10777, + "Ġhearing": 10778, + "Ġplants": 10779, + "Ġmouth": 10780, + "pages": 10781, + "oria": 10782, + "ĠRemove": 10783, + "_total": 10784, + "Ġod": 10785, + "ollapse": 10786, + "door": 10787, + "Ġbought": 10788, + "Ġaddr": 10789, + "ARCH": 10790, + "_dim": 10791, + "dden": 10792, + "Ġdecades": 10793, + "REQUEST": 10794, + "Ġversions": 10795, + "fire": 10796, + "Ġmoves": 10797, + "fb": 10798, + "Ġcoffee": 10799, + ".connect": 10800, + "ĠRow": 10801, + "Ġschema": 10802, + "Scope": 10803, + "-Type": 10804, + "Ġfighting": 10805, + "Ġretail": 10806, + "Ġmodified": 10807, + "TF": 10808, + "Files": 10809, + "nie": 10810, + "_command": 10811, + "stone": 10812, + "ĠÑĤ": 10813, + "_thread": 10814, + "Ġbond": 10815, + "ĠDevelopment": 10816, + "Ġpt": 10817, + "FORM": 10818, + "plet": 10819, + "Ġidentified": 10820, + "cpp": 10821, + "Ġcoding": 10822, + "oked": 10823, + "ĠMaster": 10824, + "IDTH": 10825, + "Ġresidents": 10826, + "redit": 10827, + "ĠPhoto": 10828, + "=-": 10829, + "unte": 10830, + "ateur": 10831, + "_STATE": 10832, + "ĠSing": 10833, + "Ġsheet": 10834, + ".val": 10835, + "orse": 10836, + "Ġhers": 10837, + "Ġdetermined": 10838, + "Common": 10839, + "Ġwed": 10840, + "_queue": 10841, + "PH": 10842, + "ĠAtl": 10843, + "cred": 10844, + "/LICENSE": 10845, + "Ġmes": 10846, + "Ġadvanced": 10847, + ".java": 10848, + ".Sh": 10849, + "Go": 10850, + "kill": 10851, + "fp": 10852, + "_settings": 10853, + "Ġpal": 10854, + "Ġtruck": 10855, + "Ġcombined": 10856, + "Ġ\"${": 10857, + "ĠCorpor": 10858, + "Ġjoined": 10859, + "ĠJose": 10860, + "ĠCup": 10861, + "uns": 10862, + "estival": 10863, + "levision": 10864, + "Ġbroken": 10865, + 
"Ġmarriage": 10866, + "ĠWestern": 10867, + "Ġrepresents": 10868, + "ĠTitle": 10869, + "Ġss": 10870, + ".Ass": 10871, + "ongoose": 10872, + "iento": 10873, + "<>();Ċ": 10874, + "Ġabsolutely": 10875, + "Ġsmooth": 10876, + "TERN": 10877, + "ĠUnless": 10878, + "Word": 10879, + "Ġmerge": 10880, + "igan": 10881, + "ĠVol": 10882, + "Ġnn": 10883, + ".getId": 10884, + "Ġз": 10885, + "Ġsexy": 10886, + "Ġseeking": 10887, + "Single": 10888, + ".this": 10889, + "Ġkom": 10890, + "bound": 10891, + ";\"": 10892, + "ĠfontSize": 10893, + "_df": 10894, + "Ġinjury": 10895, + "(H": 10896, + "Ġissued": 10897, + "_END": 10898, + ":self": 10899, + "Ġpatch": 10900, + "Ġleaves": 10901, + "Ġadopt": 10902, + "FileName": 10903, + "ãĢIJ": 10904, + "Ġexecutive": 10905, + "ĠByte": 10906, + "]))Ċ": 10907, + "Ġnu": 10908, + "outing": 10909, + "cluding": 10910, + "-R": 10911, + ".options": 10912, + "Ġsubstant": 10913, + "avax": 10914, + "ĠBUT": 10915, + "Ġtechnical": 10916, + "Ġtwice": 10917, + "Ġmás": 10918, + "Ġunivers": 10919, + "yr": 10920, + "Ġdrag": 10921, + "ĠDC": 10922, + "Ġsed": 10923, + "Ġbot": 10924, + "ĠPal": 10925, + "ĠHall": 10926, + "forcement": 10927, + "Ġauch": 10928, + ".mod": 10929, + "notation": 10930, + "_files": 10931, + ".line": 10932, + "_flag": 10933, + "[name": 10934, + "Ġresolution": 10935, + "Ġbott": 10936, + "(\"[": 10937, + "ende": 10938, + "(arr": 10939, + "Free": 10940, + "(@\"": 10941, + "ĠDistrict": 10942, + "PEC": 10943, + ":-": 10944, + "Picker": 10945, + "ĠJo": 10946, + "ĠĠĠĠĠĊ": 10947, + "ĠRiver": 10948, + "_rows": 10949, + "Ġhelpful": 10950, + "Ġmassive": 10951, + "---Ċ": 10952, + "Ġmeasures": 10953, + "ĠRuntime": 10954, + "Ġworry": 10955, + "ĠSpec": 10956, + "ĉD": 10957, + "ãĢij": 10958, + "Ġ){Ċ": 10959, + "Ġworse": 10960, + "(filename": 10961, + "Ġlay": 10962, + "Ġmagic": 10963, + "ĠTheir": 10964, + "oul": 10965, + "stroy": 10966, + "ĠWhere": 10967, + "Ġsudden": 10968, + "Ġdefe": 10969, + "Ġbinding": 10970, + "Ġflight": 10971, + "ĠOnInit": 10972, + "ĠWomen": 
10973, + "ĠPolicy": 10974, + "Ġdrugs": 10975, + "ishing": 10976, + "('../": 10977, + "ĠMel": 10978, + "peat": 10979, + "tor": 10980, + "Ġproposed": 10981, + "Ġstated": 10982, + "_RES": 10983, + "Ġeast": 10984, + "ĠCONDITION": 10985, + "_desc": 10986, + "Ġwinning": 10987, + "folio": 10988, + "Mapper": 10989, + "ĠPan": 10990, + "ĠAnge": 10991, + ".servlet": 10992, + "Ġcopies": 10993, + "LM": 10994, + "Ġvm": 10995, + "åį": 10996, + "Ġdictionary": 10997, + "Seg": 10998, + "elines": 10999, + "ĠSend": 11000, + "Ġiron": 11001, + "ĠFort": 11002, + ".domain": 11003, + "Ġdebate": 11004, + "NotNull": 11005, + "eq": 11006, + "acher": 11007, + "lf": 11008, + "ĉfmt": 11009, + "Ġlawy": 11010, + "ÄŁ": 11011, + "ĠMen": 11012, + "Ġtrim": 11013, + "(NULL": 11014, + "Ġ!!": 11015, + "Ġpad": 11016, + "Ġfollows": 11017, + "\"][\"": 11018, + "requ": 11019, + "ĠEp": 11020, + ".github": 11021, + "(img": 11022, + "eto": 11023, + "('\\": 11024, + "Services": 11025, + "umbnail": 11026, + "_main": 11027, + "pleted": 11028, + "fortunately": 11029, + "Ġwindows": 11030, + "Ġplane": 11031, + "ĠConnection": 11032, + ".local": 11033, + "uard": 11034, + "}\\": 11035, + "==\"": 11036, + "andon": 11037, + "ĠRoy": 11038, + "west": 11039, + "iginal": 11040, + "emies": 11041, + "itz": 11042, + "'):Ċ": 11043, + "ĠPeter": 11044, + "Ġtough": 11045, + "Ġreduced": 11046, + "Ġcalculate": 11047, + "Ġrapid": 11048, + "customer": 11049, + "Ġefficient": 11050, + "Ġmedium": 11051, + "Ġfell": 11052, + ".ref": 11053, + "ĠCas": 11054, + "Ġfeedback": 11055, + "Speed": 11056, + "(output": 11057, + "aje": 11058, + "Ġcategories": 11059, + "Ġfee": 11060, + "};": 11061, + "Ġdeleted": 11062, + "reh": 11063, + "Ġproof": 11064, + "Desc": 11065, + "Build": 11066, + "Ġsides": 11067, + ".ArrayList": 11068, + "-%": 11069, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 11070, + "ر": 11071, + ".match": 11072, + "ли": 11073, + "Ġfeels": 11074, + "Ġachieve": 11075, + "Ġclim": 11076, + "_ON": 11077, + "ĠCD": 11078, + "Ġteacher": 11079, + 
"_current": 11080, + "bn": 11081, + "_PL": 11082, + "isting": 11083, + "Enable": 11084, + "GEN": 11085, + "Ġtv": 11086, + "Ġsock": 11087, + "Ġplays": 11088, + "Ġdiscount": 11089, + "ĠKE": 11090, + "ĠDebug": 11091, + "Fore": 11092, + "ĠIraq": 11093, + "Ġappearance": 11094, + "Mon": 11095, + "Ġstyled": 11096, + "ĠHuman": 11097, + "iot": 11098, + "ĠHistory": 11099, + "Ġsac": 11100, + "ĠCollection": 11101, + "Ġrecommended": 11102, + ".Selected": 11103, + "Ġorganizations": 11104, + "Ġdiscovered": 11105, + "cohol": 11106, + "adas": 11107, + "ĠThomas": 11108, + "May": 11109, + "Ġconserv": 11110, + "Ġdomin": 11111, + "ĠFollow": 11112, + "ĠSection": 11113, + "ĠThanks": 11114, + "Username": 11115, + "Ġrecipe": 11116, + "Ġwonderful": 11117, + ".sleep": 11118, + "_if": 11119, + "ĉĊĉĊ": 11120, + "orno": 11121, + "Ġru": 11122, + "_target": 11123, + ".\"\"": 11124, + "à¦": 11125, + "EventArgs": 11126, + "Ġinputs": 11127, + "Ġfif": 11128, + "Ġvision": 11129, + "cy": 11130, + "ĠSeries": 11131, + ")(((": 11132, + "Ġtrading": 11133, + "Ġmarker": 11134, + "Begin": 11135, + "Ġtypically": 11136, + "Ġcauses": 11137, + "dropdown": 11138, + "_DEBUG": 11139, + "Ġdetect": 11140, + "country": 11141, + "!\");Ċ": 11142, + "ĉR": 11143, + "appy": 11144, + "Ġcref": 11145, + "('<": 11146, + "\"=>": 11147, + "ĠLE": 11148, + "reader": 11149, + "Ġadministr": 11150, + "õ": 11151, + "ucket": 11152, + "Ġfashion": 11153, + ".char": 11154, + "izar": 11155, + "Ġdisable": 11156, + "Ġsuc": 11157, + "ĠLive": 11158, + "issue": 11159, + "Ġmetadata": 11160, + "flags": 11161, + "ĠðŁ": 11162, + "Ġcommitted": 11163, + "Ġva": 11164, + "Ġrough": 11165, + "Ġ'''Ċ": 11166, + "Ġhighlight": 11167, + "_vars": 11168, + "VO": 11169, + "Ġencoding": 11170, + "-Z": 11171, + "_sign": 11172, + "$(\"#": 11173, + "Ġrain": 11174, + "reatest": 11175, + "ĠEND": 11176, + "Selection": 11177, + "Ġcandidates": 11178, + "Ġsav": 11179, + ".Empty": 11180, + "Ġdecisions": 11181, + "Ġcollabor": 11182, + "ridge": 11183, + "feed": 11184, + 
"ression": 11185, + "Ġpersons": 11186, + "VM": 11187, + "ega": 11188, + "_BIT": 11189, + "According": 11190, + "acked": 11191, + "Ġdollars": 11192, + "_loss": 11193, + "ĠCost": 11194, + "}\"Ċ": 11195, + "Notification": 11196, + "Ġprostit": 11197, + "Ġauthority": 11198, + ".rec": 11199, + "Ġspokes": 11200, + "ĠToday": 11201, + "istant": 11202, + "ĠHead": 11203, + "âĢĿ.": 11204, + "ertainment": 11205, + "cean": 11206, + "culate": 11207, + "Ġven": 11208, + "However": 11209, + "_arr": 11210, + "Ġtokens": 11211, + "Graph": 11212, + "ĠJud": 11213, + "ĠVirgin": 11214, + "ĠSerial": 11215, + "unning": 11216, + "Mutable": 11217, + "agers": 11218, + ".csv": 11219, + "Ġdeveloping": 11220, + "Ġinstructions": 11221, + "Ġpromise": 11222, + "Ġrequested": 11223, + "_encode": 11224, + "/\"": 11225, + "ĠIcon": 11226, + "uilt": 11227, + "-day": 11228, + "Ġintelligence": 11229, + ".IS": 11230, + "ĠObservable": 11231, + "ĠHard": 11232, + "Bool": 11233, + "idential": 11234, + ".Anchor": 11235, + "Ġselling": 11236, + "CI": 11237, + "AGES": 11238, + "tle": 11239, + "bur": 11240, + "UFFER": 11241, + "RY": 11242, + "Ġbigger": 11243, + "Ġrat": 11244, + "Ġfamous": 11245, + "Ġtypename": 11246, + "Ġexplained": 11247, + "}}Ċ": 11248, + "Ġnuclear": 11249, + "-N": 11250, + "Ġcrisis": 11251, + "ĠEnter": 11252, + "Ġanswers": 11253, + "/${": 11254, + "/pl": 11255, + "Ġsequ": 11256, + "_next": 11257, + "mask": 11258, + "Ġstanding": 11259, + "Ġplenty": 11260, + "ĠCross": 11261, + "ĉret": 11262, + "dro": 11263, + "ĠCast": 11264, + "=true": 11265, + "ĠChris": 11266, + "icio": 11267, + "ĠMike": 11268, + "Decimal": 11269, + "addComponent": 11270, + "Len": 11271, + "Ġcock": 11272, + "Ġ#{": 11273, + "URN": 11274, + "": 11403, + "Ġ*=": 11404, + "ĠPS": 11405, + "Ġdangerous": 11406, + "[p": 11407, + "OME": 11408, + "Other": 11409, + "ĠStringBuilder": 11410, + "Points": 11411, + "heading": 11412, + "Ġcurrency": 11413, + "Ġpercentage": 11414, + "_API": 11415, + "Ġclassic": 11416, + "thead": 11417, + "ĠMO": 11418, 
+ "FE": 11419, + "Idx": 11420, + "await": 11421, + "Ġè": 11422, + "Ġaccident": 11423, + "Ġvariant": 11424, + "Ġmyst": 11425, + "ĠLand": 11426, + "ĠBre": 11427, + "Ġharm": 11428, + "ĠAcc": 11429, + "Ġcharged": 11430, + "iones": 11431, + "Visibility": 11432, + "arry": 11433, + "ĠLanguage": 11434, + "Ġwalking": 11435, + "\".ĊĊ": 11436, + "ifer": 11437, + "Ġleadership": 11438, + ".From": 11439, + "ynam": 11440, + "Ġtimestamp": 11441, + "ipt": 11442, + "ĠHas": 11443, + "REFER": 11444, + "ĠIts": 11445, + "Ġlistener": 11446, + "UTE": 11447, + "_description": 11448, + "Ġexperiences": 11449, + "Ġcreates": 11450, + "RS": 11451, + "cart": 11452, + "black": 11453, + "Ġchoices": 11454, + "war": 11455, + "Ġ'''": 11456, + "Ġordered": 11457, + "Ġevening": 11458, + "Ġpil": 11459, + "Ġtun": 11460, + "ĠBad": 11461, + "(app": 11462, + "random": 11463, + "Ġexplicit": 11464, + "Ġarrived": 11465, + "Ġfly": 11466, + "Ġeconom": 11467, + "-mail": 11468, + "Ġlists": 11469, + "Ġarchitect": 11470, + "ĠPay": 11471, + "Ġds": 11472, + "ĠSol": 11473, + "Ġvehicles": 11474, + "Hz": 11475, + "-com": 11476, + "Ġking": 11477, + "_equal": 11478, + "ĠHelp": 11479, + "Ġabuse": 11480, + "--;Ċ": 11481, + "Ġextr": 11482, + "Ġchemical": 11483, + "ä¿": 11484, + "Ġorient": 11485, + "Ġbreath": 11486, + "ĠSpace": 11487, + "(element": 11488, + "wait": 11489, + "DED": 11490, + "igma": 11491, + "Ġentr": 11492, + "Ġsob": 11493, + "-name": 11494, + "Ġaffected": 11495, + "ika": 11496, + "Ġcoal": 11497, + "_work": 11498, + "Ġhundreds": 11499, + "Ġpolitics": 11500, + "subject": 11501, + "Ġconsumer": 11502, + "ANGE": 11503, + "Ġrepeated": 11504, + "Send": 11505, + "Ġ#[": 11506, + "Ġprotocol": 11507, + "Ġleads": 11508, + "useum": 11509, + "Every": 11510, + "Import": 11511, + "(count": 11512, + "Ġchallenges": 11513, + "Ġnovel": 11514, + "Ġdepart": 11515, + "bits": 11516, + ".Current": 11517, + "Ġ`${": 11518, + "oting": 11519, + "(\\": 11520, + "Ġcreative": 11521, + "Ġbuff": 11522, + "Ġintroduced": 11523, + "usic": 11524, + 
"modules": 11525, + "Are": 11526, + "-doc": 11527, + "language": 11528, + "_cache": 11529, + "Ġtod": 11530, + "?>": 11531, + "omething": 11532, + "Ġhun": 11533, + "åº": 11534, + "aters": 11535, + "Intent": 11536, + "Ġimplemented": 11537, + "ĠCase": 11538, + "Children": 11539, + "Ġnotification": 11540, + "Renderer": 11541, + "Wrapper": 11542, + "Objects": 11543, + "tl": 11544, + ".Contains": 11545, + "Plugin": 11546, + ".row": 11547, + "Ġforg": 11548, + "Ġpermit": 11549, + "Ġtargets": 11550, + "ĠIF": 11551, + "Ġtip": 11552, + "sex": 11553, + "Ġsupports": 11554, + "Ġfold": 11555, + "photo": 11556, + "},čĊ": 11557, + "Ġgoogle": 11558, + "$('#": 11559, + "Ġsharing": 11560, + "Ġgoods": 11561, + "vs": 11562, + "ĠDan": 11563, + "Rate": 11564, + "ĠMartin": 11565, + "Ġmanner": 11566, + "lie": 11567, + ".The": 11568, + "Internal": 11569, + "ĠCONTR": 11570, + "Mock": 11571, + "RIGHT": 11572, + "Ġ'{": 11573, + "Ġcontrols": 11574, + "Mat": 11575, + "Ġmand": 11576, + "Ġextended": 11577, + "Ok": 11578, + "Ġembed": 11579, + "Ġplanet": 11580, + "ĠNon": 11581, + "-ch": 11582, + ")\",": 11583, + "epar": 11584, + "Ġbelieved": 11585, + "ĠEnvironment": 11586, + "ĠFriend": 11587, + "-res": 11588, + "Ġhandling": 11589, + "nic": 11590, + "-level": 11591, + "scri": 11592, + "Xml": 11593, + "BE": 11594, + "ungen": 11595, + "Ġalter": 11596, + "[idx": 11597, + "Pop": 11598, + "cam": 11599, + "Ġ(((": 11600, + "Ġshipping": 11601, + "Ġbattery": 11602, + "iddleware": 11603, + "MC": 11604, + "Ġimpl": 11605, + "otation": 11606, + "ĠLab": 11607, + "