Commit
·
1146aeb
1
Parent(s):
655777a
SLM q3f16_1 mistral v2 weights
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +42 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
- params_shard_5.bin +3 -0
- params_shard_50.bin +3 -0
- params_shard_51.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,42 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "mistral",
|
3 |
+
"quantization": "q3f16_1",
|
4 |
+
"model_config": {
|
5 |
+
"hidden_size": 4096,
|
6 |
+
"intermediate_size": 14336,
|
7 |
+
"num_attention_heads": 32,
|
8 |
+
"num_hidden_layers": 32,
|
9 |
+
"rms_norm_eps": 1e-05,
|
10 |
+
"vocab_size": 32000,
|
11 |
+
"position_embedding_base": 1000000.0,
|
12 |
+
"context_window_size": -1,
|
13 |
+
"num_key_value_heads": 8,
|
14 |
+
"head_dim": 128,
|
15 |
+
"sliding_window_size": 1024,
|
16 |
+
"prefill_chunk_size": 1024,
|
17 |
+
"attention_sink_size": 4,
|
18 |
+
"tensor_parallel_shards": 1
|
19 |
+
},
|
20 |
+
"vocab_size": 32000,
|
21 |
+
"context_window_size": -1,
|
22 |
+
"sliding_window_size": 1024,
|
23 |
+
"prefill_chunk_size": 1024,
|
24 |
+
"attention_sink_size": 4,
|
25 |
+
"tensor_parallel_shards": 1,
|
26 |
+
"mean_gen_len": 128,
|
27 |
+
"max_gen_len": 512,
|
28 |
+
"shift_fill_factor": 0.3,
|
29 |
+
"temperature": 0.7,
|
30 |
+
"repetition_penalty": 1.0,
|
31 |
+
"top_p": 0.95,
|
32 |
+
"conv_template": "mistral_default",
|
33 |
+
"pad_token_id": 0,
|
34 |
+
"bos_token_id": 1,
|
35 |
+
"eos_token_id": 2,
|
36 |
+
"tokenizer_files": [
|
37 |
+
"tokenizer.model",
|
38 |
+
"tokenizer.json",
|
39 |
+
"tokenizer_config.json"
|
40 |
+
],
|
41 |
+
"version": "0.1.0"
|
42 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:896126014aa8d1fb94d8431b5741166d004232eefd0f7df1a758cc2cfcc3e5bc
|
3 |
+
size 52736000
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29699051ae7e6aa45dc271793d79f897c31f4bda7716be62983897ebc4c7c051
|
3 |
+
size 47251456
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aff3482e5502942183c112d1c2ce9c87385cd73e28d668e6d4c1209daa450314
|
3 |
+
size 27848704
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b25c37891ce61e0e89b5d45bedce324e3bf52fbf582321cf0fb6a87571f5d5c
|
3 |
+
size 23527424
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8307790c7414157c01654e71666257ecbb349ae1385ae9312394df85469ebbfb
|
3 |
+
size 47251456
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f5aaa3d7575193dce8a564e0eed5875abe52dfb4a6d174d14d513be243200b90
|
3 |
+
size 27848704
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b3f348f7456177ebcf9295a3f144a7e323ca0a101a95d5f0440f72780b2fa52
|
3 |
+
size 23527424
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77bdf7d2ef70c14e2af3736bbb577809a2346089ca32a7e2ef91912313518e11
|
3 |
+
size 47251456
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab113df484ae322abced85a4c390bb71f2334884441b70e4c31f974a1c1cdea3
|
3 |
+
size 27848704
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95c4cade5e0ad6f78f4cc88b7397d738c3a43e44b197c00d850bd21dd8590c2d
|
3 |
+
size 23527424
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37b0ff91d9a0643e3e859ae8b09445ccdfc922252dd2d698f06e164a4a5bd74c
|
3 |
+
size 47251456
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:750e5df582f7fe9033763879a568f65a531454e0f5e676a59f120bd702fe7e97
|
3 |
+
size 27848704
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d681b2cebc8a240a98a53c044f5e763d37601d7140a404448b563c3779b3cf0
|
3 |
+
size 33068544
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee15e09003fbba39ebead9079bd1524caeb8530ff0bff6ac8411475e7dd39fef
|
3 |
+
size 23527424
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e890bcc9db8366faf696f635c58295bee97d4fa0ed62b59fbbd82bb47a94b88
|
3 |
+
size 47251456
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be5676fba4ac1645455ca65488c8820cbc367af35ba5ddd0a6e9c7e118f82d22
|
3 |
+
size 27848704
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:759da103e37f0354d5f6ae4bc286c366323321e5631a3698d5536cfdd8dff70b
|
3 |
+
size 23527424
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3a28f41bb5def29a73f604ea0cbe45aac603785fbec5d76584e663d4f568e8f
|
3 |
+
size 47251456
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50d3ef3b5dd7b16194d37ff04502a623f72b51a0fbc21837fb5715e00142f17b
|
3 |
+
size 27848704
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b83d6f9f68836148ecf210479be1c74dca7bb80466b6f910f0118105b1f85036
|
3 |
+
size 23527424
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:00ab81c60649883d5dc606afa2ea6b64076a3b569fe65653e96ba549a8b0c6d2
|
3 |
+
size 47251456
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e996574f35c4e37725ec67b0aefba7b26f71812404ecd58c8631d766857d4f70
|
3 |
+
size 27848704
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34e9c2d097975e61813d8d8c3feffe610902ba89b46485803e761efeccaa58d8
|
3 |
+
size 52736000
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df99f528c56975d7bea97a4424ace57f5459eb9d241550752dcc61e881cefe98
|
3 |
+
size 47251456
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8239fad75223099da8cfc515202031f61f2083f00d64f3573c07a48384a8064a
|
3 |
+
size 23527424
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e6e159adab96d5e2f20eacd02d349bd8b9257c3bd41db14b1c499e1154c8e9fb
|
3 |
+
size 31507968
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cdfc50c4485e8babc19c8636a7fdff7d5fbc5e4ae43888e935d7c925ff97da53
|
3 |
+
size 47251456
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:33d1ebfeab78e4c26925aa2a0a92ed670b226edb9ddb3eb965218f9f096332c4
|
3 |
+
size 23527424
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ccae87fa7c815ed458e0c36afb185f518620808158805b990251193216a3caad
|
3 |
+
size 47251456
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f5f924e73b479ff3c35cc92156c169e1a4e6f23932154a8daa18d8d83b214b7
|
3 |
+
size 30789632
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:13be28974939d6d4c97300515a0f2896e687a82a4c48010d51ca7a69a06124ea
|
3 |
+
size 47251456
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d5002c33b53b7dfbe039d795bfe9d4be5a79dea071702f3670abd2241321097
|
3 |
+
size 30806016
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8904d27f9fe60840c976fcbc05f56f57d4c529725202e4b2d1a03748651c5ea
|
3 |
+
size 23527424
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d7418af8655f68932a7a3c103952be50ac0219f5f7889336838b30d737f69658
|
3 |
+
size 47251456
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf9626d2c4b03ddcd9fa9aea0a86c41567cb8218712df057d3b86f459f8bb009
|
3 |
+
size 32391168
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a104b7b64c777aa61cfeaa7dd48eade215f13393b1dbc95c89e162731aaf2d94
|
3 |
+
size 27848704
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9dffaaad31a9ab75cc540ad26ddfa5c57dc6698d36762df8dcea6bac98906ed
|
3 |
+
size 23527424
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:089dbd9d5994c51f005a827fd5806e2223717f3e1513adb82b31632b0ee595c6
|
3 |
+
size 47251456
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c05542e44fff9848f95e4681060514306467ca95fade6fe8e56b4d01fc8808c
|
3 |
+
size 27848704
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea8270471614d7da99013dc4e319b16fdb36c72beb8d39f7323e0dd15b52fac9
|
3 |
+
size 23527424
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dea5cf5b2571d942395c5c84fe07aeeeaa4b2f5721d387d5305bbed70e7d93b2
|
3 |
+
size 47251456
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c05c686050ccd49e162d331449e1d95817d9d360850b452eb726cc7163183d7
|
3 |
+
size 27848704
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8518ec6cb2a88174cb14bddc649b7373d770ccd1e9dabd9e3ff2911ab1e42467
|
3 |
+
size 23527424
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0026ee98da4442cf5d7b2fd213831b858d0f7a28d3c1862ce1c4c3999e88eadb
|
3 |
+
size 47251456
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a3a17de1d413f1f1e2a3e5fc91c7fc343498438b1ef0a8b703b8865490b975f
|
3 |
+
size 27848704
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:81e7ab75842f9ab10c3419eb5b76581bd5ed8a7580ff10701ba15414d9ee81e8
|
3 |
+
size 23527424
|
params_shard_50.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1cda0c3fb5ebef1e4fe0a4239b6972512843b8cfa3fc72ad57bfc27436638ef
|
3 |
+
size 23527424
|
params_shard_51.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2fd30995f32ef7bf2809a11d2b28e62177774daeca0f1c44c54907e024920342
|
3 |
+
size 47251456
|