Upload folder using huggingface_hub
Browse files — This view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +83 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,83 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "llama",
|
4 |
+
"quantization": "q0f16",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 4096,
|
7 |
+
"intermediate_size": 14336,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"rms_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 128256,
|
12 |
+
"tie_word_embeddings": false,
|
13 |
+
"position_embedding_base": 500000.0,
|
14 |
+
"rope_scaling": {
|
15 |
+
"factor": 8.0,
|
16 |
+
"low_freq_factor": 1.0,
|
17 |
+
"high_freq_factor": 4.0,
|
18 |
+
"original_max_position_embeddings": 8192,
|
19 |
+
"rope_type": "llama3"
|
20 |
+
},
|
21 |
+
"context_window_size": 131072,
|
22 |
+
"prefill_chunk_size": 8192,
|
23 |
+
"num_key_value_heads": 8,
|
24 |
+
"head_dim": 128,
|
25 |
+
"tensor_parallel_shards": 1,
|
26 |
+
"pipeline_parallel_stages": 1,
|
27 |
+
"max_batch_size": 128,
|
28 |
+
"disaggregation": false
|
29 |
+
},
|
30 |
+
"vocab_size": 128256,
|
31 |
+
"context_window_size": 131072,
|
32 |
+
"sliding_window_size": -1,
|
33 |
+
"prefill_chunk_size": 8192,
|
34 |
+
"attention_sink_size": -1,
|
35 |
+
"tensor_parallel_shards": 1,
|
36 |
+
"pipeline_parallel_stages": 1,
|
37 |
+
"temperature": 1.0,
|
38 |
+
"presence_penalty": 0.0,
|
39 |
+
"frequency_penalty": 0.0,
|
40 |
+
"repetition_penalty": 1.0,
|
41 |
+
"top_p": 1.0,
|
42 |
+
"tokenizer_files": [
|
43 |
+
"tokenizer.json",
|
44 |
+
"tokenizer_config.json"
|
45 |
+
],
|
46 |
+
"tokenizer_info": {
|
47 |
+
"token_postproc_method": "byte_level",
|
48 |
+
"prepend_space_in_encode": false,
|
49 |
+
"strip_space_in_decode": false
|
50 |
+
},
|
51 |
+
"conv_template": {
|
52 |
+
"name": "deepseek_v3",
|
53 |
+
"system_template": "<\uff5cbegin\u2581of\u2581sentence\uff5c>{system_message}",
|
54 |
+
"system_message": "You are a helpful assistant.",
|
55 |
+
"system_prefix_token_ids": null,
|
56 |
+
"add_role_after_system_message": true,
|
57 |
+
"roles": {
|
58 |
+
"user": "<\uff5cUser\uff5c>",
|
59 |
+
"assistant": "<\uff5cAssistant\uff5c>"
|
60 |
+
},
|
61 |
+
"role_templates": {
|
62 |
+
"user": "{user_message}",
|
63 |
+
"assistant": "{assistant_message}",
|
64 |
+
"tool": "{tool_message}"
|
65 |
+
},
|
66 |
+
"messages": [],
|
67 |
+
"seps": [
|
68 |
+
"",
|
69 |
+
"<\uff5cend\u2581of\u2581sentence\uff5c>"
|
70 |
+
],
|
71 |
+
"role_content_sep": "",
|
72 |
+
"role_empty_sep": "",
|
73 |
+
"stop_str": [],
|
74 |
+
"stop_token_ids": [
|
75 |
+
128001
|
76 |
+
],
|
77 |
+
"function_string": "",
|
78 |
+
"use_function_calling": false
|
79 |
+
},
|
80 |
+
"pad_token_id": 0,
|
81 |
+
"bos_token_id": 128000,
|
82 |
+
"eos_token_id": 128001
|
83 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2e70bd89f9121fe29d269b61c297574e3e7f17a40bdda8f0d331a16a4b22830
|
3 |
+
size 1050673152
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a982ca1843ebb5e152ef1a3b7d7dadbe0bb053c4a082037b638f3d1e36675cfd
|
3 |
+
size 50331648
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3dc91b637dd1b3d992983d191ad7c5adc6c104b22e5dc2a4b270c8a2ae741064
|
3 |
+
size 33554432
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec697dedb89eaeefca96c48fb8d5dbb579da02b174e2b4d1dc62bb4891b15318
|
3 |
+
size 117440512
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8857854c7727bb4c1cfbd1ae64d89ef670af9f8d316d928802fee782cef89fd2
|
3 |
+
size 50331648
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f557b48341ce6becb66fcf7abe7598f02fe5296d7875ea66f989e4e689efcfda
|
3 |
+
size 33554432
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86cb769d2857ed663823d0742bff555b8a5c00d01fa45cc4a463d003d3030cce
|
3 |
+
size 234881024
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc993f29019c545b86351a704b4dada9465737a77bdfd7be499f708aa16f297f
|
3 |
+
size 117440512
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b5ac7c54962020bebf311a9bf44311ff52bfc8aea8eb372cecf3d383f6e69a6
|
3 |
+
size 50331648
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf91b046349fbfc1dc2770f0bf6f405fe5ab165fc28041df8d0cc3dd1df427ba
|
3 |
+
size 33554432
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8fbb5b0550fc9dede5c327b15df981966b4fd9239cfc9666c7a2ce89bf0b6a84
|
3 |
+
size 234881024
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45ab0b4175eb7a092938f0c538f8f88d3b7c8dade5dffecaf13b8b632a83034a
|
3 |
+
size 117440512
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a08d51c902bd213df5719dfde14d199a236ec8bcf5c3533bd51e29802523eda4
|
3 |
+
size 50331648
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e996959e084e0eed37afab7ee599d816407f1ea8b99d86e7348877da6b9e85fc
|
3 |
+
size 234881024
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:698fc5d6adce693c93c253acdb03637f95d6ed22c7ee9866409e8580c3a582ef
|
3 |
+
size 33554432
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ea8e01a83e57a3af7c89b180e2055c6e5770624fd5f2587dadfc09b39cf9356
|
3 |
+
size 234881024
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b12fdf3d80353189cfd2047d8d3f52860a68bf1c6900d329356a80b25acda272
|
3 |
+
size 117440512
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d133601d287973e87dda031e59886340723ae795972e6d0e6e113d3d66644cc1
|
3 |
+
size 50331648
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e48a2267424f15e8b76282ddeb24178f93242061ef96fd4ff2c6e5cdf92bd41a
|
3 |
+
size 33554432
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19d7936fa60aa9c131959acd853d64005f279a6925f317956832006f51c9448d
|
3 |
+
size 234881024
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0bd4d20cabbfa18dbe8533267a331c7b20903b2c829a1987f64d1bdebf3e094
|
3 |
+
size 117440512
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf395dfe73f410ee21c14dd179ad2f1e129bb63088ddc7a8f114f3a4d789c21b
|
3 |
+
size 50331648
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2100524bf19883f63e2244339f4639d4337ddcdb15cdd433855b5337f603c16
|
3 |
+
size 33554432
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:976ad24bcf7651193b213b09e38959ba37f617778eb288919823b06356aa3fd8
|
3 |
+
size 234881024
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc24d6ce95e6d4b9651652464ca5ebf7e84345f3dc504efdf1055bf97d66c9a7
|
3 |
+
size 117440512
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd83d51b9f5254a5068f81a13fc022456e58456c7359b3b11ee829b3d4f0a018
|
3 |
+
size 117440512
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0db19ea3cd2b9f700d8e21e4b54a2f78b2500dcac69f6cc191f0ffad274c5996
|
3 |
+
size 50331648
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dda9a677862851f4f346c0f93e58943695c33b97125c62f884088095d1273088
|
3 |
+
size 33554432
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d2acd8c7cc9c4cf47986172ac28ab3d53854a1053b0c468f446c9c3f179783d
|
3 |
+
size 234881024
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:94fd1029891adea05fb7ba0b65483936adbfa845054b27d4ef7f9a0ca977d93d
|
3 |
+
size 117440512
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5709b61da0a03d204b50fec34fb5db93b9f5c4b4ad80d2da249b8baa4d1fefbb
|
3 |
+
size 50331648
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bae640c1b31edc76751eb7578ce75fdccf327d8a498236ec4acdeee4941d6a1
|
3 |
+
size 33554432
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e92d3f2722ea2d4ff87f028ffa2b670891972a7f9cb33e798707e66a4a8d0d6
|
3 |
+
size 234881024
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:afecd367c55ea2d2510535fd70fc08adf226b69936af475e12392d2df742006b
|
3 |
+
size 117440512
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f99c1252ae386959e1a777d3b39f319bc12b0b4c3b3d88e3826b5e5b22166b8d
|
3 |
+
size 1050673152
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8013839d695b83cafc6b5c11c36e2fe16e7088001b3fecc1038719e39bf82e5
|
3 |
+
size 50331648
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a65804e8b07da52f092f4d552657bcf9bcb0187035f400ec6368891fc3f41834
|
3 |
+
size 532480
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d9344cd3174e2d8ee9805ee9e05927e4bdf182f649d830f18d3e0a8aa3aeed9
|
3 |
+
size 33554432
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:727d3db8eb4490553ad6ec062d97f0576e8370a490902497fd85ca76c9163ab1
|
3 |
+
size 234881024
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46af111033cff416765080d92692c3d533347c821295812f048e0b79b97ef988
|
3 |
+
size 117440512
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f16ac96e3b637457ffeec7875ca986075b4bbd26639771f6b028df33582dfd40
|
3 |
+
size 50331648
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a5a16cb638c85f1bba5ef13bf3d0556c4f6d3176e852fa6470829a06142f51d
|
3 |
+
size 33554432
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64901563ece538448531a3d96d540f070613d96fdc604a1aa1ec8abfc4da6d16
|
3 |
+
size 234881024
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3585dd3b72699ca8bff3a48add067c2250c9c3d16a7a9d778c6f51a69ed43b3f
|
3 |
+
size 33554432
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b740138a7e235e1959336fef794f1108e9945a0a1b5027e2dd662495d6bf1c5
|
3 |
+
size 117440512
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1cbf2e3d89d32042096dec056e02280b3195d36a48fc7db875e758ba665980d0
|
3 |
+
size 50331648
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3c0cc00f0a6feea602cebb38ad606801bc898b85693ddf7d49a4082a16bbd34
|
3 |
+
size 33554432
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6f8587f0e823a4e84c3d8e9f627660e2a0e698f602938e5546acfb2c3b2a21b
|
3 |
+
size 234881024
|