HyunWook An commited on
Commit
84b9c63
·
verified ·
1 Parent(s): 04f7514

Upload 65 files

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
config.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "princeton-nlp/Llama-3-Instruct-8B-SimPO",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 128000,
9
+ "eos_token_id": 128001,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 4096,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 14336,
14
+ "max_position_embeddings": 8192,
15
+ "model_type": "llama",
16
+ "num_attention_heads": 32,
17
+ "num_hidden_layers": 32,
18
+ "num_key_value_heads": 8,
19
+ "pretraining_tp": 1,
20
+ "rms_norm_eps": 1e-05,
21
+ "rope_scaling": null,
22
+ "rope_theta": 500000.0,
23
+ "tie_word_embeddings": false,
24
+ "torch_dtype": "float16",
25
+ "transformers_version": "4.37.2",
26
+ "use_cache": true,
27
+ "vocab_size": 128256
28
+ }
generation_config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 128000,
4
+ "eos_token_id": [
5
+ 128001,
6
+ 128009
7
+ ],
8
+ "transformers_version": "4.37.2"
9
+ }
mlc-chat-config.json ADDED
@@ -0,0 +1,79 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "llama",
3
+ "quantization": "q4f16_1",
4
+ "model_config": {
5
+ "hidden_size": 4096,
6
+ "intermediate_size": 14336,
7
+ "num_attention_heads": 32,
8
+ "num_hidden_layers": 32,
9
+ "rms_norm_eps": 1e-05,
10
+ "vocab_size": 128256,
11
+ "position_embedding_base": 500000.0,
12
+ "context_window_size": 768,
13
+ "prefill_chunk_size": 128,
14
+ "num_key_value_heads": 8,
15
+ "head_dim": 128,
16
+ "tensor_parallel_shards": 1,
17
+ "max_batch_size": 80
18
+ },
19
+ "vocab_size": 128256,
20
+ "context_window_size": 768,
21
+ "sliding_window_size": -1,
22
+ "prefill_chunk_size": 128,
23
+ "attention_sink_size": -1,
24
+ "tensor_parallel_shards": 1,
25
+ "mean_gen_len": 128,
26
+ "max_gen_len": 512,
27
+ "shift_fill_factor": 0.3,
28
+ "temperature": 0.7,
29
+ "presence_penalty": 0.0,
30
+ "frequency_penalty": 0.0,
31
+ "repetition_penalty": 1.0,
32
+ "top_p": 0.95,
33
+ "conv_template": {
34
+ "name": "llama-3",
35
+ "system_template": "<|start_header_id|>system<|end_header_id|>\n\n{system_message}",
36
+ "system_message": "Below is an instruction that describes a task, paired with an input that provides further context. Write a response that appropriately completes the request.",
37
+ "system_prefix_token_ids": [
38
+ 128000
39
+ ],
40
+ "add_role_after_system_message": true,
41
+ "roles": {
42
+ "user": "user",
43
+ "assistant": "assistant"
44
+ },
45
+ "role_templates": {
46
+ "user": "{user_message}",
47
+ "assistant": "{assistant_message}",
48
+ "tool": "{tool_message}"
49
+ },
50
+ "messages": [],
51
+ "seps": [
52
+ "<|eot_id|><|start_header_id|>"
53
+ ],
54
+ "role_content_sep": "<|end_header_id|>\n\n",
55
+ "role_empty_sep": "<|end_header_id|>\n\n",
56
+ "stop_str": [
57
+ "<|end_of_text|>",
58
+ "<|eot_id|>"
59
+ ],
60
+ "stop_token_ids": [
61
+ 128001,
62
+ 128009
63
+ ],
64
+ "function_string": "",
65
+ "use_function_calling": false
66
+ },
67
+ "pad_token_id": 0,
68
+ "bos_token_id": 128000,
69
+ "eos_token_id": [
70
+ 128001,
71
+ 128009
72
+ ],
73
+ "tokenizer_files": [
74
+ "tokenizer.json",
75
+ "tokenizer_config.json",
76
+ "special_tokens_map.json"
77
+ ],
78
+ "version": "0.1.0"
79
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71b2b81bea874c67cd70035ab1b0c909d4cd7715162850ff773cfd526ef572aa
3
+ size 262668288
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58016eafa743672da8245294c9027c539573cb01b3a39e4ca5f38df499d4cdb5
3
+ size 29360128
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb255f41a68715d5078d6a448ede696f779fe4c3344fe9d254d1b93e23f2ce6e
3
+ size 33046528
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:caa88bb8ef2b935915f07578deebc6c5fe3a1a465155b41ec334b4dfc79128d3
3
+ size 29360128
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d3ad019a3ed08b5c83356af235f35e0dd012cc475f0c1c18e577f7a60ba04c2
3
+ size 58720256
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ecc436837d96cc66a2694f6409d7fc59f85396a731ea98a47dc1e2a6b770b5c
3
+ size 22036480
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f58af2624df970fecedd7c7d4e12f0ba5de87908ca8db2dfe796ba76282640a
3
+ size 29360128
params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49dc366849f7264d6565a65933dd7d1e606c08b54000d87c7a6c0a6a636d46bd
3
+ size 58720256
params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5a67dde7a88814bdd6c0cd921377fbbfca0f273ca18c467b757e6df5e695c23
3
+ size 27271168
params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:481d2feb475ff87e6f50a10dba21651c122d1c0d1b84543283a5c810d1b8b177
3
+ size 29360128
params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9441bc61c01544934a84148cac39a3996998a366b06b749560cdc3b57ac831c1
3
+ size 30949376
params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b5b5e9d7bcf2c81547783cb456a028686a1471b98a1f4bf20cc1da477461720
3
+ size 58720256
params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20685a9b5f5dcd557c4f2390ffb5d8fe5b7aa3846309f427952329689ecd7ef4
3
+ size 32841728
params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1700dfc37086ed488e4e1ff716da499f364cbe5d445019681a95fcffb77d303
3
+ size 25174016
params_shard_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89a520af3804b29b0d914396ccff0625dab70ff14c992755b4388e6bdb8ecee0
3
+ size 29360128
params_shard_22.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4dae1096f0c2be947871199d153fc4e052a38358100bbe5fe7975dce08e3c31
3
+ size 58720256
params_shard_23.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cda0819e114ff7615866ba3c61b0d82456cd27fbaffc0a627eae01ae76ee1a1c
3
+ size 33046528
params_shard_24.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1566fa1591d117a768d1f11c993d70a7cfe2688e84c69939da7b53f677786c85
3
+ size 29360128
params_shard_25.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:202d90dfb5c531d536fcfb42e604e676e712cb51c0a6a46656be8962a67ba5c3
3
+ size 58720256
params_shard_26.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:530e7924ae108bf37a8cc818e91e84644a6273fde0fa799b67c429efdad97205
3
+ size 22036480
params_shard_27.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:853821c2fd8615efa28cd0e4f16e595b73272f5b13edc24323166e36150987ac
3
+ size 29360128
params_shard_28.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:185b77fecbbb984cb513bf8eefe58095b4e2f252b6a7469d5b3c5a3fda72534d
3
+ size 58720256
params_shard_29.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fca797a105c9c5a5364d2a2619e572cb89e876a3083d5c953af9fd912014e4ef
3
+ size 27271168
params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6acbe0aa07670be8518ae89118ddf9d67ebdd653583d5585baa8e751670919fe
3
+ size 262668288
params_shard_30.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f5a368084335a1d069e9bdfc56a0ce4709de570ed1170195f705809d8ad35bc
3
+ size 29360128
params_shard_31.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccfe2bddda560ab380d1dbb05234b8ac6e76d51021068802a59c70b47fac26e8
3
+ size 30949376
params_shard_32.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5dd116ad039ac13f30acce8279e0092c606a08178bb5ae3c5321e5e48769e9eb
3
+ size 58720256
params_shard_33.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89d73dfccee514f14af24f8fdcbf6ba64c4159f8c3fac040e3f37d02b75d8268
3
+ size 25174016
params_shard_34.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da71d2c5c25e66628c9b8950ea3edcf5f950461c3e0e4ccc02662dd4c1284a19
3
+ size 29360128
params_shard_35.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e89e2c496ca8e858ee9c647a578dd29f949e4809addec77caeff10c79474e989
3
+ size 58720256
params_shard_36.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:694e1eb70416b35beac4dfa3dc40eb3d5331c91af6b46cd7d0294b9363206bda
3
+ size 33046528
params_shard_37.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b8b2745bdb23e7609bc7f609794f9763c05e283048ef6c18381db2e9c243ec7
3
+ size 29360128
params_shard_38.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f9a1abb082c996b27d7805b9f3b2397547c403cfd61361bc4ff70ce1f5c06cc
3
+ size 58720256
params_shard_39.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:484c7d8ba2a2dd4a3057d17781c750eb9189737fef3c2766ce76dc2a661dd1c2
3
+ size 22036480
params_shard_4.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:496edd4fcb07e1dffb30c78dc30df75dd366d523ad2a692265258fa36c4b8304
3
+ size 32833536
params_shard_40.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1128bea4eaa56bf425b13f6e006f0d994f4e211800a7d9289be2ba07469e4ab2
3
+ size 29360128
params_shard_41.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d44010d67262f3c7ef7b306d11cbb406aede2775d2dd2bccdd60220ceffef5cb
3
+ size 58720256
params_shard_42.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6cd84e4b608b8dd3a467c57a3a622bcab0c795c6c29b9e576e8f4ddcf5480855
3
+ size 27271168
params_shard_43.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03252de820c5a1c7fc4fe3a9b74bf404baf74dbba3ceb44b7bae680dad665cb4
3
+ size 29360128
params_shard_44.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:827cb9044864a9522d6e9b4736029fe2ee5edf8d8bac38c7448420028d74ad31
3
+ size 30949376
params_shard_45.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff1bc537c66e0239b4fdb663397d982cf0c77e2bd2fa3a85ff65810dcc93dc68
3
+ size 58720256
params_shard_46.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9622b4eec3515e54466cad4b204e39e0cd16eaeed270214821c96d26743ea005
3
+ size 25174016
params_shard_47.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41ec59caaae862edba397ea78d39ac39348c02865addf03e2d1cc5a95142de3c
3
+ size 29360128
params_shard_48.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1616090544e055ce3340f4cbdc7e5fc5f4bca47d6a17be757ad7d24e0753f16b
3
+ size 58720256
params_shard_49.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3ed462c407fa4969e901d68c64ef3492f46767fedec14601d845d6979739b7b
3
+ size 33046528
params_shard_5.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d044f5d1b07c78bbf58400feaa72e486bad2fabcbea3a8a68a869b84a4ee3781
3
+ size 33054720