CharlieFRuan
committed on
Initial commit
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- logs.txt +0 -0
- mlc-chat-config.json +45 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,45 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "gemma",
|
3 |
+
"quantization": "q4f16_2",
|
4 |
+
"model_config": {
|
5 |
+
"hidden_size": 3072,
|
6 |
+
"hidden_act": "gelu",
|
7 |
+
"intermediate_size": 24576,
|
8 |
+
"attention_bias": false,
|
9 |
+
"num_attention_heads": 16,
|
10 |
+
"num_key_value_heads": 16,
|
11 |
+
"head_dim": 256,
|
12 |
+
"num_hidden_layers": 28,
|
13 |
+
"rms_norm_eps": 1e-06,
|
14 |
+
"vocab_size": 256000,
|
15 |
+
"position_embedding_base": 10000.0,
|
16 |
+
"context_window_size": 8192,
|
17 |
+
"prefill_chunk_size": 1024,
|
18 |
+
"tensor_parallel_shards": 1,
|
19 |
+
"max_batch_size": 80
|
20 |
+
},
|
21 |
+
"vocab_size": 256000,
|
22 |
+
"context_window_size": 8192,
|
23 |
+
"sliding_window_size": -1,
|
24 |
+
"prefill_chunk_size": 1024,
|
25 |
+
"attention_sink_size": -1,
|
26 |
+
"tensor_parallel_shards": 1,
|
27 |
+
"mean_gen_len": 128,
|
28 |
+
"max_gen_len": 512,
|
29 |
+
"shift_fill_factor": 0.3,
|
30 |
+
"temperature": 0.7,
|
31 |
+
"presence_penalty": 0.0,
|
32 |
+
"frequency_penalty": 0.0,
|
33 |
+
"repetition_penalty": 1.0,
|
34 |
+
"top_p": 0.95,
|
35 |
+
"conv_template": "gemma_instruction",
|
36 |
+
"pad_token_id": 0,
|
37 |
+
"bos_token_id": 2,
|
38 |
+
"eos_token_id": 1,
|
39 |
+
"tokenizer_files": [
|
40 |
+
"tokenizer.model",
|
41 |
+
"tokenizer.json",
|
42 |
+
"tokenizer_config.json"
|
43 |
+
],
|
44 |
+
"version": "0.1.0"
|
45 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2be3ee8010ace2bde14cf19c7a0c3d397674fcea96fcc119fbe99953b4cae48
|
3 |
+
size 1572864000
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1130e8379c29a56b5a289edf23afeec60cdf83512da0593e790aa798d7ae3dc9
|
3 |
+
size 37748736
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f3f9db02b424a1ccbd92c2fc01a87c95b122c17aaf59004ec2f893b21d3d90c
|
3 |
+
size 33036288
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9aa21f13a894b702c59937a05e6b83e0f6e358d52cce578c96d13dd79e00436b
|
3 |
+
size 9443328
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59297604658d9fa9f1f8bcc7eed56e54aa8981e29b7d747651df4f2b478c1e6c
|
3 |
+
size 37748736
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd0bd536fda772360147b772bd3a9b6836fe45cb4e5a110f7b86cbffbd3a3096
|
3 |
+
size 75497472
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:807bdd15b8ca0129540899a1de88480e1b64d020c2c63d280039608887903d9a
|
3 |
+
size 18874368
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df6dd10a388de0ab97b3c043e424af075ee172567f2bdb1f96aa03d00579198e
|
3 |
+
size 37748736
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38cbc36412114da71ff5bdd784b5f0e1d57689d7519b15898d25cc3888dec22c
|
3 |
+
size 33048576
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48fbdf889c5ee4e89dcb3b33beb45e9b3019617f922c295c8612f5f45726f8ac
|
3 |
+
size 75497472
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7448c32ebb87c890b18b588a3ad3c305fb66f9ddf8fdba43c43227d6197e8f9c
|
3 |
+
size 33036288
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4108c883194ab76ccd70e963dd14418d7e5e33ea0fa2b5616b578c7d6a65e3c
|
3 |
+
size 37748736
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d2d60ae458a820ac2dde3f442d458d3552adac3731f3c5e75f061cc6245a75c
|
3 |
+
size 75497472
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:553080c976a8468517c9f06e6c035ca3f3b68f6c3aaac235cfbe73fcadf16e83
|
3 |
+
size 75497472
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:531a609e9dc02757ce53fec738c3e7b8f12ef9205e6548c913562edeaa3aecc9
|
3 |
+
size 18874368
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23c9478746b4feabf637b811db11088a6b8c855628f603d961eb2690e8868247
|
3 |
+
size 18874368
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91d5d8f50d0f4309e6906c2bd6ae3b1fa86b5615b5db115bad32314ba43df8da
|
3 |
+
size 33042432
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8599169bd17e3095a177cf05d96d86e472249aa058c59d35c91fe909b94009a8
|
3 |
+
size 37748736
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34fdb2537192ba739166ece5d7695f96a940d3c1564ac282af8a788e7581c5f0
|
3 |
+
size 75497472
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dba18757f53eefd093f080bcb30b7afa1092f2931ca6f4dc4c23bed1d9c33c05
|
3 |
+
size 18874368
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:291d6a41614312eaa844e9fa7ce52bd018962d6e3eec7af408b3ed309d9c16a8
|
3 |
+
size 37748736
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6cfcddc2f290888b15ad9b14b1b10ba93889dac5637c362242eb84133687dc9e
|
3 |
+
size 33048576
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d73dffcae5e9bcaabf34f9465b54959977ea41aaaebb27ce729dbe924ed3dc8
|
3 |
+
size 75497472
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c19aa092779aafdfba7cafcf8e24b70b9e23c88259ab2b91740caa42f29e9304
|
3 |
+
size 33036288
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f10fafe09f63759cc53b3b83abcde4f716af9de131d864b49b7974a2b204d2f
|
3 |
+
size 33042432
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:150bb445e889c925d7eadb1e6b975362b7968b66a660d1a0f330ba10c95dcb30
|
3 |
+
size 37748736
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d1f0386c951611d32ecda6d1b36c60381008d1dea6069b324d4567173f3e51d
|
3 |
+
size 75497472
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0ed96eff1ce914f186a5f594265d6dc5148a5313da5ba16a06a78d45b32f3c4
|
3 |
+
size 18874368
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1a3ea6fa19cb638779b88bafbbf847e20fe483be748ae0e9b68e56a59652d25
|
3 |
+
size 37748736
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eea2140ead27b51198278e5819b066f27b7b034c47de4bab31b9fb41a1bfbc52
|
3 |
+
size 33048576
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9ffa916390f369f3cb1b3a12336e7714b863f3f16d8bfe6cd7f57bb46cf96e70
|
3 |
+
size 75497472
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c7efecdf8ab91ba9c32d9a4ca1bcfd4d8de25e8ba5c02d84cad55b4b827bec7
|
3 |
+
size 33036288
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f2e653776cca4a23d2367670fa8cff166b477c484689b6ea36e2c7ac0c64713
|
3 |
+
size 37748736
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53cd3e101842ebadfdab1b30265552a614acc7bec06cd5352ecead7f59e19a39
|
3 |
+
size 75497472
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48c5af22911f517a2cbd165fafb7f3160e40a1330534ae67c3f0fc2cae4f61cc
|
3 |
+
size 18874368
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77593eebcd962899109606c50fcda0019e61c12e5a3474a8158846591bf492f7
|
3 |
+
size 37748736
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f7be00114495a52b47588322a466efcc0900556657c9ab9b35ee286d9883129
|
3 |
+
size 18874368
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a0a6975701fc96a491c99fa51ece10784f6899742b706d69cc468d2a9823aa2
|
3 |
+
size 33042432
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:637939823a230ef21fc7b5ebd18ce05ac6900cde40cbb3cb2def9be9c1e2e7df
|
3 |
+
size 37748736
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e693c2d4b821ac6f163e994fa9b6cc865556ee01ae41b6afdf71365b4c0fdf7d
|
3 |
+
size 75497472
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a415aa114a25783b2f25f4036348117c9d436fcdef24ab6a93907172a4c328cc
|
3 |
+
size 37748736
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34c7894fdbaac395327e0f62465b7eede0938dbc237207dcf8fac32676a51433
|
3 |
+
size 75497472
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c2011a35ff794f4802cfb00e4131ce8517cfd3ddbcee14cc84f32173151416d
|
3 |
+
size 28329984
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2b7d16f0667098db8b87028ee0a7247a3852cf677e042cbffdcdbce563aca6a
|
3 |
+
size 30676992
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8884497c3a114ffead54f5bc535b3b41e3bd79a14cc614fc5beb47b9028899e2
|
3 |
+
size 37748736
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45af7e9eee2f4ddbc86b59a9ebd808d41f54bb90b87c3b1aa859ab36c5dc0ad3
|
3 |
+
size 75497472
|