Upload LlamaForCausalLM
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +29 -0
- generation_config.json +8 -0
- model-00001-of-00106.safetensors +3 -0
- model-00002-of-00106.safetensors +3 -0
- model-00003-of-00106.safetensors +3 -0
- model-00004-of-00106.safetensors +3 -0
- model-00005-of-00106.safetensors +3 -0
- model-00006-of-00106.safetensors +3 -0
- model-00007-of-00106.safetensors +3 -0
- model-00008-of-00106.safetensors +3 -0
- model-00009-of-00106.safetensors +3 -0
- model-00010-of-00106.safetensors +3 -0
- model-00011-of-00106.safetensors +3 -0
- model-00012-of-00106.safetensors +3 -0
- model-00013-of-00106.safetensors +3 -0
- model-00014-of-00106.safetensors +3 -0
- model-00015-of-00106.safetensors +3 -0
- model-00016-of-00106.safetensors +3 -0
- model-00017-of-00106.safetensors +3 -0
- model-00018-of-00106.safetensors +3 -0
- model-00019-of-00106.safetensors +3 -0
- model-00020-of-00106.safetensors +3 -0
- model-00021-of-00106.safetensors +3 -0
- model-00022-of-00106.safetensors +3 -0
- model-00023-of-00106.safetensors +3 -0
- model-00024-of-00106.safetensors +3 -0
- model-00025-of-00106.safetensors +3 -0
- model-00026-of-00106.safetensors +3 -0
- model-00027-of-00106.safetensors +3 -0
- model-00028-of-00106.safetensors +3 -0
- model-00029-of-00106.safetensors +3 -0
- model-00030-of-00106.safetensors +3 -0
- model-00031-of-00106.safetensors +3 -0
- model-00032-of-00106.safetensors +3 -0
- model-00033-of-00106.safetensors +3 -0
- model-00034-of-00106.safetensors +3 -0
- model-00035-of-00106.safetensors +3 -0
- model-00036-of-00106.safetensors +3 -0
- model-00037-of-00106.safetensors +3 -0
- model-00038-of-00106.safetensors +3 -0
- model-00039-of-00106.safetensors +3 -0
- model-00040-of-00106.safetensors +3 -0
- model-00041-of-00106.safetensors +3 -0
- model-00042-of-00106.safetensors +3 -0
- model-00043-of-00106.safetensors +3 -0
- model-00044-of-00106.safetensors +3 -0
- model-00045-of-00106.safetensors +3 -0
- model-00046-of-00106.safetensors +3 -0
- model-00047-of-00106.safetensors +3 -0
- model-00048-of-00106.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,29 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "./merged3",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 2,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 8192,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 28672,
|
14 |
+
"max_position_embeddings": 4096,
|
15 |
+
"model_type": "llama",
|
16 |
+
"num_attention_heads": 64,
|
17 |
+
"num_hidden_layers": 140,
|
18 |
+
"num_key_value_heads": 8,
|
19 |
+
"pad_token_id": 0,
|
20 |
+
"pretraining_tp": 1,
|
21 |
+
"rms_norm_eps": 1e-05,
|
22 |
+
"rope_scaling": null,
|
23 |
+
"rope_theta": 10000.0,
|
24 |
+
"tie_word_embeddings": false,
|
25 |
+
"torch_dtype": "float32",
|
26 |
+
"transformers_version": "4.36.2",
|
27 |
+
"use_cache": false,
|
28 |
+
"vocab_size": 32000
|
29 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 1,
|
4 |
+
"eos_token_id": 2,
|
5 |
+
"pad_token_id": 0,
|
6 |
+
"transformers_version": "4.36.2",
|
7 |
+
"use_cache": false
|
8 |
+
}
|
model-00001-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e3d02ed1178dcb478b46bfaafcfa15f479525264384c4abd269543192973f4e
|
3 |
+
size 4806739440
|
model-00002-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c86dfdd3d2cd005d6317a62ed780925fc0f8f0c4d891d051ea3a2faf76772ef6
|
3 |
+
size 4630578440
|
model-00003-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c68b3ac8eb5b33ad7e3f95dc4e2ed6aa957d1f744c72e99516d8f6d64a6e427e
|
3 |
+
size 4362142864
|
model-00004-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e70647db6a35e43000cf15380bf695d07d3fad5c21b37f40e0c734c43b903d5
|
3 |
+
size 4966188864
|
model-00005-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97fe33ff1b3415106e59e0def9a8fa44b1835d33ae7292825e9e3022cee021d2
|
3 |
+
size 4362142864
|
model-00006-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5ac33ed4b0c30dd2b1e63b31b30f8a97dadae2ad5004bd38d28c4f6918e3e6c
|
3 |
+
size 4362142864
|
model-00007-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2291a5e7ec507dda1db8ba0a3c0283974cf23c6bca5bc651d3fd3a27182f09d4
|
3 |
+
size 4966188864
|
model-00008-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d8bce52a82b0aada352eb0c919bdd1e515d599bf008ac4645b29651da7c8739
|
3 |
+
size 4362142880
|
model-00009-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a791e5ea49f14d30d9640a29ff65a82b6c6880d008136d2509cff3c4abfe722
|
3 |
+
size 4362142872
|
model-00010-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8094e42cc998daa13a13dea3e0e811a8398074d43d06a747f2722e98b6e0da01
|
3 |
+
size 4966188880
|
model-00011-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:462539a05f8ccc64d3468d6f83c5a1bd4180a0b88816b750243dcf87cc10718a
|
3 |
+
size 4362142872
|
model-00012-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9921a70ce4cd1c68935afad9a1dafab6bcea1caf0b8b028a99bf9b33a7dfa226
|
3 |
+
size 4362142872
|
model-00013-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d270424f967098636d380c77df0f67476b7f6539897b1677282f17f883d79b21
|
3 |
+
size 4966188880
|
model-00014-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9260cde85a374cf62f1c4507baf02d7423669e0c466f988bad74fcb44157fdca
|
3 |
+
size 4362142872
|
model-00015-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c579b083ca734d4fea6a399ae413928162f723cf3479311ba64045677a22987e
|
3 |
+
size 4362142872
|
model-00016-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90d0eefc9cb11eba17d2937f1a3794394b717d8b111eb35533cac914d3f5e83c
|
3 |
+
size 4966188880
|
model-00017-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:453462f72541378743e47ecf4e07ac5102c217c364494b1de0b4dca46ef75e9d
|
3 |
+
size 4362142872
|
model-00018-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e53b08f4b761076b6aa413e43e5b988b765cf0d46d45c49371e110f13f5f037b
|
3 |
+
size 4362142872
|
model-00019-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65096c7783b957e40a03daeeb079a642f4c7ab62e3df92d07fca6a96bdf4861d
|
3 |
+
size 4966188880
|
model-00020-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:806a9eb3da6a1882f5a43b86a2eab21a4592c987dbbe99df64e09f522925fbe2
|
3 |
+
size 4362142872
|
model-00021-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ee3c8546a50a9cecf187451590d5b1aca7009a5bd9364cfa87a5b8ddfdb4022
|
3 |
+
size 4362142872
|
model-00022-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7c148533588907213221a276b4d673af8a97b94f5786a6fb4c038cbc39f701c
|
3 |
+
size 4966188880
|
model-00023-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d322bb8653aa4929901b9119dfa0fdcd6633b05d0741b48213c6612e57b76b7
|
3 |
+
size 4362142872
|
model-00024-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3fb7fee679e4b646fce7df478858f7cb7570357ac81ad946564158b2833db3b1
|
3 |
+
size 4362142872
|
model-00025-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2ad5ee15cee34e13106d7addc028405e72ce167032f88efbea995877017118c
|
3 |
+
size 4966188880
|
model-00026-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f5c5ad57fb921e16d18be91deb9a01f9ed89cc515af0be9dcd13f3c0946e7c2
|
3 |
+
size 4362142872
|
model-00027-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1861787259cdb9cf0dbb1cbc2dd907567655ab7dd22e146306ce1fde51ef09a1
|
3 |
+
size 4362142872
|
model-00028-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:919ac271a48742cd63d8e334d4639a2b6affaa8abf1230af44d0ae98928baf7c
|
3 |
+
size 4966188880
|
model-00029-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68f62e4e0b70a2b6c0c8dc0821b9640e2058eadd2518061b70e31af35e2c677d
|
3 |
+
size 4362142872
|
model-00030-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65fa1210cf65d43c47df0d41188e276190fb3b8f1656654fc01225c9e68a54f1
|
3 |
+
size 4362142872
|
model-00031-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1477296b0c43aa6f94b6419cf648d905695f3b02cca451f6760e88f63cd92f7b
|
3 |
+
size 4966188880
|
model-00032-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d527dce5cddc274ac42d91f883b894624d01fa682792bf6901648b8d2d973e59
|
3 |
+
size 4362142872
|
model-00033-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e54efdcf7bec565248080ccbda1629aeb0d2e4085985d996fd622e4fefb83e5
|
3 |
+
size 4362142872
|
model-00034-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:12eff68e1ab5553881a1129f5921dc53c1131bf2ae3a335b989ccddb2ab032bd
|
3 |
+
size 4966188880
|
model-00035-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22c7ebabe895a7ca100fd97d6f339b7ab5ca67c4fed03a3c69659bd6a31b0747
|
3 |
+
size 4362142872
|
model-00036-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3963ca58c8343fd096240ab13c9c6a044d1f8f63518ae00eaacd4b49d35cfb66
|
3 |
+
size 4362142872
|
model-00037-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf995ee0ccd594e56e321f6527c35d6022b6613fd0244d46299d8484296cd358
|
3 |
+
size 4966188880
|
model-00038-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab2f4957ba21721580beab6aad3d05f8a113198943fac833e66bf38c555265bb
|
3 |
+
size 4362142872
|
model-00039-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82fb192e9cafc7e970dc44f6f3b639414113068b7172e3981708a7027537db34
|
3 |
+
size 4362142872
|
model-00040-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff283f4e5f9c8da8a8c43023cce34503f6fad46e7a4e38b53bf92c5be96819da
|
3 |
+
size 4966188880
|
model-00041-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3234a503a9f6bf7e1383f2aab2ea7657ba6da313ec27412c8de6f209fc6314fa
|
3 |
+
size 4362142872
|
model-00042-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4634579c66f12c0eadf748242e5fd02d5668f3ff0cb757b377d10eecafa63c5
|
3 |
+
size 4362142872
|
model-00043-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd898142c17a32a31ac8c1af864937596bba7f085452e3205243d208f04258fb
|
3 |
+
size 4966188880
|
model-00044-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4c8e07789b06e9648062dcf04f7d3202818692cb042c35e8f3f3306cf913276
|
3 |
+
size 4362142872
|
model-00045-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec51be1731eaa80ed1dfb08746e5c1ee7c4f7f51a1ab155333d85a676018db1f
|
3 |
+
size 4362142872
|
model-00046-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f426cc6d0dd49bf68eeabe99bc21a89f77fd630acb1ffc0d9baffc70798ee5eb
|
3 |
+
size 4966188880
|
model-00047-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63faef73302257485978506e6108c4084e086c198b751bc9b609e0ea1f7f046d
|
3 |
+
size 4362142872
|
model-00048-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7974ed8f4bd10765391d6c0592e23784bad0cc115a129b6cbd046bb71f2433b
|
3 |
+
size 4362142872
|