Treza12 committed on
Commit
40cf087
·
verified ·
1 Parent(s): 4058094

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. config.json +32 -0
  2. mergekit_moe_config.yml +24 -0
  3. model-00001-of-00076.safetensors +3 -0
  4. model-00002-of-00076.safetensors +3 -0
  5. model-00003-of-00076.safetensors +3 -0
  6. model-00004-of-00076.safetensors +3 -0
  7. model-00005-of-00076.safetensors +3 -0
  8. model-00006-of-00076.safetensors +3 -0
  9. model-00007-of-00076.safetensors +3 -0
  10. model-00008-of-00076.safetensors +3 -0
  11. model-00009-of-00076.safetensors +3 -0
  12. model-00010-of-00076.safetensors +3 -0
  13. model-00011-of-00076.safetensors +3 -0
  14. model-00012-of-00076.safetensors +3 -0
  15. model-00013-of-00076.safetensors +3 -0
  16. model-00014-of-00076.safetensors +3 -0
  17. model-00015-of-00076.safetensors +3 -0
  18. model-00016-of-00076.safetensors +3 -0
  19. model-00017-of-00076.safetensors +3 -0
  20. model-00018-of-00076.safetensors +3 -0
  21. model-00019-of-00076.safetensors +3 -0
  22. model-00020-of-00076.safetensors +3 -0
  23. model-00021-of-00076.safetensors +3 -0
  24. model-00022-of-00076.safetensors +3 -0
  25. model-00023-of-00076.safetensors +3 -0
  26. model-00024-of-00076.safetensors +3 -0
  27. model-00025-of-00076.safetensors +3 -0
  28. model-00026-of-00076.safetensors +3 -0
  29. model-00027-of-00076.safetensors +3 -0
  30. model-00028-of-00076.safetensors +3 -0
  31. model-00029-of-00076.safetensors +3 -0
  32. model-00030-of-00076.safetensors +3 -0
  33. model-00031-of-00076.safetensors +3 -0
  34. model-00032-of-00076.safetensors +3 -0
  35. model-00033-of-00076.safetensors +3 -0
  36. model-00034-of-00076.safetensors +3 -0
  37. model-00035-of-00076.safetensors +3 -0
  38. model-00036-of-00076.safetensors +3 -0
  39. model-00037-of-00076.safetensors +3 -0
  40. model-00038-of-00076.safetensors +3 -0
  41. model-00039-of-00076.safetensors +3 -0
  42. model-00040-of-00076.safetensors +3 -0
  43. model-00041-of-00076.safetensors +3 -0
  44. model-00042-of-00076.safetensors +3 -0
  45. model-00043-of-00076.safetensors +3 -0
  46. model-00044-of-00076.safetensors +3 -0
  47. model-00045-of-00076.safetensors +3 -0
  48. model-00046-of-00076.safetensors +3 -0
  49. model-00047-of-00076.safetensors +3 -0
  50. model-00048-of-00076.safetensors +3 -0
config.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "BioMistral/BioMistral-7B",
3
+ "architectures": [
4
+ "MixtralForCausalLM"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 1,
8
+ "eos_token_id": 2,
9
+ "head_dim": 128,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 4096,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 14336,
14
+ "max_position_embeddings": 32768,
15
+ "model_type": "mixtral",
16
+ "num_attention_heads": 32,
17
+ "num_experts_per_tok": 2,
18
+ "num_hidden_layers": 32,
19
+ "num_key_value_heads": 8,
20
+ "num_local_experts": 6,
21
+ "output_router_logits": false,
22
+ "rms_norm_eps": 1e-05,
23
+ "rope_theta": 10000.0,
24
+ "router_aux_loss_coef": 0.001,
25
+ "router_jitter_noise": 0.0,
26
+ "sliding_window": null,
27
+ "tie_word_embeddings": false,
28
+ "torch_dtype": "bfloat16",
29
+ "transformers_version": "4.45.0.dev0",
30
+ "use_cache": false,
31
+ "vocab_size": 32000
32
+ }
mergekit_moe_config.yml ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ base_model: BioMistral/BioMistral-7B
2
+ gate_mode: approach # FIXME: "approach" is not a valid gate mode; must be one of "hidden", "cheap_embed", or "random"
3
+ dtype: bfloat16 # output dtype (float32, float16, or bfloat16)
4
+ ## (optional)
5
+ # experts_per_token: 2
6
+ experts:
7
+ - source_model: Treza12/BioMistral-Unsloth-Full-Class-0
8
+ positive_prompts:
9
+ - "This is a prompt that is demonstrative of what expert model excels at Screening"
10
+ - source_model: Treza12/BioMistral-Unsloth-Full-Class-1
11
+ positive_prompts:
12
+ - "This is a prompt that is demonstrative of what expert model excels at Diagnosis"
13
+ - source_model: Treza12/BioMistral-Unsloth-Full-Class-2
14
+ positive_prompts:
15
+ - "This is a prompt that is demonstrative of what expert model excels at Staging"
16
+ - source_model: Treza12/BioMistral-Unsloth-Full-Class-33
17
+ positive_prompts:
18
+ - "This is a prompt that is demonstrative of what expert model excels at Treatment Selection"
19
+ - source_model: Treza12/BioMistral-Unsloth-Full-Class-44
20
+ positive_prompts:
21
+ - "This is a prompt that is demonstrative of what expert model excels at Prognosis"
22
+ - source_model: Treza12/BioMistral-Unsloth-Full-Class-55
23
+ positive_prompts:
24
+ - "This is a prompt that is demonstrative of what expert model excels at Follow-up"
model-00001-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91ead4371615d6120af855b56d5fbc085864f702074411a15664c4c42e82af33
3
+ size 933250496
model-00002-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0d4d7cd024ac318815693c08887ca48253876f45575869772ca52b3b44247eb
3
+ size 939525160
model-00003-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65e5a2cac3ae6408e514143aed8b9979a9a860d7365dbb84e3f6e6e38c0023bd
3
+ size 905987672
model-00004-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66f3a2f1242b25eeeb769ca813dfc1931445536dd0e0981529bb6e72607f44e3
3
+ size 939525160
model-00005-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a89c6c10cc21d2e21488eb6b601a650ec0627fbfcc1b9dc203f01f5b5f5d4bdb
3
+ size 989865456
model-00006-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e92bfc592bcede6a67caf1059f375d812a189f29c89e63f3db6065de9403359
3
+ size 973088024
model-00007-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89d50c8f664ac664ce6ddc7b70cbfcb52060f9a9c2d3838208beaadf78ba1610
3
+ size 939525160
model-00008-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29160e7dea4917b11299a327145b8a43082dfd4cb1801fa27c8c2c1af1ea0791
3
+ size 905987672
model-00009-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81c8003fd7dd8ab66ecab91ac6d39039c9c211f823c8647872b5b18c93cb9c65
3
+ size 939525160
model-00010-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccc8d88f913ddc06abfd8c1cd7d146daec41b4f9e2b373859b024b0c95c536d4
3
+ size 905987672
model-00011-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf6b3c99a0e209d9621bcfc6ad7199c96103150a10cb068f12ece4cdc9c3fc59
3
+ size 939525160
model-00012-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11cad6bc9a179993d6f1d9ac5e16f663aa6595ab38a86744706aa20cc7c56b78
3
+ size 989865456
model-00013-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e9f3724b48f6a65357afdb3c62c7df7b974dc59b266163683e8381d9b6ecb46
3
+ size 973088024
model-00014-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57ac0b575b1a73651ddd97b1619d33fd21c81378a64ebea2bd05fe4829ba31d7
3
+ size 939525160
model-00015-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0acdd8e8fc838d30d098f6a75ceaf61a8ff1054a73d2e6043c62534507cafe9f
3
+ size 905987672
model-00016-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a685716f55fdc0aba72726e5167ee48754f85a30bf21c9f6d90cd729651e3a2
3
+ size 939525160
model-00017-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c1d42ff2a85aeec129480eb46c058f6db0f0b9bab89a34a0febbf5c8ff0525e
3
+ size 905987672
model-00018-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85fd961d540f452fe711611b2a220d79f0f01ba18782ae58e752aae6cddd5ef3
3
+ size 939525160
model-00019-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72d9d79f352719850f6b8167a9450c5537a5840194d4b19914b753129ebb4a29
3
+ size 989865456
model-00020-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08072cd2d481473e36438c1bf906089bcca9c0f8fc177cc67ab95e259309678e
3
+ size 973088024
model-00021-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da7ddb64133c485f98dad821a2b52d1f3a2d4dead62f0045e45badf95b7a1097
3
+ size 939525160
model-00022-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71abb29f14ca3249fe14c0fde0334c8ebbae1d47d79a592ebdcdbda1da7e4231
3
+ size 905987672
model-00023-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d02454e082e19ee8ffb7f30cdd8a5fa273f983d90a5bec4b5fa5b7c403421425
3
+ size 939525160
model-00024-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b70275bfbfab64851d8b56121e79824cfa9922758cc2854d6a9d0d2b7201074d
3
+ size 905987680
model-00025-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7ce71d246e86ce7d7fdef0f321d72dfd4cbd036fc1a1ad7da5ac924845e81fe
3
+ size 939525168
model-00026-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98b3f3b5655f89c16dee1c4ad3be2f6027d8a250541e3335a8979f90e644f080
3
+ size 989865472
model-00027-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfee08194746c7ab2f2007213a262e266867d5cfc0348f3e909b3c4c6a186127
3
+ size 973088032
model-00028-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1fa81df29c115db28f06c5c5ddd129b01226f1f448137b51f4bcf734d841217e
3
+ size 939525168
model-00029-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b3988cff065d937d71d692fd4ee5712fc9ec6cab7325980f6d112aa0453dc16
3
+ size 905987688
model-00030-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3bd27b8f737fa87e8e72aaab7c86a9b5e0ef8d1eacee27aa4d2edfd358fbce1
3
+ size 939525168
model-00031-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c88588dcbca86c53e1f83769dc56a4a1595fb90e4debf9c19db834ff96f173cf
3
+ size 905987688
model-00032-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bbd5990a0323dea879332fb0892b1a196c765d0c8c3528527cb4bb0c2a5c54e
3
+ size 939525168
model-00033-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3784183831745c071e899b91b574ba558e964a27ef4b1b217d9b639bfa9a5a85
3
+ size 989865472
model-00034-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75d0425ed2787f478b9f1f1c0fd229532630f436accad2256b1a9227200145ad
3
+ size 973088032
model-00035-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76fd6aa7c5d98f43bcb4f4d3ad856e13507b44717b47fe4d5e639a9a3bb2964a
3
+ size 939525168
model-00036-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a7e58a871e8a311dcb48be1c7790d421dc01663e056fe436cbb11d74bbccdd3
3
+ size 905987688
model-00037-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04070baacc8c4ce3fea847ad2c33cab71d9bbe8d3d7a14e855152b6d5f8b6785
3
+ size 939525168
model-00038-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1537f637b2d50e849b4ea1001d4d2d4a73fa3855cd051b2d2caac15cfe40102
3
+ size 905987688
model-00039-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:008f0c1177748eb3d3dedbc5883b59eac8e657f8ae04aabee2bf4e151c9ba3d0
3
+ size 939525168
model-00040-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6752493394d4806a3e6991d7b37aa8bd710c34589f2b41dde4fcc66d2c9642b3
3
+ size 989865472
model-00041-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08d4c17eae6b6f1986329183f59b50005336ea95664e3b7611235d8b4710fbaf
3
+ size 973088032
model-00042-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6e7c0a7be81a164e5f7eb6cc4fbf6deaef85bc5682f174cc9a7dfbcf334db36
3
+ size 939525168
model-00043-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5623622857e6ccda9a5224c7731967db4451056941224d7a2b6219b6021b8e96
3
+ size 905987688
model-00044-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da91e47bd130cda91a37219ff917d53a41ebb22c2e580e516b18ebc4b480b1e2
3
+ size 939525168
model-00045-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84077a7940c09951e75d5a93712ec75bd7c488856270d2f33b83640b6b9c8cee
3
+ size 905987688
model-00046-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4956c32302b0917115035225f3a364d9ba12236cea1f849ec0b44cd449f03af7
3
+ size 939525168
model-00047-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4ae6ee0845d986578cb065688fe54eb44da5d901ada02945eef3133ce206562
3
+ size 989865472
model-00048-of-00076.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2148a81110bb7302e328541ee061c24fe77d0e32f7227883aa1c4803aa122366
3
+ size 973088032