Pclanglais committed on
Commit
183204e
·
verified ·
1 Parent(s): 8498d33

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -16,14 +16,14 @@
16
  "final_logit_softcapping": null,
17
  "head_dim": 256,
18
  "hidden_activation": "gelu_pytorch_tanh",
19
- "hidden_size": 3840,
20
  "initializer_range": 0.02,
21
- "intermediate_size": 15360,
22
  "max_position_embeddings": 131072,
23
  "model_type": "gemma3_text",
24
- "num_attention_heads": 16,
25
- "num_hidden_layers": 48,
26
- "num_key_value_heads": 8,
27
  "query_pre_attn_scalar": 256,
28
  "rms_norm_eps": 1e-06,
29
  "rope_local_base_freq": 10000.0,
 
16
  "final_logit_softcapping": null,
17
  "head_dim": 256,
18
  "hidden_activation": "gelu_pytorch_tanh",
19
+ "hidden_size": 2560,
20
  "initializer_range": 0.02,
21
+ "intermediate_size": 10240,
22
  "max_position_embeddings": 131072,
23
  "model_type": "gemma3_text",
24
+ "num_attention_heads": 8,
25
+ "num_hidden_layers": 34,
26
+ "num_key_value_heads": 4,
27
  "query_pre_attn_scalar": 256,
28
  "rms_norm_eps": 1e-06,
29
  "rope_local_base_freq": 10000.0,
pytorch_model-00001-of-00002.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebc619193af0adb330a24d1a8ad15a02804901c28c400d16b3196453a4c4802d
3
+ size 4961401164
pytorch_model-00002-of-00002.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe3bc6f1c25dd067395ff32d242019f91fad7e1394f8af04347e68c65086790f
3
+ size 3639086221
pytorch_model.bin.index.json CHANGED
The diff for this file is too large to render. See raw diff