winglian committed
Commit 5e63a62 · 1 Parent(s): 7ad3972

Upload MixFormerSequentialForCausalLM

Files changed (3)
  1. config.json +5 -5
  2. generation_config.json +1 -1
  3. pytorch_model.bin +2 -2
config.json CHANGED
@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "phi-1.5-half",
+  "_name_or_path": "microsoft/phi-1_5",
   "activation_function": "gelu_new",
   "architecture": {
     "block_cls": "parallel",
@@ -12,8 +12,8 @@
     "MixFormerSequentialForCausalLM"
   ],
   "auto_map": {
-    "AutoConfig": "configuration_mixformer_sequential.MixFormerSequentialConfig",
-    "AutoModelForCausalLM": "modeling_mixformer_sequential.MixFormerSequentialForCausalLM"
+    "AutoConfig": "microsoft/phi-1_5--configuration_mixformer_sequential.MixFormerSequentialConfig",
+    "AutoModelForCausalLM": "microsoft/phi-1_5--modeling_mixformer_sequential.MixFormerSequentialForCausalLM"
   },
   "embd_layer": "default",
   "embd_pdrop": 0.0,
@@ -29,7 +29,7 @@
   "resid_pdrop": 0.0,
   "rotary_dim": 32,
   "tie_word_embeddings": false,
-  "torch_dtype": "float16",
-  "transformers_version": "4.32.1",
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.34.0.dev0",
   "vocab_size": 51200
 }
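The updated auto_map values use the "owner/repo--module.Class" form, which tells transformers to resolve the custom MixFormer code from the microsoft/phi-1_5 repository when the model is loaded with remote code enabled. A minimal loading sketch (not part of the commit; the repo id below is a placeholder, since the commit page does not name this repository):

```python
# Loading sketch only. "<this-repo-id>" is a placeholder for the repository
# this commit belongs to; it is not stated anywhere in the diff.
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

repo_id = "<this-repo-id>"  # placeholder

model = AutoModelForCausalLM.from_pretrained(
    repo_id,
    torch_dtype=torch.bfloat16,  # matches the updated "torch_dtype" in config.json
    trust_remote_code=True,      # auto_map now points at code hosted in microsoft/phi-1_5
)
tokenizer = AutoTokenizer.from_pretrained(repo_id, trust_remote_code=True)
```

Note that "torch_dtype": "bfloat16" in config.json only records the dtype the weights were saved in; passing torch_dtype explicitly at load time, as above, keeps the in-memory dtype predictable.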
generation_config.json CHANGED
@@ -1,4 +1,4 @@
 {
   "_from_model_config": true,
-  "transformers_version": "4.32.1"
+  "transformers_version": "4.34.0.dev0"
 }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a2d4c3c769ef4a9f7e1d33af3a305de5c279306829a8dd78811040a2e95d4e0c
-size 5253626297
+oid sha256:1e0e2d756e4e531f8f949541c592165b61c3b6f7ac2f556fd68f2543a8ec3fb3
+size 5253706317
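The LFS pointer file records only the object's sha256 and byte size; the weights themselves live in LFS storage. A quick local check (a sketch, not part of the repository) that a downloaded pytorch_model.bin matches the updated pointer:

```python
# Verify a downloaded pytorch_model.bin against the new LFS pointer's oid and size.
import hashlib
import os

def sha256_of(path: str, chunk_size: int = 1 << 20) -> str:
    h = hashlib.sha256()
    with open(path, "rb") as f:
        for chunk in iter(lambda: f.read(chunk_size), b""):
            h.update(chunk)
    return h.hexdigest()

path = "pytorch_model.bin"
assert os.path.getsize(path) == 5253706317
assert sha256_of(path) == "1e0e2d756e4e531f8f949541c592165b61c3b6f7ac2f556fd68f2543a8ec3fb3"
```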