PyTorch
Safetensors
gemma
DNA
biology
genomics
longchen0421 committed on
Commit
84ee74a
·
verified ·
1 Parent(s): 9182be2

Upload 8 files

Browse files
Files changed (5) hide show
  1. README.md +2 -2
  2. config.json +15 -11
  3. generation_config.json +2 -0
  4. model.safetensors +2 -2
  5. pytorch_model.bin +2 -2
README.md CHANGED
@@ -38,7 +38,7 @@ Here is a simple code for inference:
38
  from transformers import AutoModelForCausalLM, AutoTokenizer
39
  import torch
40
 
41
- model_name = 'plant-dnabert-6mer'
42
  # load model and tokenizer
43
  model = AutoModelForCausalLM.from_pretrained(f'zhangtaolab/{model_name}', trust_remote_code=True)
44
  tokenizer = AutoTokenizer.from_pretrained(f'zhangtaolab/{model_name}', trust_remote_code=True)
@@ -71,4 +71,4 @@ Detailed training procedure can be found in our manuscript.
71
 
72
 
73
  #### Hardware
74
- Model was pre-trained on a NVIDIA RTX4090 GPU (24 GB).
 
38
  from transformers import AutoModelForCausalLM, AutoTokenizer
39
  import torch
40
 
41
+ model_name = 'plant-dnagemma-6mer'
42
  # load model and tokenizer
43
  model = AutoModelForCausalLM.from_pretrained(f'zhangtaolab/{model_name}', trust_remote_code=True)
44
  tokenizer = AutoTokenizer.from_pretrained(f'zhangtaolab/{model_name}', trust_remote_code=True)
 
71
 
72
 
73
  #### Hardware
74
+ Model was pre-trained on an NVIDIA RTX4090 GPU (24 GB).
config.json CHANGED
@@ -1,25 +1,29 @@
1
  {
2
- "_name_or_path": "../model/PlantDna_BERT_6mer",
3
  "architectures": [
4
- "BertForMaskedLM"
5
  ],
6
- "attention_probs_dropout_prob": 0.1,
7
- "classifier_dropout": null,
8
- "hidden_act": "gelu",
9
- "hidden_dropout_prob": 0.1,
 
 
 
10
  "hidden_size": 768,
11
  "initializer_range": 0.02,
12
  "intermediate_size": 3072,
13
- "layer_norm_eps": 1e-12,
14
- "max_position_embeddings": 512,
15
- "model_type": "bert",
16
  "num_attention_heads": 12,
17
  "num_hidden_layers": 12,
 
18
  "pad_token_id": 0,
19
- "position_embedding_type": "absolute",
 
 
20
  "torch_dtype": "float32",
21
  "transformers_version": "4.39.1",
22
- "type_vocab_size": 2,
23
  "use_cache": true,
24
  "vocab_size": 4107
25
  }
 
1
  {
2
+ "_name_or_path": "Plant_DNAGemma",
3
  "architectures": [
4
+ "GemmaForCausalLM"
5
  ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 2,
9
+ "eos_token_id": 1,
10
+ "head_dim": 256,
11
+ "hidden_act": "gelu_pytorch_tanh",
12
+ "hidden_activation": "gelu_pytorch_tanh",
13
  "hidden_size": 768,
14
  "initializer_range": 0.02,
15
  "intermediate_size": 3072,
16
+ "max_position_embeddings": 1024,
17
+ "model_type": "gemma",
 
18
  "num_attention_heads": 12,
19
  "num_hidden_layers": 12,
20
+ "num_key_value_heads": 1,
21
  "pad_token_id": 0,
22
+ "rms_norm_eps": 1e-06,
23
+ "rope_scaling": null,
24
+ "rope_theta": 10000.0,
25
  "torch_dtype": "float32",
26
  "transformers_version": "4.39.1",
 
27
  "use_cache": true,
28
  "vocab_size": 4107
29
  }
generation_config.json CHANGED
@@ -1,5 +1,7 @@
1
  {
2
  "_from_model_config": true,
 
 
3
  "pad_token_id": 0,
4
  "transformers_version": "4.39.1"
5
  }
 
1
  {
2
  "_from_model_config": true,
3
+ "bos_token_id": 0,
4
+ "eos_token_id": 0,
5
  "pad_token_id": 0,
6
  "transformers_version": "4.39.1"
7
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3b5b40af2672337c6e25fde42af91a23fb3e4b37c03a349dd0392e6c4f2dfbf3
3
- size 356828260
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c5437fe24770e71d4a8f4e3eedb4ef0f7309b9fbb96696e2f35bdc12fb121cf
3
+ size 597811128
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2a0e12c47d51f3d2556da5976710c4c2fc05010a1677b147c1f561587df75af9
3
- size 356871026
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1db4c29e12eef1f8e56e52f7d79f14c7ea92bc5c1c2f9f737d66e0dffb1aa1f
3
+ size 597834498