Mohit1Kulkarni committed on
Commit
1c95f70
·
1 Parent(s): e19e1a5

Training in progress epoch 0

Browse files
README.md CHANGED
@@ -1,6 +1,6 @@
1
  ---
2
  license: apache-2.0
3
- base_model: distilgpt2
4
  tags:
5
  - generated_from_keras_callback
6
  model-index:
@@ -13,10 +13,10 @@ probably proofread and complete it, then remove this comment. -->
13
 
14
  # Mohit1Kulkarni/My-Science-LLM
15
 
16
- This model is a fine-tuned version of [distilgpt2](https://huggingface.co/distilgpt2) on an unknown dataset.
17
  It achieves the following results on the evaluation set:
18
- - Train Loss: 1.9337
19
- - Epoch: 1
20
 
21
  ## Model description
22
 
@@ -42,8 +42,7 @@ The following hyperparameters were used during training:
42
 
43
  | Train Loss | Epoch |
44
  |:----------:|:-----:|
45
- | 2.0504 | 0 |
46
- | 1.9337 | 1 |
47
 
48
 
49
  ### Framework versions
 
1
  ---
2
  license: apache-2.0
3
+ base_model: Mohit1Kulkarni/My-Science-LLM
4
  tags:
5
  - generated_from_keras_callback
6
  model-index:
 
13
 
14
  # Mohit1Kulkarni/My-Science-LLM
15
 
16
+ This model is a fine-tuned version of [Mohit1Kulkarni/My-Science-LLM](https://huggingface.co/Mohit1Kulkarni/My-Science-LLM) on an unknown dataset.
17
  It achieves the following results on the evaluation set:
18
+ - Train Loss: 1.8569
19
+ - Epoch: 0
20
 
21
  ## Model description
22
 
 
42
 
43
  | Train Loss | Epoch |
44
  |:----------:|:-----:|
45
+ | 1.8569 | 0 |
 
46
 
47
 
48
  ### Framework versions
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "[PAD]": 50257
3
+ }
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "distilgpt2",
3
  "_num_labels": 1,
4
  "activation_function": "gelu_new",
5
  "architectures": [
 
1
  {
2
+ "_name_or_path": "Mohit1Kulkarni/My-Science-LLM",
3
  "_num_labels": 1,
4
  "activation_function": "gelu_new",
5
  "architectures": [
special_tokens_map.json CHANGED
@@ -1,5 +1,12 @@
1
  {
2
  "bos_token": "<|endoftext|>",
3
  "eos_token": "<|endoftext|>",
 
 
 
 
 
 
 
4
  "unk_token": "<|endoftext|>"
5
  }
 
1
  {
2
  "bos_token": "<|endoftext|>",
3
  "eos_token": "<|endoftext|>",
4
+ "pad_token": {
5
+ "content": "[PAD]",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false
10
+ },
11
  "unk_token": "<|endoftext|>"
12
  }
tf_model.h5 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e3f15f1767c2d685f317bb14aee812b6ada4ec06d487ea51da5189c9a28b4f6c
3
  size 327745472
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c6f6fd0d1df51bbe430b367ce1ffb8cb0eacfa4be859c888d7611733927f28b
3
  size 327745472
tokenizer.json CHANGED
@@ -11,6 +11,15 @@
11
  "rstrip": false,
12
  "normalized": true,
13
  "special": true
 
 
 
 
 
 
 
 
 
14
  }
15
  ],
16
  "normalizer": null,
 
11
  "rstrip": false,
12
  "normalized": true,
13
  "special": true
14
+ },
15
+ {
16
+ "id": 50257,
17
+ "content": "[PAD]",
18
+ "single_word": false,
19
+ "lstrip": false,
20
+ "rstrip": false,
21
+ "normalized": false,
22
+ "special": true
23
  }
24
  ],
25
  "normalizer": null,
tokenizer_config.json CHANGED
@@ -8,12 +8,21 @@
8
  "rstrip": false,
9
  "single_word": false,
10
  "special": true
 
 
 
 
 
 
 
 
11
  }
12
  },
13
  "bos_token": "<|endoftext|>",
14
  "clean_up_tokenization_spaces": true,
15
  "eos_token": "<|endoftext|>",
16
  "model_max_length": 1024,
 
17
  "tokenizer_class": "GPT2Tokenizer",
18
  "unk_token": "<|endoftext|>"
19
  }
 
8
  "rstrip": false,
9
  "single_word": false,
10
  "special": true
11
+ },
12
+ "50257": {
13
+ "content": "[PAD]",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
  }
20
  },
21
  "bos_token": "<|endoftext|>",
22
  "clean_up_tokenization_spaces": true,
23
  "eos_token": "<|endoftext|>",
24
  "model_max_length": 1024,
25
+ "pad_token": "[PAD]",
26
  "tokenizer_class": "GPT2Tokenizer",
27
  "unk_token": "<|endoftext|>"
28
  }