vinaykudari committed on
Commit
b912c63
·
1 Parent(s): 2dbc97b

Training in progress, step 500

Browse files
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "gpt2",
3
+ "activation_function": "gelu_new",
4
+ "architectures": [
5
+ "GPT2LMHeadModel"
6
+ ],
7
+ "attn_pdrop": 0.1,
8
+ "bos_token_id": 50256,
9
+ "embd_pdrop": 0.1,
10
+ "eos_token_id": 50256,
11
+ "initializer_range": 0.02,
12
+ "layer_norm_epsilon": 1e-05,
13
+ "model_type": "gpt2",
14
+ "n_ctx": 1024,
15
+ "n_embd": 768,
16
+ "n_head": 12,
17
+ "n_inner": null,
18
+ "n_layer": 12,
19
+ "n_positions": 1024,
20
+ "reorder_and_upcast_attn": false,
21
+ "resid_pdrop": 0.1,
22
+ "scale_attn_by_inverse_layer_idx": false,
23
+ "scale_attn_weights": true,
24
+ "summary_activation": null,
25
+ "summary_first_dropout": 0.1,
26
+ "summary_proj_to_labels": true,
27
+ "summary_type": "cls_index",
28
+ "summary_use_proj": true,
29
+ "task_specific_params": {
30
+ "text-generation": {
31
+ "do_sample": true,
32
+ "max_length": 50
33
+ }
34
+ },
35
+ "torch_dtype": "float32",
36
+ "transformers_version": "4.17.0",
37
+ "use_cache": true,
38
+ "vocab_size": 50257
39
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:967aa3adeb6c2278995f5d81c13dcb560ff4b65eef999ba0a997f575d0690d08
3
+ size 510407137
runs/Mar20_03-17-29_n99c63u8p2/1647746284.4905019/events.out.tfevents.1647746284.n99c63u8p2.16833.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d0901fc8750c15d81d1b81c6696380286571a1cc128b98afdef0ac3920fdb45
3
+ size 4749
runs/Mar20_03-17-29_n99c63u8p2/events.out.tfevents.1647746284.n99c63u8p2.16833.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42d06cc95f86fb79a3b4fdfa799d23df0d3aa10420d80f723fed92c13fd2fe62
3
+ size 3526
runs/Mar20_03-18-57_n99c63u8p2/1647746345.9307137/events.out.tfevents.1647746345.n99c63u8p2.16833.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:911a509790a3682e0a1ed10b8bf92cb5ceab941542994ce77f9060e4514e79a9
3
+ size 4749
runs/Mar20_03-18-57_n99c63u8p2/events.out.tfevents.1647746345.n99c63u8p2.16833.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6de0bd5fcd1e1084184fc670d749cf72a4363e0599ee8b8cbbef60ca1b302d33
3
+ size 3526
runs/Mar20_03-20-42_n99c63u8p2/1647746448.1405928/events.out.tfevents.1647746448.n99c63u8p2.19487.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e0d6673860a78d10dadc551821de67479cf9ec6916ad5b00f1ba2b28698afb4
3
+ size 4749
runs/Mar20_03-20-42_n99c63u8p2/events.out.tfevents.1647746448.n99c63u8p2.19487.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fca4640b844f42409cb582e4bca1b298be35ab19256007e93867722dc6f9330d
3
+ size 3526
runs/Mar20_03-21-46_n99c63u8p2/1647746511.6691816/events.out.tfevents.1647746511.n99c63u8p2.19487.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a851ce915f7ebdd2685340e380cf773d2c41828324456d0b4f709d972a5e0c85
3
+ size 4749
runs/Mar20_03-21-46_n99c63u8p2/events.out.tfevents.1647746511.n99c63u8p2.19487.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:973686fc54c578f03a97e5c11f75e7590372f792707a90cde30cb76c1fe9e87c
3
+ size 3526
runs/Mar20_11-40-58_nondbhztcd/1647776466.7901292/events.out.tfevents.1647776466.nondbhztcd.172.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df933948f6b4d0ce54912de8a53eb5b89efd17c173032497a4188f390db8d373
3
+ size 4749
runs/Mar20_11-40-58_nondbhztcd/events.out.tfevents.1647776466.nondbhztcd.172.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27e17354a6eba9e4fe1e12c9cfe5ede0bb30c75493466b37b0a617396b27b631
3
+ size 3683
runs/Mar20_11-48-46_nondbhztcd/1647776934.6408741/events.out.tfevents.1647776934.nondbhztcd.172.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c754bc37a6bc03d842bc44a00823f1ecadf6028f0accae51213b3c1a5c56cc30
3
+ size 4749
runs/Mar20_11-48-46_nondbhztcd/events.out.tfevents.1647776934.nondbhztcd.172.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca89badbcd78921c5e6df66bc4684fa5576fa51bcaa185fc8a56bbc6fbb5c88f
3
+ size 40
runs/Mar20_11-50-31_nondbhztcd/1647777038.7619252/events.out.tfevents.1647777038.nondbhztcd.2851.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4dc796d79090601c38b45cc3b02422cb97f3eaf35405567007992a9453a990f
3
+ size 4749
runs/Mar20_11-50-31_nondbhztcd/events.out.tfevents.1647777038.nondbhztcd.2851.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4cd2c1f688d133f52cfbc3504bb33495c0cfda709e13d00c34246b98823f84c
3
+ size 3683
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b7f22f8e863e569f089a8f3c9b3a187897ccdff622337d2f707b55f49d0c62f
3
+ size 2991