Commit
·
b912c63
1
Parent(s):
2dbc97b
Training in progress, step 500
Browse files- .gitignore +1 -0
- config.json +39 -0
- pytorch_model.bin +3 -0
- runs/Mar20_03-17-29_n99c63u8p2/1647746284.4905019/events.out.tfevents.1647746284.n99c63u8p2.16833.1 +3 -0
- runs/Mar20_03-17-29_n99c63u8p2/events.out.tfevents.1647746284.n99c63u8p2.16833.0 +3 -0
- runs/Mar20_03-18-57_n99c63u8p2/1647746345.9307137/events.out.tfevents.1647746345.n99c63u8p2.16833.3 +3 -0
- runs/Mar20_03-18-57_n99c63u8p2/events.out.tfevents.1647746345.n99c63u8p2.16833.2 +3 -0
- runs/Mar20_03-20-42_n99c63u8p2/1647746448.1405928/events.out.tfevents.1647746448.n99c63u8p2.19487.1 +3 -0
- runs/Mar20_03-20-42_n99c63u8p2/events.out.tfevents.1647746448.n99c63u8p2.19487.0 +3 -0
- runs/Mar20_03-21-46_n99c63u8p2/1647746511.6691816/events.out.tfevents.1647746511.n99c63u8p2.19487.3 +3 -0
- runs/Mar20_03-21-46_n99c63u8p2/events.out.tfevents.1647746511.n99c63u8p2.19487.2 +3 -0
- runs/Mar20_11-40-58_nondbhztcd/1647776466.7901292/events.out.tfevents.1647776466.nondbhztcd.172.1 +3 -0
- runs/Mar20_11-40-58_nondbhztcd/events.out.tfevents.1647776466.nondbhztcd.172.0 +3 -0
- runs/Mar20_11-48-46_nondbhztcd/1647776934.6408741/events.out.tfevents.1647776934.nondbhztcd.172.3 +3 -0
- runs/Mar20_11-48-46_nondbhztcd/events.out.tfevents.1647776934.nondbhztcd.172.2 +3 -0
- runs/Mar20_11-50-31_nondbhztcd/1647777038.7619252/events.out.tfevents.1647777038.nondbhztcd.2851.1 +3 -0
- runs/Mar20_11-50-31_nondbhztcd/events.out.tfevents.1647777038.nondbhztcd.2851.0 +3 -0
- training_args.bin +3 -0
.gitignore
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
checkpoint-*/
|
config.json
ADDED
@@ -0,0 +1,39 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "gpt2",
|
3 |
+
"activation_function": "gelu_new",
|
4 |
+
"architectures": [
|
5 |
+
"GPT2LMHeadModel"
|
6 |
+
],
|
7 |
+
"attn_pdrop": 0.1,
|
8 |
+
"bos_token_id": 50256,
|
9 |
+
"embd_pdrop": 0.1,
|
10 |
+
"eos_token_id": 50256,
|
11 |
+
"initializer_range": 0.02,
|
12 |
+
"layer_norm_epsilon": 1e-05,
|
13 |
+
"model_type": "gpt2",
|
14 |
+
"n_ctx": 1024,
|
15 |
+
"n_embd": 768,
|
16 |
+
"n_head": 12,
|
17 |
+
"n_inner": null,
|
18 |
+
"n_layer": 12,
|
19 |
+
"n_positions": 1024,
|
20 |
+
"reorder_and_upcast_attn": false,
|
21 |
+
"resid_pdrop": 0.1,
|
22 |
+
"scale_attn_by_inverse_layer_idx": false,
|
23 |
+
"scale_attn_weights": true,
|
24 |
+
"summary_activation": null,
|
25 |
+
"summary_first_dropout": 0.1,
|
26 |
+
"summary_proj_to_labels": true,
|
27 |
+
"summary_type": "cls_index",
|
28 |
+
"summary_use_proj": true,
|
29 |
+
"task_specific_params": {
|
30 |
+
"text-generation": {
|
31 |
+
"do_sample": true,
|
32 |
+
"max_length": 50
|
33 |
+
}
|
34 |
+
},
|
35 |
+
"torch_dtype": "float32",
|
36 |
+
"transformers_version": "4.17.0",
|
37 |
+
"use_cache": true,
|
38 |
+
"vocab_size": 50257
|
39 |
+
}
|
pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:967aa3adeb6c2278995f5d81c13dcb560ff4b65eef999ba0a997f575d0690d08
|
3 |
+
size 510407137
|
runs/Mar20_03-17-29_n99c63u8p2/1647746284.4905019/events.out.tfevents.1647746284.n99c63u8p2.16833.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d0901fc8750c15d81d1b81c6696380286571a1cc128b98afdef0ac3920fdb45
|
3 |
+
size 4749
|
runs/Mar20_03-17-29_n99c63u8p2/events.out.tfevents.1647746284.n99c63u8p2.16833.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42d06cc95f86fb79a3b4fdfa799d23df0d3aa10420d80f723fed92c13fd2fe62
|
3 |
+
size 3526
|
runs/Mar20_03-18-57_n99c63u8p2/1647746345.9307137/events.out.tfevents.1647746345.n99c63u8p2.16833.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:911a509790a3682e0a1ed10b8bf92cb5ceab941542994ce77f9060e4514e79a9
|
3 |
+
size 4749
|
runs/Mar20_03-18-57_n99c63u8p2/events.out.tfevents.1647746345.n99c63u8p2.16833.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6de0bd5fcd1e1084184fc670d749cf72a4363e0599ee8b8cbbef60ca1b302d33
|
3 |
+
size 3526
|
runs/Mar20_03-20-42_n99c63u8p2/1647746448.1405928/events.out.tfevents.1647746448.n99c63u8p2.19487.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e0d6673860a78d10dadc551821de67479cf9ec6916ad5b00f1ba2b28698afb4
|
3 |
+
size 4749
|
runs/Mar20_03-20-42_n99c63u8p2/events.out.tfevents.1647746448.n99c63u8p2.19487.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fca4640b844f42409cb582e4bca1b298be35ab19256007e93867722dc6f9330d
|
3 |
+
size 3526
|
runs/Mar20_03-21-46_n99c63u8p2/1647746511.6691816/events.out.tfevents.1647746511.n99c63u8p2.19487.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a851ce915f7ebdd2685340e380cf773d2c41828324456d0b4f709d972a5e0c85
|
3 |
+
size 4749
|
runs/Mar20_03-21-46_n99c63u8p2/events.out.tfevents.1647746511.n99c63u8p2.19487.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:973686fc54c578f03a97e5c11f75e7590372f792707a90cde30cb76c1fe9e87c
|
3 |
+
size 3526
|
runs/Mar20_11-40-58_nondbhztcd/1647776466.7901292/events.out.tfevents.1647776466.nondbhztcd.172.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df933948f6b4d0ce54912de8a53eb5b89efd17c173032497a4188f390db8d373
|
3 |
+
size 4749
|
runs/Mar20_11-40-58_nondbhztcd/events.out.tfevents.1647776466.nondbhztcd.172.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:27e17354a6eba9e4fe1e12c9cfe5ede0bb30c75493466b37b0a617396b27b631
|
3 |
+
size 3683
|
runs/Mar20_11-48-46_nondbhztcd/1647776934.6408741/events.out.tfevents.1647776934.nondbhztcd.172.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c754bc37a6bc03d842bc44a00823f1ecadf6028f0accae51213b3c1a5c56cc30
|
3 |
+
size 4749
|
runs/Mar20_11-48-46_nondbhztcd/events.out.tfevents.1647776934.nondbhztcd.172.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca89badbcd78921c5e6df66bc4684fa5576fa51bcaa185fc8a56bbc6fbb5c88f
|
3 |
+
size 40
|
runs/Mar20_11-50-31_nondbhztcd/1647777038.7619252/events.out.tfevents.1647777038.nondbhztcd.2851.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4dc796d79090601c38b45cc3b02422cb97f3eaf35405567007992a9453a990f
|
3 |
+
size 4749
|
runs/Mar20_11-50-31_nondbhztcd/events.out.tfevents.1647777038.nondbhztcd.2851.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4cd2c1f688d133f52cfbc3504bb33495c0cfda709e13d00c34246b98823f84c
|
3 |
+
size 3683
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b7f22f8e863e569f089a8f3c9b3a187897ccdff622337d2f707b55f49d0c62f
|
3 |
+
size 2991
|