Training in progress, step 5
Browse files
config.json
CHANGED
@@ -1,12 +1,12 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "
|
3 |
"activation_function": "silu",
|
4 |
"architectures": [
|
5 |
-
"
|
6 |
],
|
7 |
"attention_dropout": 0.0,
|
8 |
"auto_map": {
|
9 |
-
"AutoConfig": "
|
10 |
"AutoModelForCausalLM": "LGAI-EXAONE/EXAONE-3.5-2.4B-Instruct--modeling_exaone.ExaoneForCausalLM",
|
11 |
"AutoModelForSequenceClassification": "LGAI-EXAONE/EXAONE-3.5-2.4B-Instruct--modeling_exaone.ExaoneForSequenceClassification"
|
12 |
},
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "/home/edgeai/DeepSpeedExamples/training/autotuning/hf/gpt2-large/saved_based_exaone_block1024_Batch1_Rank28_last_layer_save/",
|
3 |
"activation_function": "silu",
|
4 |
"architectures": [
|
5 |
+
"ExaoneTDForCausalLM"
|
6 |
],
|
7 |
"attention_dropout": 0.0,
|
8 |
"auto_map": {
|
9 |
+
"AutoConfig": "configuration_exaone.ExaoneConfig",
|
10 |
"AutoModelForCausalLM": "LGAI-EXAONE/EXAONE-3.5-2.4B-Instruct--modeling_exaone.ExaoneForCausalLM",
|
11 |
"AutoModelForSequenceClassification": "LGAI-EXAONE/EXAONE-3.5-2.4B-Instruct--modeling_exaone.ExaoneForSequenceClassification"
|
12 |
},
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f53877b20fc544d4ec0d5a09ec23349d6f195b9358d77ef06509e66544e87340
|
3 |
+
size 634692008
|
runs/Mar04_15-52-58_bizon3/events.out.tfevents.1741132410.bizon3.1838119.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1987fda8d5cbaaa38c42b7c6b6c880904adab46117b53c4494e349fcd5235d4e
|
3 |
+
size 11835
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a2527c1ee0e66a904e5ddce5d19da8d9d4794a90739f95e50ea8f7412e23c33f
|
3 |
+
size 7480
|