Training in progress, step 3050
Browse files
- adapter_model.safetensors +1 -1
- metrics.json +1 -0
- state.json +18 -3
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 35668592
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9ed692ae9066b81d1913846a8c6f7abfb91f6009fa8af2889c897a3849545166
|
3 |
size 35668592
|
metrics.json
CHANGED
@@ -58,3 +58,4 @@
|
|
58 |
{"Step":2900,"eval_loss":1.7579619884,"eval_runtime":29.3692,"eval_samples_per_second":3.405,"eval_steps_per_second":0.443,"epoch":2.2780832679}
|
59 |
{"Step":2950,"eval_loss":1.7549589872,"eval_runtime":29.4284,"eval_samples_per_second":3.398,"eval_steps_per_second":0.442,"epoch":2.3173605656}
|
60 |
{"Step":3000,"eval_loss":1.7528626919,"eval_runtime":29.4272,"eval_samples_per_second":3.398,"eval_steps_per_second":0.442,"epoch":2.3566378633}
|
|
|
|
58 |
{"Step":2900,"eval_loss":1.7579619884,"eval_runtime":29.3692,"eval_samples_per_second":3.405,"eval_steps_per_second":0.443,"epoch":2.2780832679}
|
59 |
{"Step":2950,"eval_loss":1.7549589872,"eval_runtime":29.4284,"eval_samples_per_second":3.398,"eval_steps_per_second":0.442,"epoch":2.3173605656}
|
60 |
{"Step":3000,"eval_loss":1.7528626919,"eval_runtime":29.4272,"eval_samples_per_second":3.398,"eval_steps_per_second":0.442,"epoch":2.3566378633}
|
61 |
+
{"Step":3050,"eval_loss":1.7513557673,"eval_runtime":29.577,"eval_samples_per_second":3.381,"eval_steps_per_second":0.44,"epoch":2.395915161}
|
state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 2.356637863315004,
|
5 |
"eval_steps": 50,
|
6 |
-
"global_step": 3000,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -892,6 +892,21 @@
|
|
892 |
"eval_samples_per_second": 3.398,
|
893 |
"eval_steps_per_second": 0.442,
|
894 |
"step": 2950
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
895 |
}
|
896 |
],
|
897 |
"logging_steps": 50,
|
@@ -911,7 +926,7 @@
|
|
911 |
"attributes": {}
|
912 |
}
|
913 |
},
|
914 |
-
"total_flos": 3.
|
915 |
"train_batch_size": 8,
|
916 |
"trial_name": null,
|
917 |
"trial_params": null
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 2.3959151610369207,
|
5 |
"eval_steps": 50,
|
6 |
+
"global_step": 3050,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
892 |
"eval_samples_per_second": 3.398,
|
893 |
"eval_steps_per_second": 0.442,
|
894 |
"step": 2950
|
895 |
+
},
|
896 |
+
{
|
897 |
+
"epoch": 2.356637863315004,
|
898 |
+
"grad_norm": 0.2826303541660309,
|
899 |
+
"learning_rate": 0.00011914460285132383,
|
900 |
+
"loss": 1.7356,
|
901 |
+
"step": 3000
|
902 |
+
},
|
903 |
+
{
|
904 |
+
"epoch": 2.356637863315004,
|
905 |
+
"eval_loss": 1.7528626918792725,
|
906 |
+
"eval_runtime": 29.4272,
|
907 |
+
"eval_samples_per_second": 3.398,
|
908 |
+
"eval_steps_per_second": 0.442,
|
909 |
+
"step": 3000
|
910 |
}
|
911 |
],
|
912 |
"logging_steps": 50,
|
|
|
926 |
"attributes": {}
|
927 |
}
|
928 |
},
|
929 |
+
"total_flos": 3.774020398798848e+16,
|
930 |
"train_batch_size": 8,
|
931 |
"trial_name": null,
|
932 |
"trial_params": null
|