prosecalign
/

phi3m0128-cds-0.3-kendall-onof-ofif-corr-max-2-simpo-max1500-default

Transformers

Safetensors

Generated from Trainer

llama-factory

Inference Endpoints

Model card Files Files and versions Community

ziansu committed 8 days ago

Commit

eb8b651

verified ·

1 Parent(s): 18db496

Training in progress, step 1350

Browse files

Files changed (2) hide show

adapter_model.safetensors +1 -1
trainer_log.jsonl +6 -0

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2e16912401614fd5c6a97bfbdfeb20cb10f57ee4ae97399fc5a2361241fae49c
 size 25200088

 version https://git-lfs.github.com/spec/v1
+oid sha256:b8f055b87ef70f365b91f97073ca75c2fbab086f89ab95fe7b4feff2b0947df7
 size 25200088

trainer_log.jsonl CHANGED Viewed

@@ -154,3 +154,9 @@
 {"current_steps": 1290, "total_steps": 1500, "loss": 0.3558, "accuracy": 0.8999999761581421, "learning_rate": 2.3793236883495164e-07, "epoch": 1.6374603174603175, "percentage": 86.0, "elapsed_time": "2:56:58", "remaining_time": "0:28:48", "throughput": "0.00", "total_tokens": 0}
 {"current_steps": 1300, "total_steps": 1500, "loss": 0.3516, "accuracy": 0.925000011920929, "learning_rate": 2.1613635589349756e-07, "epoch": 1.6501587301587302, "percentage": 86.67, "elapsed_time": "2:58:12", "remaining_time": "0:27:24", "throughput": "0.00", "total_tokens": 0}
 {"current_steps": 1300, "total_steps": 1500, "eval_loss": 0.30641260743141174, "epoch": 1.6501587301587302, "percentage": 86.67, "elapsed_time": "2:58:30", "remaining_time": "0:27:27", "throughput": "0.00", "total_tokens": 0}

 {"current_steps": 1290, "total_steps": 1500, "loss": 0.3558, "accuracy": 0.8999999761581421, "learning_rate": 2.3793236883495164e-07, "epoch": 1.6374603174603175, "percentage": 86.0, "elapsed_time": "2:56:58", "remaining_time": "0:28:48", "throughput": "0.00", "total_tokens": 0}
 {"current_steps": 1300, "total_steps": 1500, "loss": 0.3516, "accuracy": 0.925000011920929, "learning_rate": 2.1613635589349756e-07, "epoch": 1.6501587301587302, "percentage": 86.67, "elapsed_time": "2:58:12", "remaining_time": "0:27:24", "throughput": "0.00", "total_tokens": 0}
 {"current_steps": 1300, "total_steps": 1500, "eval_loss": 0.30641260743141174, "epoch": 1.6501587301587302, "percentage": 86.67, "elapsed_time": "2:58:30", "remaining_time": "0:27:27", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 1310, "total_steps": 1500, "loss": 0.2899, "accuracy": 0.8500000238418579, "learning_rate": 1.95342121028749e-07, "epoch": 1.6628571428571428, "percentage": 87.33, "elapsed_time": "2:59:53", "remaining_time": "0:26:05", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 1320, "total_steps": 1500, "loss": 0.3251, "accuracy": 0.9125000238418579, "learning_rate": 1.7555878527937164e-07, "epoch": 1.6755555555555555, "percentage": 88.0, "elapsed_time": "3:01:13", "remaining_time": "0:24:42", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 1330, "total_steps": 1500, "loss": 0.2771, "accuracy": 0.9624999761581421, "learning_rate": 1.567950262702714e-07, "epoch": 1.6882539682539681, "percentage": 88.67, "elapsed_time": "3:02:37", "remaining_time": "0:23:20", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 1340, "total_steps": 1500, "loss": 0.3232, "accuracy": 0.9750000238418579, "learning_rate": 1.3905907440629752e-07, "epoch": 1.700952380952381, "percentage": 89.33, "elapsed_time": "3:03:55", "remaining_time": "0:21:57", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 1350, "total_steps": 1500, "loss": 0.2938, "accuracy": 0.925000011920929, "learning_rate": 1.223587092621162e-07, "epoch": 1.7136507936507936, "percentage": 90.0, "elapsed_time": "3:05:09", "remaining_time": "0:20:34", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 1350, "total_steps": 1500, "eval_loss": 0.30637431144714355, "epoch": 1.7136507936507936, "percentage": 90.0, "elapsed_time": "3:05:28", "remaining_time": "0:20:36", "throughput": "0.00", "total_tokens": 0}