Training in progress, step 696
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7de0470b200182e960f2c7a9d740b94a48436d48075f819d8b5d9aa28f2a688
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f18b8a9f70be26bd1f7ec8d62130556e601f51740adda8d52ae7d4af233a11e7
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:883c32524eb5643c0ac1e703dc1e1b4660194cde1c8bd0ac6c9809d300081125
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:efb2c9bbfbdf7659ce71cb49f1b9c4b1b5934082bead76a77f47ccd1737d45a5
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -604,3 +604,94 @@
|
|
604 |
{"current_steps": 604, "total_steps": 696, "loss": 0.4345, "lr": 5.235258128979676e-07, "epoch": 2.599713055954089, "percentage": 86.78, "elapsed_time": "3:33:33", "remaining_time": "0:32:31"}
|
605 |
{"current_steps": 605, "total_steps": 696, "loss": 0.3843, "lr": 5.124041311215544e-07, "epoch": 2.6040172166427547, "percentage": 86.93, "elapsed_time": "3:33:54", "remaining_time": "0:32:10"}
|
606 |
{"current_steps": 606, "total_steps": 696, "loss": 0.3959, "lr": 5.0139547158427e-07, "epoch": 2.6083213773314204, "percentage": 87.07, "elapsed_time": "3:34:17", "remaining_time": "0:31:49"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
604 |
{"current_steps": 604, "total_steps": 696, "loss": 0.4345, "lr": 5.235258128979676e-07, "epoch": 2.599713055954089, "percentage": 86.78, "elapsed_time": "3:33:33", "remaining_time": "0:32:31"}
|
605 |
{"current_steps": 605, "total_steps": 696, "loss": 0.3843, "lr": 5.124041311215544e-07, "epoch": 2.6040172166427547, "percentage": 86.93, "elapsed_time": "3:33:54", "remaining_time": "0:32:10"}
|
606 |
{"current_steps": 606, "total_steps": 696, "loss": 0.3959, "lr": 5.0139547158427e-07, "epoch": 2.6083213773314204, "percentage": 87.07, "elapsed_time": "3:34:17", "remaining_time": "0:31:49"}
|
607 |
+
{"current_steps": 607, "total_steps": 696, "loss": 0.4323, "lr": 4.905001115444475e-07, "epoch": 2.6126255380200862, "percentage": 87.21, "elapsed_time": "3:34:37", "remaining_time": "0:31:28"}
|
608 |
+
{"current_steps": 608, "total_steps": 696, "loss": 0.3858, "lr": 4.797183254069176e-07, "epoch": 2.616929698708752, "percentage": 87.36, "elapsed_time": "3:34:58", "remaining_time": "0:31:06"}
|
609 |
+
{"current_steps": 609, "total_steps": 696, "loss": 0.4297, "lr": 4.690503847160982e-07, "epoch": 2.6212338593974174, "percentage": 87.5, "elapsed_time": "3:35:20", "remaining_time": "0:30:45"}
|
610 |
+
{"current_steps": 610, "total_steps": 696, "loss": 0.3975, "lr": 4.5849655814915683e-07, "epoch": 2.625538020086083, "percentage": 87.64, "elapsed_time": "3:35:42", "remaining_time": "0:30:24"}
|
611 |
+
{"current_steps": 611, "total_steps": 696, "loss": 0.3648, "lr": 4.4805711150924304e-07, "epoch": 2.629842180774749, "percentage": 87.79, "elapsed_time": "3:36:03", "remaining_time": "0:30:03"}
|
612 |
+
{"current_steps": 612, "total_steps": 696, "loss": 0.4397, "lr": 4.3773230771879004e-07, "epoch": 2.6341463414634148, "percentage": 87.93, "elapsed_time": "3:36:25", "remaining_time": "0:29:42"}
|
613 |
+
{"current_steps": 613, "total_steps": 696, "loss": 0.3775, "lr": 4.2752240681290027e-07, "epoch": 2.6384505021520805, "percentage": 88.07, "elapsed_time": "3:36:44", "remaining_time": "0:29:20"}
|
614 |
+
{"current_steps": 614, "total_steps": 696, "loss": 0.4052, "lr": 4.1742766593278974e-07, "epoch": 2.642754662840746, "percentage": 88.22, "elapsed_time": "3:37:06", "remaining_time": "0:28:59"}
|
615 |
+
{"current_steps": 615, "total_steps": 696, "loss": 0.3822, "lr": 4.074483393193135e-07, "epoch": 2.6470588235294117, "percentage": 88.36, "elapsed_time": "3:37:28", "remaining_time": "0:28:38"}
|
616 |
+
{"current_steps": 616, "total_steps": 696, "loss": 0.3862, "lr": 3.9758467830656623e-07, "epoch": 2.6513629842180775, "percentage": 88.51, "elapsed_time": "3:37:47", "remaining_time": "0:28:17"}
|
617 |
+
{"current_steps": 617, "total_steps": 696, "loss": 0.3844, "lr": 3.8783693131554836e-07, "epoch": 2.6556671449067433, "percentage": 88.65, "elapsed_time": "3:38:08", "remaining_time": "0:27:55"}
|
618 |
+
{"current_steps": 618, "total_steps": 696, "loss": 0.4243, "lr": 3.782053438479094e-07, "epoch": 2.659971305595409, "percentage": 88.79, "elapsed_time": "3:38:31", "remaining_time": "0:27:34"}
|
619 |
+
{"current_steps": 619, "total_steps": 696, "loss": 0.3809, "lr": 3.686901584797675e-07, "epoch": 2.6642754662840744, "percentage": 88.94, "elapsed_time": "3:38:48", "remaining_time": "0:27:13"}
|
620 |
+
{"current_steps": 620, "total_steps": 696, "loss": 0.3873, "lr": 3.5929161485559694e-07, "epoch": 2.66857962697274, "percentage": 89.08, "elapsed_time": "3:39:11", "remaining_time": "0:26:52"}
|
621 |
+
{"current_steps": 621, "total_steps": 696, "loss": 0.3545, "lr": 3.5000994968219406e-07, "epoch": 2.672883787661406, "percentage": 89.22, "elapsed_time": "3:39:31", "remaining_time": "0:26:30"}
|
622 |
+
{"current_steps": 622, "total_steps": 696, "loss": 0.4052, "lr": 3.4084539672271764e-07, "epoch": 2.677187948350072, "percentage": 89.37, "elapsed_time": "3:39:52", "remaining_time": "0:26:09"}
|
623 |
+
{"current_steps": 623, "total_steps": 696, "loss": 0.3843, "lr": 3.3179818679079936e-07, "epoch": 2.6814921090387376, "percentage": 89.51, "elapsed_time": "3:40:13", "remaining_time": "0:25:48"}
|
624 |
+
{"current_steps": 624, "total_steps": 696, "loss": 0.3866, "lr": 3.228685477447291e-07, "epoch": 2.685796269727403, "percentage": 89.66, "elapsed_time": "3:40:31", "remaining_time": "0:25:26"}
|
625 |
+
{"current_steps": 625, "total_steps": 696, "loss": 0.3993, "lr": 3.140567044817172e-07, "epoch": 2.6901004304160687, "percentage": 89.8, "elapsed_time": "3:40:52", "remaining_time": "0:25:05"}
|
626 |
+
{"current_steps": 626, "total_steps": 696, "loss": 0.3876, "lr": 3.0536287893223603e-07, "epoch": 2.6944045911047345, "percentage": 89.94, "elapsed_time": "3:41:12", "remaining_time": "0:24:44"}
|
627 |
+
{"current_steps": 627, "total_steps": 696, "loss": 0.3943, "lr": 2.967872900544194e-07, "epoch": 2.6987087517934003, "percentage": 90.09, "elapsed_time": "3:41:31", "remaining_time": "0:24:22"}
|
628 |
+
{"current_steps": 628, "total_steps": 696, "loss": 0.4108, "lr": 2.883301538285582e-07, "epoch": 2.703012912482066, "percentage": 90.23, "elapsed_time": "3:41:51", "remaining_time": "0:24:01"}
|
629 |
+
{"current_steps": 629, "total_steps": 696, "loss": 0.3659, "lr": 2.799916832516575e-07, "epoch": 2.7073170731707314, "percentage": 90.37, "elapsed_time": "3:42:11", "remaining_time": "0:23:40"}
|
630 |
+
{"current_steps": 630, "total_steps": 696, "loss": 0.3805, "lr": 2.717720883320685e-07, "epoch": 2.7116212338593977, "percentage": 90.52, "elapsed_time": "3:42:32", "remaining_time": "0:23:18"}
|
631 |
+
{"current_steps": 631, "total_steps": 696, "loss": 0.417, "lr": 2.6367157608420347e-07, "epoch": 2.715925394548063, "percentage": 90.66, "elapsed_time": "3:42:55", "remaining_time": "0:22:57"}
|
632 |
+
{"current_steps": 632, "total_steps": 696, "loss": 0.3635, "lr": 2.556903505233216e-07, "epoch": 2.720229555236729, "percentage": 90.8, "elapsed_time": "3:43:13", "remaining_time": "0:22:36"}
|
633 |
+
{"current_steps": 633, "total_steps": 696, "loss": 0.4361, "lr": 2.4782861266038904e-07, "epoch": 2.7245337159253946, "percentage": 90.95, "elapsed_time": "3:43:35", "remaining_time": "0:22:15"}
|
634 |
+
{"current_steps": 634, "total_steps": 696, "loss": 0.4118, "lr": 2.4008656049701875e-07, "epoch": 2.7288378766140604, "percentage": 91.09, "elapsed_time": "3:43:58", "remaining_time": "0:21:54"}
|
635 |
+
{"current_steps": 635, "total_steps": 696, "loss": 0.3608, "lr": 2.3246438902048196e-07, "epoch": 2.733142037302726, "percentage": 91.24, "elapsed_time": "3:44:19", "remaining_time": "0:21:32"}
|
636 |
+
{"current_steps": 636, "total_steps": 696, "loss": 0.4244, "lr": 2.2496229019879635e-07, "epoch": 2.7374461979913915, "percentage": 91.38, "elapsed_time": "3:44:38", "remaining_time": "0:21:11"}
|
637 |
+
{"current_steps": 637, "total_steps": 696, "loss": 0.4173, "lr": 2.175804529758929e-07, "epoch": 2.7417503586800573, "percentage": 91.52, "elapsed_time": "3:45:00", "remaining_time": "0:20:50"}
|
638 |
+
{"current_steps": 638, "total_steps": 696, "loss": 0.399, "lr": 2.1031906326685946e-07, "epoch": 2.746054519368723, "percentage": 91.67, "elapsed_time": "3:45:20", "remaining_time": "0:20:29"}
|
639 |
+
{"current_steps": 639, "total_steps": 696, "loss": 0.3802, "lr": 2.0317830395325255e-07, "epoch": 2.750358680057389, "percentage": 91.81, "elapsed_time": "3:45:40", "remaining_time": "0:20:07"}
|
640 |
+
{"current_steps": 640, "total_steps": 696, "loss": 0.3867, "lr": 1.9615835487849677e-07, "epoch": 2.7546628407460547, "percentage": 91.95, "elapsed_time": "3:46:02", "remaining_time": "0:19:46"}
|
641 |
+
{"current_steps": 641, "total_steps": 696, "loss": 0.3963, "lr": 1.8925939284335225e-07, "epoch": 2.75896700143472, "percentage": 92.1, "elapsed_time": "3:46:21", "remaining_time": "0:19:25"}
|
642 |
+
{"current_steps": 642, "total_steps": 696, "loss": 0.4116, "lr": 1.824815916014644e-07, "epoch": 2.763271162123386, "percentage": 92.24, "elapsed_time": "3:46:43", "remaining_time": "0:19:04"}
|
643 |
+
{"current_steps": 643, "total_steps": 696, "loss": 0.3818, "lr": 1.7582512185498446e-07, "epoch": 2.7675753228120517, "percentage": 92.39, "elapsed_time": "3:47:06", "remaining_time": "0:18:43"}
|
644 |
+
{"current_steps": 644, "total_steps": 696, "loss": 0.4179, "lr": 1.6929015125027314e-07, "epoch": 2.7718794835007174, "percentage": 92.53, "elapsed_time": "3:47:26", "remaining_time": "0:18:21"}
|
645 |
+
{"current_steps": 645, "total_steps": 696, "loss": 0.4116, "lr": 1.6287684437367724e-07, "epoch": 2.7761836441893832, "percentage": 92.67, "elapsed_time": "3:47:46", "remaining_time": "0:18:00"}
|
646 |
+
{"current_steps": 646, "total_steps": 696, "loss": 0.4216, "lr": 1.5658536274738623e-07, "epoch": 2.7804878048780486, "percentage": 92.82, "elapsed_time": "3:48:06", "remaining_time": "0:17:39"}
|
647 |
+
{"current_steps": 647, "total_steps": 696, "loss": 0.4378, "lr": 1.504158648253584e-07, "epoch": 2.7847919655667144, "percentage": 92.96, "elapsed_time": "3:48:27", "remaining_time": "0:17:18"}
|
648 |
+
{"current_steps": 648, "total_steps": 696, "loss": 0.4068, "lr": 1.443685059893396e-07, "epoch": 2.78909612625538, "percentage": 93.1, "elapsed_time": "3:48:46", "remaining_time": "0:16:56"}
|
649 |
+
{"current_steps": 649, "total_steps": 696, "loss": 0.39, "lr": 1.3844343854494123e-07, "epoch": 2.793400286944046, "percentage": 93.25, "elapsed_time": "3:49:04", "remaining_time": "0:16:35"}
|
650 |
+
{"current_steps": 650, "total_steps": 696, "loss": 0.3683, "lr": 1.3264081171780797e-07, "epoch": 2.7977044476327118, "percentage": 93.39, "elapsed_time": "3:49:24", "remaining_time": "0:16:14"}
|
651 |
+
{"current_steps": 651, "total_steps": 696, "loss": 0.3965, "lr": 1.2696077164986e-07, "epoch": 2.802008608321377, "percentage": 93.53, "elapsed_time": "3:49:45", "remaining_time": "0:15:52"}
|
652 |
+
{"current_steps": 652, "total_steps": 696, "loss": 0.4027, "lr": 1.2140346139561277e-07, "epoch": 2.806312769010043, "percentage": 93.68, "elapsed_time": "3:50:06", "remaining_time": "0:15:31"}
|
653 |
+
{"current_steps": 653, "total_steps": 696, "loss": 0.4236, "lr": 1.1596902091857043e-07, "epoch": 2.8106169296987087, "percentage": 93.82, "elapsed_time": "3:50:25", "remaining_time": "0:15:10"}
|
654 |
+
{"current_steps": 654, "total_steps": 696, "loss": 0.4033, "lr": 1.1065758708770468e-07, "epoch": 2.8149210903873745, "percentage": 93.97, "elapsed_time": "3:50:46", "remaining_time": "0:14:49"}
|
655 |
+
{"current_steps": 655, "total_steps": 696, "loss": 0.3805, "lr": 1.0546929367400705e-07, "epoch": 2.8192252510760403, "percentage": 94.11, "elapsed_time": "3:51:08", "remaining_time": "0:14:28"}
|
656 |
+
{"current_steps": 656, "total_steps": 696, "loss": 0.3917, "lr": 1.004042713471165e-07, "epoch": 2.8235294117647056, "percentage": 94.25, "elapsed_time": "3:51:29", "remaining_time": "0:14:06"}
|
657 |
+
{"current_steps": 657, "total_steps": 696, "loss": 0.4197, "lr": 9.546264767203328e-08, "epoch": 2.827833572453372, "percentage": 94.4, "elapsed_time": "3:51:48", "remaining_time": "0:13:45"}
|
658 |
+
{"current_steps": 658, "total_steps": 696, "loss": 0.3731, "lr": 9.064454710590253e-08, "epoch": 2.832137733142037, "percentage": 94.54, "elapsed_time": "3:52:05", "remaining_time": "0:13:24"}
|
659 |
+
{"current_steps": 659, "total_steps": 696, "loss": 0.3894, "lr": 8.595009099488238e-08, "epoch": 2.836441893830703, "percentage": 94.68, "elapsed_time": "3:52:25", "remaining_time": "0:13:02"}
|
660 |
+
{"current_steps": 660, "total_steps": 696, "loss": 0.4, "lr": 8.137939757108526e-08, "epoch": 2.840746054519369, "percentage": 94.83, "elapsed_time": "3:52:46", "remaining_time": "0:12:41"}
|
661 |
+
{"current_steps": 661, "total_steps": 696, "loss": 0.427, "lr": 7.693258194960252e-08, "epoch": 2.8450502152080346, "percentage": 94.97, "elapsed_time": "3:53:06", "remaining_time": "0:12:20"}
|
662 |
+
{"current_steps": 662, "total_steps": 696, "loss": 0.3931, "lr": 7.260975612560173e-08, "epoch": 2.8493543758967004, "percentage": 95.11, "elapsed_time": "3:53:25", "remaining_time": "0:11:59"}
|
663 |
+
{"current_steps": 663, "total_steps": 696, "loss": 0.3934, "lr": 6.84110289715112e-08, "epoch": 2.8536585365853657, "percentage": 95.26, "elapsed_time": "3:53:47", "remaining_time": "0:11:38"}
|
664 |
+
{"current_steps": 664, "total_steps": 696, "loss": 0.4066, "lr": 6.433650623427379e-08, "epoch": 2.8579626972740315, "percentage": 95.4, "elapsed_time": "3:54:08", "remaining_time": "0:11:17"}
|
665 |
+
{"current_steps": 665, "total_steps": 696, "loss": 0.4122, "lr": 6.038629053268464e-08, "epoch": 2.8622668579626973, "percentage": 95.55, "elapsed_time": "3:54:27", "remaining_time": "0:10:55"}
|
666 |
+
{"current_steps": 666, "total_steps": 696, "loss": 0.3884, "lr": 5.6560481354807625e-08, "epoch": 2.866571018651363, "percentage": 95.69, "elapsed_time": "3:54:48", "remaining_time": "0:10:34"}
|
667 |
+
{"current_steps": 667, "total_steps": 696, "loss": 0.4035, "lr": 5.285917505546967e-08, "epoch": 2.870875179340029, "percentage": 95.83, "elapsed_time": "3:55:09", "remaining_time": "0:10:13"}
|
668 |
+
{"current_steps": 668, "total_steps": 696, "loss": 0.3689, "lr": 4.928246485383148e-08, "epoch": 2.8751793400286942, "percentage": 95.98, "elapsed_time": "3:55:26", "remaining_time": "0:09:52"}
|
669 |
+
{"current_steps": 669, "total_steps": 696, "loss": 0.389, "lr": 4.583044083104282e-08, "epoch": 2.87948350071736, "percentage": 96.12, "elapsed_time": "3:55:45", "remaining_time": "0:09:30"}
|
670 |
+
{"current_steps": 670, "total_steps": 696, "loss": 0.4015, "lr": 4.250318992797375e-08, "epoch": 2.883787661406026, "percentage": 96.26, "elapsed_time": "3:56:06", "remaining_time": "0:09:09"}
|
671 |
+
{"current_steps": 671, "total_steps": 696, "loss": 0.3971, "lr": 3.9300795943021943e-08, "epoch": 2.8880918220946916, "percentage": 96.41, "elapsed_time": "3:56:27", "remaining_time": "0:08:48"}
|
672 |
+
{"current_steps": 672, "total_steps": 696, "loss": 0.369, "lr": 3.622333953000601e-08, "epoch": 2.8923959827833574, "percentage": 96.55, "elapsed_time": "3:56:43", "remaining_time": "0:08:27"}
|
673 |
+
{"current_steps": 673, "total_steps": 696, "loss": 0.403, "lr": 3.3270898196129944e-08, "epoch": 2.8967001434720228, "percentage": 96.7, "elapsed_time": "3:57:04", "remaining_time": "0:08:06"}
|
674 |
+
{"current_steps": 674, "total_steps": 696, "loss": 0.4154, "lr": 3.0443546300035764e-08, "epoch": 2.9010043041606886, "percentage": 96.84, "elapsed_time": "3:57:26", "remaining_time": "0:07:45"}
|
675 |
+
{"current_steps": 675, "total_steps": 696, "loss": 0.4208, "lr": 2.77413550499267e-08, "epoch": 2.9053084648493543, "percentage": 96.98, "elapsed_time": "3:57:47", "remaining_time": "0:07:23"}
|
676 |
+
{"current_steps": 676, "total_steps": 696, "loss": 0.3764, "lr": 2.516439250177749e-08, "epoch": 2.90961262553802, "percentage": 97.13, "elapsed_time": "3:58:10", "remaining_time": "0:07:02"}
|
677 |
+
{"current_steps": 677, "total_steps": 696, "loss": 0.3865, "lr": 2.2712723557616335e-08, "epoch": 2.913916786226686, "percentage": 97.27, "elapsed_time": "3:58:29", "remaining_time": "0:06:41"}
|
678 |
+
{"current_steps": 678, "total_steps": 696, "loss": 0.4393, "lr": 2.038640996389285e-08, "epoch": 2.9182209469153513, "percentage": 97.41, "elapsed_time": "3:58:51", "remaining_time": "0:06:20"}
|
679 |
+
{"current_steps": 679, "total_steps": 696, "loss": 0.377, "lr": 1.818551030992377e-08, "epoch": 2.922525107604017, "percentage": 97.56, "elapsed_time": "3:59:07", "remaining_time": "0:05:59"}
|
680 |
+
{"current_steps": 680, "total_steps": 696, "loss": 0.3919, "lr": 1.6110080026414123e-08, "epoch": 2.926829268292683, "percentage": 97.7, "elapsed_time": "3:59:28", "remaining_time": "0:05:38"}
|
681 |
+
{"current_steps": 681, "total_steps": 696, "loss": 0.4057, "lr": 1.4160171384064447e-08, "epoch": 2.9311334289813487, "percentage": 97.84, "elapsed_time": "3:59:47", "remaining_time": "0:05:16"}
|
682 |
+
{"current_steps": 682, "total_steps": 696, "loss": 0.4022, "lr": 1.2335833492252425e-08, "epoch": 2.9354375896700144, "percentage": 97.99, "elapsed_time": "4:00:09", "remaining_time": "0:04:55"}
|
683 |
+
{"current_steps": 683, "total_steps": 696, "loss": 0.3835, "lr": 1.063711229779718e-08, "epoch": 2.93974175035868, "percentage": 98.13, "elapsed_time": "4:00:30", "remaining_time": "0:04:34"}
|
684 |
+
{"current_steps": 684, "total_steps": 696, "loss": 0.3517, "lr": 9.06405058380022e-09, "epoch": 2.944045911047346, "percentage": 98.28, "elapsed_time": "4:00:47", "remaining_time": "0:04:13"}
|
685 |
+
{"current_steps": 685, "total_steps": 696, "loss": 0.4198, "lr": 7.61668796857018e-09, "epoch": 2.9483500717360114, "percentage": 98.42, "elapsed_time": "4:01:07", "remaining_time": "0:03:52"}
|
686 |
+
{"current_steps": 686, "total_steps": 696, "loss": 0.3796, "lr": 6.295060904623618e-09, "epoch": 2.952654232424677, "percentage": 98.56, "elapsed_time": "4:01:27", "remaining_time": "0:03:31"}
|
687 |
+
{"current_steps": 687, "total_steps": 696, "loss": 0.4188, "lr": 5.099202677767978e-09, "epoch": 2.956958393113343, "percentage": 98.71, "elapsed_time": "4:01:46", "remaining_time": "0:03:10"}
|
688 |
+
{"current_steps": 688, "total_steps": 696, "loss": 0.42, "lr": 4.02914340626226e-09, "epoch": 2.9612625538020088, "percentage": 98.85, "elapsed_time": "4:02:05", "remaining_time": "0:02:48"}
|
689 |
+
{"current_steps": 689, "total_steps": 696, "loss": 0.3739, "lr": 3.0849100400587307e-09, "epoch": 2.9655667144906745, "percentage": 98.99, "elapsed_time": "4:02:24", "remaining_time": "0:02:27"}
|
690 |
+
{"current_steps": 690, "total_steps": 696, "loss": 0.4282, "lr": 2.2665263601240328e-09, "epoch": 2.96987087517934, "percentage": 99.14, "elapsed_time": "4:02:46", "remaining_time": "0:02:06"}
|
691 |
+
{"current_steps": 691, "total_steps": 696, "loss": 0.409, "lr": 1.5740129778413215e-09, "epoch": 2.9741750358680057, "percentage": 99.28, "elapsed_time": "4:03:06", "remaining_time": "0:01:45"}
|
692 |
+
{"current_steps": 692, "total_steps": 696, "loss": 0.383, "lr": 1.0073873344895735e-09, "epoch": 2.9784791965566715, "percentage": 99.43, "elapsed_time": "4:03:27", "remaining_time": "0:01:24"}
|
693 |
+
{"current_steps": 693, "total_steps": 696, "loss": 0.3953, "lr": 5.666637008061582e-10, "epoch": 2.9827833572453373, "percentage": 99.57, "elapsed_time": "4:03:48", "remaining_time": "0:01:03"}
|
694 |
+
{"current_steps": 694, "total_steps": 696, "loss": 0.383, "lr": 2.5185317662490547e-10, "epoch": 2.987087517934003, "percentage": 99.71, "elapsed_time": "4:04:09", "remaining_time": "0:00:42"}
|
695 |
+
{"current_steps": 695, "total_steps": 696, "loss": 0.4103, "lr": 6.296369059854978e-11, "epoch": 2.9913916786226684, "percentage": 99.86, "elapsed_time": "4:04:29", "remaining_time": "0:00:21"}
|
696 |
+
{"current_steps": 696, "total_steps": 696, "loss": 0.3768, "lr": 0.0, "epoch": 2.995695839311334, "percentage": 100.0, "elapsed_time": "4:04:49", "remaining_time": "0:00:00"}
|
697 |
+
{"current_steps": 696, "total_steps": 696, "epoch": 2.995695839311334, "percentage": 100.0, "elapsed_time": "4:05:42", "remaining_time": "0:00:00"}
|