{"current_steps": 5, "total_steps": 747, "loss": 1.3318, "learning_rate": 4.999447296060165e-05, "epoch": 0.02001000500250125, "percentage": 0.67, "elapsed_time": "0:00:24", "remaining_time": "1:01:39", "throughput": 627.74, "total_tokens": 15648} {"current_steps": 10, "total_steps": 747, "loss": 1.2773, "learning_rate": 4.997789428625975e-05, "epoch": 0.0400200100050025, "percentage": 1.34, "elapsed_time": "0:00:45", "remaining_time": "0:56:20", "throughput": 626.07, "total_tokens": 28720} {"current_steps": 15, "total_steps": 747, "loss": 1.1401, "learning_rate": 4.995027130745321e-05, "epoch": 0.060030015007503754, "percentage": 2.01, "elapsed_time": "0:01:09", "remaining_time": "0:56:41", "throughput": 628.49, "total_tokens": 43808} {"current_steps": 20, "total_steps": 747, "loss": 1.089, "learning_rate": 4.99116162380454e-05, "epoch": 0.080040020010005, "percentage": 2.68, "elapsed_time": "0:01:32", "remaining_time": "0:55:44", "throughput": 624.67, "total_tokens": 57472} {"current_steps": 25, "total_steps": 747, "loss": 1.1176, "learning_rate": 4.986194616988364e-05, "epoch": 0.10005002501250625, "percentage": 3.35, "elapsed_time": "0:01:55", "remaining_time": "0:55:32", "throughput": 623.6, "total_tokens": 71968} {"current_steps": 30, "total_steps": 747, "loss": 0.9949, "learning_rate": 4.980128306524183e-05, "epoch": 0.12006003001500751, "percentage": 4.02, "elapsed_time": "0:02:16", "remaining_time": "0:54:33", "throughput": 624.67, "total_tokens": 85552} {"current_steps": 35, "total_steps": 747, "loss": 1.0264, "learning_rate": 4.972965374710952e-05, "epoch": 0.14007003501750875, "percentage": 4.69, "elapsed_time": "0:02:40", "remaining_time": "0:54:23", "throughput": 626.61, "total_tokens": 100512} {"current_steps": 40, "total_steps": 747, "loss": 1.0004, "learning_rate": 4.964708988733178e-05, "epoch": 0.16008004002001, "percentage": 5.35, "elapsed_time": "0:03:01", "remaining_time": "0:53:31", "throughput": 624.07, "total_tokens": 113376} {"current_steps": 45, "total_steps": 747, "loss": 1.1137, "learning_rate": 4.9553627992605066e-05, "epoch": 0.18009004502251125, "percentage": 6.02, "elapsed_time": "0:03:24", "remaining_time": "0:53:10", "throughput": 624.26, "total_tokens": 127680} {"current_steps": 50, "total_steps": 747, "loss": 0.9646, "learning_rate": 4.944930938833535e-05, "epoch": 0.2001000500250125, "percentage": 6.69, "elapsed_time": "0:03:48", "remaining_time": "0:53:05", "throughput": 626.36, "total_tokens": 143136} {"current_steps": 55, "total_steps": 747, "loss": 0.9757, "learning_rate": 4.9334180200365486e-05, "epoch": 0.22011005502751377, "percentage": 7.36, "elapsed_time": "0:04:09", "remaining_time": "0:52:14", "throughput": 624.03, "total_tokens": 155488} {"current_steps": 60, "total_steps": 747, "loss": 0.9126, "learning_rate": 4.9208291334580104e-05, "epoch": 0.24012006003001501, "percentage": 8.03, "elapsed_time": "0:04:33", "remaining_time": "0:52:11", "throughput": 625.35, "total_tokens": 171008} {"current_steps": 65, "total_steps": 747, "loss": 1.0119, "learning_rate": 4.907169845439688e-05, "epoch": 0.26013006503251623, "percentage": 8.7, "elapsed_time": "0:04:56", "remaining_time": "0:51:50", "throughput": 625.91, "total_tokens": 185536} {"current_steps": 70, "total_steps": 747, "loss": 1.1192, "learning_rate": 4.892446195615423e-05, "epoch": 0.2801400700350175, "percentage": 9.37, "elapsed_time": "0:05:21", "remaining_time": "0:51:49", "throughput": 627.38, "total_tokens": 201728} {"current_steps": 75, "total_steps": 747, "loss": 1.0167, "learning_rate": 4.87666469424063e-05, "epoch": 0.3001500750375188, "percentage": 10.04, "elapsed_time": "0:05:46", "remaining_time": "0:51:40", "throughput": 628.71, "total_tokens": 217584} {"current_steps": 80, "total_steps": 747, "loss": 0.8291, "learning_rate": 4.859832319313697e-05, "epoch": 0.32016008004002, "percentage": 10.71, "elapsed_time": "0:06:07", "remaining_time": "0:51:05", "throughput": 627.94, "total_tokens": 230864} {"current_steps": 85, "total_steps": 747, "loss": 0.9591, "learning_rate": 4.841956513490577e-05, "epoch": 0.3401700850425213, "percentage": 11.38, "elapsed_time": "0:06:31", "remaining_time": "0:50:48", "throughput": 627.43, "total_tokens": 245584} {"current_steps": 90, "total_steps": 747, "loss": 0.9869, "learning_rate": 4.8230451807939135e-05, "epoch": 0.3601800900450225, "percentage": 12.05, "elapsed_time": "0:06:53", "remaining_time": "0:50:22", "throughput": 627.47, "total_tokens": 259760} {"current_steps": 95, "total_steps": 747, "loss": 1.0423, "learning_rate": 4.803106683118177e-05, "epoch": 0.38019009504752377, "percentage": 12.72, "elapsed_time": "0:07:17", "remaining_time": "0:49:59", "throughput": 627.86, "total_tokens": 274432} {"current_steps": 100, "total_steps": 747, "loss": 1.0122, "learning_rate": 4.782149836532345e-05, "epoch": 0.400200100050025, "percentage": 13.39, "elapsed_time": "0:07:39", "remaining_time": "0:49:32", "throughput": 627.48, "total_tokens": 288256} {"current_steps": 105, "total_steps": 747, "loss": 0.9849, "learning_rate": 4.760183907381757e-05, "epoch": 0.42021010505252626, "percentage": 14.06, "elapsed_time": "0:08:01", "remaining_time": "0:49:05", "throughput": 625.12, "total_tokens": 301136} {"current_steps": 110, "total_steps": 747, "loss": 0.7958, "learning_rate": 4.737218608190878e-05, "epoch": 0.44022011005502754, "percentage": 14.73, "elapsed_time": "0:08:22", "remaining_time": "0:48:30", "throughput": 624.25, "total_tokens": 313712} {"current_steps": 115, "total_steps": 747, "loss": 0.9773, "learning_rate": 4.713264093368783e-05, "epoch": 0.46023011505752875, "percentage": 15.39, "elapsed_time": "0:08:46", "remaining_time": "0:48:10", "throughput": 624.47, "total_tokens": 328496} {"current_steps": 120, "total_steps": 747, "loss": 0.9953, "learning_rate": 4.6883309547192476e-05, "epoch": 0.48024012006003003, "percentage": 16.06, "elapsed_time": "0:09:08", "remaining_time": "0:47:45", "throughput": 624.14, "total_tokens": 342288} {"current_steps": 125, "total_steps": 747, "loss": 0.9726, "learning_rate": 4.6624302167574436e-05, "epoch": 0.5002501250625313, "percentage": 16.73, "elapsed_time": "0:09:30", "remaining_time": "0:47:18", "throughput": 624.23, "total_tokens": 356128} {"current_steps": 130, "total_steps": 747, "loss": 0.9987, "learning_rate": 4.635573331835302e-05, "epoch": 0.5202601300650325, "percentage": 17.4, "elapsed_time": "0:09:50", "remaining_time": "0:46:42", "throughput": 623.25, "total_tokens": 368000} {"current_steps": 135, "total_steps": 747, "loss": 1.012, "learning_rate": 4.607772175077711e-05, "epoch": 0.5402701350675337, "percentage": 18.07, "elapsed_time": "0:10:12", "remaining_time": "0:46:14", "throughput": 622.79, "total_tokens": 381216} {"current_steps": 140, "total_steps": 747, "loss": 0.9104, "learning_rate": 4.5790390391317675e-05, "epoch": 0.560280140070035, "percentage": 18.74, "elapsed_time": "0:10:34", "remaining_time": "0:45:51", "throughput": 622.96, "total_tokens": 395296} {"current_steps": 145, "total_steps": 747, "loss": 0.9087, "learning_rate": 4.549386628731425e-05, "epoch": 0.5802901450725363, "percentage": 19.41, "elapsed_time": "0:10:56", "remaining_time": "0:45:27", "throughput": 623.09, "total_tokens": 409312} {"current_steps": 150, "total_steps": 747, "loss": 1.0859, "learning_rate": 4.518828055079925e-05, "epoch": 0.6003001500750376, "percentage": 20.08, "elapsed_time": "0:11:20", "remaining_time": "0:45:08", "throughput": 623.08, "total_tokens": 424064} {"current_steps": 155, "total_steps": 747, "loss": 0.9696, "learning_rate": 4.487376830052511e-05, "epoch": 0.6203101550775387, "percentage": 20.75, "elapsed_time": "0:11:42", "remaining_time": "0:44:42", "throughput": 622.55, "total_tokens": 437264} {"current_steps": 160, "total_steps": 747, "loss": 1.0014, "learning_rate": 4.4550468602219716e-05, "epoch": 0.64032016008004, "percentage": 21.42, "elapsed_time": "0:12:03", "remaining_time": "0:44:14", "throughput": 622.76, "total_tokens": 450624} {"current_steps": 165, "total_steps": 747, "loss": 0.8877, "learning_rate": 4.421852440709666e-05, "epoch": 0.6603301650825413, "percentage": 22.09, "elapsed_time": "0:12:27", "remaining_time": "0:43:56", "throughput": 623.35, "total_tokens": 465968} {"current_steps": 170, "total_steps": 747, "loss": 0.9694, "learning_rate": 4.387808248864751e-05, "epoch": 0.6803401700850426, "percentage": 22.76, "elapsed_time": "0:12:50", "remaining_time": "0:43:36", "throughput": 623.55, "total_tokens": 480720} {"current_steps": 175, "total_steps": 747, "loss": 0.8613, "learning_rate": 4.352929337774395e-05, "epoch": 0.7003501750875438, "percentage": 23.43, "elapsed_time": "0:13:13", "remaining_time": "0:43:14", "throughput": 623.73, "total_tokens": 495008} {"current_steps": 180, "total_steps": 747, "loss": 0.907, "learning_rate": 4.3172311296078595e-05, "epoch": 0.720360180090045, "percentage": 24.1, "elapsed_time": "0:13:36", "remaining_time": "0:42:51", "throughput": 623.61, "total_tokens": 509024} {"current_steps": 185, "total_steps": 747, "loss": 1.0501, "learning_rate": 4.2807294087973834e-05, "epoch": 0.7403701850925463, "percentage": 24.77, "elapsed_time": "0:14:00", "remaining_time": "0:42:34", "throughput": 623.97, "total_tokens": 524752} {"current_steps": 190, "total_steps": 747, "loss": 0.9158, "learning_rate": 4.2434403150588895e-05, "epoch": 0.7603801900950475, "percentage": 25.44, "elapsed_time": "0:14:22", "remaining_time": "0:42:07", "throughput": 623.91, "total_tokens": 537872} {"current_steps": 195, "total_steps": 747, "loss": 0.9756, "learning_rate": 4.205380336255594e-05, "epoch": 0.7803901950975488, "percentage": 26.1, "elapsed_time": "0:14:46", "remaining_time": "0:41:48", "throughput": 623.92, "total_tokens": 552832} {"current_steps": 200, "total_steps": 747, "loss": 1.0702, "learning_rate": 4.166566301107687e-05, "epoch": 0.80040020010005, "percentage": 26.77, "elapsed_time": "0:15:07", "remaining_time": "0:41:22", "throughput": 623.93, "total_tokens": 566224} {"current_steps": 205, "total_steps": 747, "loss": 0.8236, "learning_rate": 4.127015371751284e-05, "epoch": 0.8204102051025512, "percentage": 27.44, "elapsed_time": "0:15:33", "remaining_time": "0:41:09", "throughput": 623.81, "total_tokens": 582560} {"current_steps": 210, "total_steps": 747, "loss": 0.8779, "learning_rate": 4.08674503614997e-05, "epoch": 0.8404202101050525, "percentage": 28.11, "elapsed_time": "0:15:54", "remaining_time": "0:40:41", "throughput": 623.71, "total_tokens": 595568} {"current_steps": 215, "total_steps": 747, "loss": 0.9544, "learning_rate": 4.0457731003622606e-05, "epoch": 0.8604302151075538, "percentage": 28.78, "elapsed_time": "0:16:16", "remaining_time": "0:40:17", "throughput": 623.48, "total_tokens": 609040} {"current_steps": 220, "total_steps": 747, "loss": 0.8529, "learning_rate": 4.004117680668422e-05, "epoch": 0.8804402201100551, "percentage": 29.45, "elapsed_time": "0:16:39", "remaining_time": "0:39:54", "throughput": 623.49, "total_tokens": 623168} {"current_steps": 225, "total_steps": 747, "loss": 0.916, "learning_rate": 3.961797195560118e-05, "epoch": 0.9004502251125562, "percentage": 30.12, "elapsed_time": "0:17:05", "remaining_time": "0:39:38", "throughput": 624.01, "total_tokens": 639680} {"current_steps": 230, "total_steps": 747, "loss": 1.0282, "learning_rate": 3.918830357596434e-05, "epoch": 0.9204602301150575, "percentage": 30.79, "elapsed_time": "0:17:28", "remaining_time": "0:39:17", "throughput": 624.15, "total_tokens": 654512} {"current_steps": 235, "total_steps": 747, "loss": 1.0636, "learning_rate": 3.8752361651298675e-05, "epoch": 0.9404702351175588, "percentage": 31.46, "elapsed_time": "0:17:51", "remaining_time": "0:38:54", "throughput": 624.33, "total_tokens": 668992} {"current_steps": 240, "total_steps": 747, "loss": 0.855, "learning_rate": 3.8310338939059644e-05, "epoch": 0.9604802401200601, "percentage": 32.13, "elapsed_time": "0:18:14", "remaining_time": "0:38:32", "throughput": 624.37, "total_tokens": 683360} {"current_steps": 245, "total_steps": 747, "loss": 0.9286, "learning_rate": 3.7862430885402876e-05, "epoch": 0.9804902451225613, "percentage": 32.8, "elapsed_time": "0:18:36", "remaining_time": "0:38:08", "throughput": 624.49, "total_tokens": 697456} {"current_steps": 250, "total_steps": 747, "loss": 0.9295, "learning_rate": 3.740883553876515e-05, "epoch": 1.0005002501250626, "percentage": 33.47, "elapsed_time": "0:19:01", "remaining_time": "0:37:49", "throughput": 624.76, "total_tokens": 713088} {"current_steps": 255, "total_steps": 747, "loss": 0.9945, "learning_rate": 3.694975346229458e-05, "epoch": 1.0205102551275638, "percentage": 34.14, "elapsed_time": "0:19:22", "remaining_time": "0:37:23", "throughput": 624.62, "total_tokens": 726176} {"current_steps": 260, "total_steps": 747, "loss": 0.8799, "learning_rate": 3.6485387645169064e-05, "epoch": 1.040520260130065, "percentage": 34.81, "elapsed_time": "0:19:46", "remaining_time": "0:37:03", "throughput": 624.83, "total_tokens": 741664} {"current_steps": 265, "total_steps": 747, "loss": 0.8551, "learning_rate": 3.601594341284195e-05, "epoch": 1.0605302651325663, "percentage": 35.48, "elapsed_time": "0:20:08", "remaining_time": "0:36:37", "throughput": 624.62, "total_tokens": 754720} {"current_steps": 270, "total_steps": 747, "loss": 0.8381, "learning_rate": 3.55416283362546e-05, "epoch": 1.0805402701350675, "percentage": 36.14, "elapsed_time": "0:20:29", "remaining_time": "0:36:11", "throughput": 624.42, "total_tokens": 767568} {"current_steps": 275, "total_steps": 747, "loss": 0.8036, "learning_rate": 3.5062652140056275e-05, "epoch": 1.1005502751375689, "percentage": 36.81, "elapsed_time": "0:20:54", "remaining_time": "0:35:53", "throughput": 624.96, "total_tokens": 784192} {"current_steps": 280, "total_steps": 747, "loss": 0.7851, "learning_rate": 3.457922660987155e-05, "epoch": 1.12056028014007, "percentage": 37.48, "elapsed_time": "0:21:16", "remaining_time": "0:35:28", "throughput": 624.83, "total_tokens": 797328} {"current_steps": 285, "total_steps": 747, "loss": 0.8262, "learning_rate": 3.409156549865654e-05, "epoch": 1.1405702851425712, "percentage": 38.15, "elapsed_time": "0:21:39", "remaining_time": "0:35:06", "throughput": 625.11, "total_tokens": 812416} {"current_steps": 290, "total_steps": 747, "loss": 0.9297, "learning_rate": 3.3599884432185225e-05, "epoch": 1.1605802901450726, "percentage": 38.82, "elapsed_time": "0:22:01", "remaining_time": "0:34:41", "throughput": 625.01, "total_tokens": 825744} {"current_steps": 295, "total_steps": 747, "loss": 1.0422, "learning_rate": 3.310440081370767e-05, "epoch": 1.1805902951475737, "percentage": 39.49, "elapsed_time": "0:22:24", "remaining_time": "0:34:19", "throughput": 625.18, "total_tokens": 840256} {"current_steps": 300, "total_steps": 747, "loss": 0.8906, "learning_rate": 3.260533372782234e-05, "epoch": 1.2006003001500751, "percentage": 40.16, "elapsed_time": "0:22:46", "remaining_time": "0:33:55", "throughput": 625.09, "total_tokens": 854016} {"current_steps": 305, "total_steps": 747, "loss": 0.7934, "learning_rate": 3.2102903843604885e-05, "epoch": 1.2206103051525763, "percentage": 40.83, "elapsed_time": "0:23:10", "remaining_time": "0:33:35", "throughput": 624.62, "total_tokens": 868592} {"current_steps": 310, "total_steps": 747, "loss": 0.7439, "learning_rate": 3.1597333317036545e-05, "epoch": 1.2406203101550775, "percentage": 41.5, "elapsed_time": "0:23:31", "remaining_time": "0:33:09", "throughput": 624.54, "total_tokens": 881280} {"current_steps": 315, "total_steps": 747, "loss": 0.841, "learning_rate": 3.10888456927748e-05, "epoch": 1.2606303151575788, "percentage": 42.17, "elapsed_time": "0:23:53", "remaining_time": "0:32:45", "throughput": 624.54, "total_tokens": 895168} {"current_steps": 320, "total_steps": 747, "loss": 0.9016, "learning_rate": 3.057766580531031e-05, "epoch": 1.28064032016008, "percentage": 42.84, "elapsed_time": "0:24:17", "remaining_time": "0:32:24", "throughput": 624.76, "total_tokens": 910624} {"current_steps": 325, "total_steps": 747, "loss": 0.8938, "learning_rate": 3.0064019679553274e-05, "epoch": 1.3006503251625814, "percentage": 43.51, "elapsed_time": "0:24:38", "remaining_time": "0:32:00", "throughput": 624.51, "total_tokens": 923648} {"current_steps": 330, "total_steps": 747, "loss": 0.8739, "learning_rate": 2.9548134430893604e-05, "epoch": 1.3206603301650826, "percentage": 44.18, "elapsed_time": "0:25:01", "remaining_time": "0:31:37", "throughput": 624.67, "total_tokens": 938256} {"current_steps": 335, "total_steps": 747, "loss": 0.9641, "learning_rate": 2.903023816477885e-05, "epoch": 1.3406703351675837, "percentage": 44.85, "elapsed_time": "0:25:26", "remaining_time": "0:31:17", "throughput": 624.81, "total_tokens": 954000} {"current_steps": 340, "total_steps": 747, "loss": 0.8616, "learning_rate": 2.8510559875854377e-05, "epoch": 1.360680340170085, "percentage": 45.52, "elapsed_time": "0:25:46", "remaining_time": "0:30:51", "throughput": 624.36, "total_tokens": 965744} {"current_steps": 345, "total_steps": 747, "loss": 0.7673, "learning_rate": 2.7989329346710375e-05, "epoch": 1.3806903451725863, "percentage": 46.18, "elapsed_time": "0:26:10", "remaining_time": "0:30:29", "throughput": 624.37, "total_tokens": 980512} {"current_steps": 350, "total_steps": 747, "loss": 0.9637, "learning_rate": 2.7466777046280457e-05, "epoch": 1.4007003501750876, "percentage": 46.85, "elapsed_time": "0:26:34", "remaining_time": "0:30:08", "throughput": 624.7, "total_tokens": 996224} {"current_steps": 355, "total_steps": 747, "loss": 0.7466, "learning_rate": 2.69431340279368e-05, "epoch": 1.4207103551775888, "percentage": 47.52, "elapsed_time": "0:26:55", "remaining_time": "0:29:43", "throughput": 624.45, "total_tokens": 1008816} {"current_steps": 360, "total_steps": 747, "loss": 0.8695, "learning_rate": 2.6418631827326857e-05, "epoch": 1.44072036018009, "percentage": 48.19, "elapsed_time": "0:27:19", "remaining_time": "0:29:22", "throughput": 624.52, "total_tokens": 1024032} {"current_steps": 365, "total_steps": 747, "loss": 0.8742, "learning_rate": 2.5893502359996786e-05, "epoch": 1.4607303651825914, "percentage": 48.86, "elapsed_time": "0:27:39", "remaining_time": "0:28:56", "throughput": 624.17, "total_tokens": 1035536} {"current_steps": 370, "total_steps": 747, "loss": 0.8879, "learning_rate": 2.5367977818847034e-05, "epoch": 1.4807403701850925, "percentage": 49.53, "elapsed_time": "0:28:00", "remaining_time": "0:28:32", "throughput": 624.04, "total_tokens": 1048784} {"current_steps": 375, "total_steps": 747, "loss": 0.8188, "learning_rate": 2.484229057146507e-05, "epoch": 1.500750375187594, "percentage": 50.2, "elapsed_time": "0:28:24", "remaining_time": "0:28:10", "throughput": 624.25, "total_tokens": 1063920} {"current_steps": 380, "total_steps": 747, "loss": 0.8898, "learning_rate": 2.431667305738112e-05, "epoch": 1.520760380190095, "percentage": 50.87, "elapsed_time": "0:28:49", "remaining_time": "0:27:49", "throughput": 624.63, "total_tokens": 1080048} {"current_steps": 385, "total_steps": 747, "loss": 0.8779, "learning_rate": 2.3791357685291863e-05, "epoch": 1.5407703851925962, "percentage": 51.54, "elapsed_time": "0:29:10", "remaining_time": "0:27:26", "throughput": 624.6, "total_tokens": 1093584} {"current_steps": 390, "total_steps": 747, "loss": 0.9372, "learning_rate": 2.3266576730297956e-05, "epoch": 1.5607803901950974, "percentage": 52.21, "elapsed_time": "0:29:33", "remaining_time": "0:27:03", "throughput": 624.81, "total_tokens": 1108192} {"current_steps": 395, "total_steps": 747, "loss": 0.7406, "learning_rate": 2.274256223120051e-05, "epoch": 1.5807903951975988, "percentage": 52.88, "elapsed_time": "0:29:56", "remaining_time": "0:26:40", "throughput": 624.88, "total_tokens": 1122368} {"current_steps": 400, "total_steps": 747, "loss": 0.8414, "learning_rate": 2.221954588790206e-05, "epoch": 1.6008004002001002, "percentage": 53.55, "elapsed_time": "0:30:16", "remaining_time": "0:26:16", "throughput": 624.72, "total_tokens": 1135040} {"current_steps": 405, "total_steps": 747, "loss": 0.8781, "learning_rate": 2.1697758958957448e-05, "epoch": 1.6208104052026013, "percentage": 54.22, "elapsed_time": "0:30:42", "remaining_time": "0:25:55", "throughput": 624.32, "total_tokens": 1150096} {"current_steps": 410, "total_steps": 747, "loss": 0.8304, "learning_rate": 2.1177432159319754e-05, "epoch": 1.6408204102051025, "percentage": 54.89, "elapsed_time": "0:31:04", "remaining_time": "0:25:32", "throughput": 624.17, "total_tokens": 1163840} {"current_steps": 415, "total_steps": 747, "loss": 0.9539, "learning_rate": 2.0658795558326743e-05, "epoch": 1.6608304152076037, "percentage": 55.56, "elapsed_time": "0:31:28", "remaining_time": "0:25:10", "throughput": 624.39, "total_tokens": 1179024} {"current_steps": 420, "total_steps": 747, "loss": 0.7972, "learning_rate": 2.014207847797256e-05, "epoch": 1.680840420210105, "percentage": 56.22, "elapsed_time": "0:31:50", "remaining_time": "0:24:47", "throughput": 624.32, "total_tokens": 1192800} {"current_steps": 425, "total_steps": 747, "loss": 0.9455, "learning_rate": 1.9627509391510086e-05, "epoch": 1.7008504252126064, "percentage": 56.89, "elapsed_time": "0:32:11", "remaining_time": "0:24:23", "throughput": 624.31, "total_tokens": 1206160} {"current_steps": 430, "total_steps": 747, "loss": 0.742, "learning_rate": 1.9115315822428437e-05, "epoch": 1.7208604302151076, "percentage": 57.56, "elapsed_time": "0:32:33", "remaining_time": "0:24:00", "throughput": 624.22, "total_tokens": 1219456} {"current_steps": 435, "total_steps": 747, "loss": 0.9298, "learning_rate": 1.8605724243850502e-05, "epoch": 1.7408704352176088, "percentage": 58.23, "elapsed_time": "0:32:55", "remaining_time": "0:23:36", "throughput": 624.21, "total_tokens": 1232848} {"current_steps": 440, "total_steps": 747, "loss": 0.8751, "learning_rate": 1.809895997839482e-05, "epoch": 1.76088044022011, "percentage": 58.9, "elapsed_time": "0:33:15", "remaining_time": "0:23:12", "throughput": 624.0, "total_tokens": 1244944} {"current_steps": 445, "total_steps": 747, "loss": 0.8162, "learning_rate": 1.759524709854626e-05, "epoch": 1.7808904452226113, "percentage": 59.57, "elapsed_time": "0:33:38", "remaining_time": "0:22:49", "throughput": 624.01, "total_tokens": 1259584} {"current_steps": 450, "total_steps": 747, "loss": 0.9372, "learning_rate": 1.70948083275794e-05, "epoch": 1.8009004502251127, "percentage": 60.24, "elapsed_time": "0:34:02", "remaining_time": "0:22:28", "throughput": 624.06, "total_tokens": 1274640} {"current_steps": 455, "total_steps": 747, "loss": 0.9076, "learning_rate": 1.6597864941078552e-05, "epoch": 1.8209104552276139, "percentage": 60.91, "elapsed_time": "0:34:26", "remaining_time": "0:22:05", "throughput": 624.32, "total_tokens": 1289936} {"current_steps": 460, "total_steps": 747, "loss": 0.8189, "learning_rate": 1.6104636669097776e-05, "epoch": 1.840920460230115, "percentage": 61.58, "elapsed_time": "0:34:48", "remaining_time": "0:21:42", "throughput": 624.02, "total_tokens": 1303184} {"current_steps": 465, "total_steps": 747, "loss": 0.8545, "learning_rate": 1.561534159900441e-05, "epoch": 1.8609304652326162, "percentage": 62.25, "elapsed_time": "0:35:11", "remaining_time": "0:21:20", "throughput": 624.11, "total_tokens": 1317920} {"current_steps": 470, "total_steps": 747, "loss": 0.8544, "learning_rate": 1.513019607904882e-05, "epoch": 1.8809404702351176, "percentage": 62.92, "elapsed_time": "0:35:34", "remaining_time": "0:20:58", "throughput": 624.12, "total_tokens": 1332192} {"current_steps": 475, "total_steps": 747, "loss": 0.9191, "learning_rate": 1.464941462270325e-05, "epoch": 1.900950475237619, "percentage": 63.59, "elapsed_time": "0:35:58", "remaining_time": "0:20:36", "throughput": 624.37, "total_tokens": 1348000} {"current_steps": 480, "total_steps": 747, "loss": 0.8605, "learning_rate": 1.4173209813811788e-05, "epoch": 1.9209604802401201, "percentage": 64.26, "elapsed_time": "0:36:21", "remaining_time": "0:20:13", "throughput": 624.42, "total_tokens": 1362096} {"current_steps": 485, "total_steps": 747, "loss": 0.937, "learning_rate": 1.3701792212593662e-05, "epoch": 1.9409704852426213, "percentage": 64.93, "elapsed_time": "0:36:46", "remaining_time": "0:19:52", "throughput": 624.77, "total_tokens": 1378656} {"current_steps": 490, "total_steps": 747, "loss": 0.9073, "learning_rate": 1.3235370262541272e-05, "epoch": 1.9609804902451224, "percentage": 65.6, "elapsed_time": "0:37:09", "remaining_time": "0:19:29", "throughput": 624.89, "total_tokens": 1393344} {"current_steps": 495, "total_steps": 747, "loss": 0.8941, "learning_rate": 1.277415019825417e-05, "epoch": 1.9809904952476238, "percentage": 66.27, "elapsed_time": "0:37:34", "remaining_time": "0:19:07", "throughput": 625.08, "total_tokens": 1409280} {"current_steps": 500, "total_steps": 747, "loss": 0.8051, "learning_rate": 1.2318335954249669e-05, "epoch": 2.001000500250125, "percentage": 66.93, "elapsed_time": "0:37:57", "remaining_time": "0:18:45", "throughput": 625.0, "total_tokens": 1423536} {"current_steps": 505, "total_steps": 747, "loss": 0.751, "learning_rate": 1.1868129074790577e-05, "epoch": 2.0210105052526264, "percentage": 67.6, "elapsed_time": "0:38:19", "remaining_time": "0:18:21", "throughput": 624.51, "total_tokens": 1436048} {"current_steps": 510, "total_steps": 747, "loss": 0.762, "learning_rate": 1.1423728624769695e-05, "epoch": 2.0410205102551275, "percentage": 68.27, "elapsed_time": "0:38:42", "remaining_time": "0:17:59", "throughput": 624.57, "total_tokens": 1450272} {"current_steps": 515, "total_steps": 747, "loss": 0.8222, "learning_rate": 1.098533110169071e-05, "epoch": 2.0610305152576287, "percentage": 68.94, "elapsed_time": "0:39:05", "remaining_time": "0:17:36", "throughput": 624.49, "total_tokens": 1464656} {"current_steps": 520, "total_steps": 747, "loss": 0.7271, "learning_rate": 1.0553130348784182e-05, "epoch": 2.08104052026013, "percentage": 69.61, "elapsed_time": "0:39:26", "remaining_time": "0:17:13", "throughput": 624.45, "total_tokens": 1478016} {"current_steps": 525, "total_steps": 747, "loss": 0.7618, "learning_rate": 1.0127317469297277e-05, "epoch": 2.1010505252626315, "percentage": 70.28, "elapsed_time": "0:39:49", "remaining_time": "0:16:50", "throughput": 624.48, "total_tokens": 1492080} {"current_steps": 530, "total_steps": 747, "loss": 0.7738, "learning_rate": 9.708080741994868e-06, "epoch": 2.1210605302651326, "percentage": 70.95, "elapsed_time": "0:40:13", "remaining_time": "0:16:28", "throughput": 624.61, "total_tokens": 1507504} {"current_steps": 535, "total_steps": 747, "loss": 0.7976, "learning_rate": 9.295605537909708e-06, "epoch": 2.141070535267634, "percentage": 71.62, "elapsed_time": "0:40:34", "remaining_time": "0:16:04", "throughput": 624.49, "total_tokens": 1520080} {"current_steps": 540, "total_steps": 747, "loss": 0.7181, "learning_rate": 8.890074238378074e-06, "epoch": 2.161080540270135, "percentage": 72.29, "elapsed_time": "0:40:53", "remaining_time": "0:15:40", "throughput": 624.31, "total_tokens": 1531920} {"current_steps": 545, "total_steps": 747, "loss": 0.7375, "learning_rate": 8.491666154397573e-06, "epoch": 2.181090545272636, "percentage": 72.96, "elapsed_time": "0:41:16", "remaining_time": "0:15:17", "throughput": 624.28, "total_tokens": 1545856} {"current_steps": 550, "total_steps": 747, "loss": 0.7557, "learning_rate": 8.100557447342327e-06, "epoch": 2.2011005502751377, "percentage": 73.63, "elapsed_time": "0:41:36", "remaining_time": "0:14:54", "throughput": 624.07, "total_tokens": 1558256} {"current_steps": 555, "total_steps": 747, "loss": 0.7973, "learning_rate": 7.71692105107098e-06, "epoch": 2.221110555277639, "percentage": 74.3, "elapsed_time": "0:42:01", "remaining_time": "0:14:32", "throughput": 624.25, "total_tokens": 1573776} {"current_steps": 560, "total_steps": 747, "loss": 0.881, "learning_rate": 7.340926595461687e-06, "epoch": 2.24112056028014, "percentage": 74.97, "elapsed_time": "0:42:26", "remaining_time": "0:14:10", "throughput": 624.4, "total_tokens": 1589968} {"current_steps": 565, "total_steps": 747, "loss": 0.7725, "learning_rate": 6.972740331408015e-06, "epoch": 2.2611305652826412, "percentage": 75.64, "elapsed_time": "0:42:48", "remaining_time": "0:13:47", "throughput": 624.33, "total_tokens": 1603488} {"current_steps": 570, "total_steps": 747, "loss": 0.8143, "learning_rate": 6.612525057308949e-06, "epoch": 2.2811405702851424, "percentage": 76.31, "elapsed_time": "0:43:12", "remaining_time": "0:13:25", "throughput": 624.55, "total_tokens": 1619136} {"current_steps": 575, "total_steps": 747, "loss": 0.7383, "learning_rate": 6.260440047085439e-06, "epoch": 2.301150575287644, "percentage": 76.97, "elapsed_time": "0:43:37", "remaining_time": "0:13:02", "throughput": 624.73, "total_tokens": 1635088} {"current_steps": 580, "total_steps": 747, "loss": 0.9513, "learning_rate": 5.9166409797553415e-06, "epoch": 2.321160580290145, "percentage": 77.64, "elapsed_time": "0:44:03", "remaining_time": "0:12:41", "throughput": 625.05, "total_tokens": 1652560} {"current_steps": 585, "total_steps": 747, "loss": 0.6249, "learning_rate": 5.581279870597867e-06, "epoch": 2.3411705852926463, "percentage": 78.31, "elapsed_time": "0:44:24", "remaining_time": "0:12:17", "throughput": 624.84, "total_tokens": 1665168} {"current_steps": 590, "total_steps": 747, "loss": 0.7327, "learning_rate": 5.254505003938043e-06, "epoch": 2.3611805902951475, "percentage": 78.98, "elapsed_time": "0:44:44", "remaining_time": "0:11:54", "throughput": 624.77, "total_tokens": 1677312} {"current_steps": 595, "total_steps": 747, "loss": 0.8425, "learning_rate": 4.936460867580889e-06, "epoch": 2.3811905952976486, "percentage": 79.65, "elapsed_time": "0:45:06", "remaining_time": "0:11:31", "throughput": 624.65, "total_tokens": 1690400} {"current_steps": 600, "total_steps": 747, "loss": 0.8224, "learning_rate": 4.627288088924156e-06, "epoch": 2.4012006003001503, "percentage": 80.32, "elapsed_time": "0:45:28", "remaining_time": "0:11:08", "throughput": 624.69, "total_tokens": 1704640} {"current_steps": 605, "total_steps": 747, "loss": 0.7743, "learning_rate": 4.327123372778122e-06, "epoch": 2.4212106053026514, "percentage": 80.99, "elapsed_time": "0:45:51", "remaining_time": "0:10:45", "throughput": 624.38, "total_tokens": 1717808} {"current_steps": 610, "total_steps": 747, "loss": 0.6191, "learning_rate": 4.036099440919763e-06, "epoch": 2.4412206103051526, "percentage": 81.66, "elapsed_time": "0:46:11", "remaining_time": "0:10:22", "throughput": 624.36, "total_tokens": 1730688} {"current_steps": 615, "total_steps": 747, "loss": 0.8898, "learning_rate": 3.754344973408064e-06, "epoch": 2.4612306153076537, "percentage": 82.33, "elapsed_time": "0:46:35", "remaining_time": "0:09:59", "throughput": 624.41, "total_tokens": 1745472} {"current_steps": 620, "total_steps": 747, "loss": 0.9432, "learning_rate": 3.481984551686429e-06, "epoch": 2.481240620310155, "percentage": 83.0, "elapsed_time": "0:46:59", "remaining_time": "0:09:37", "throughput": 624.53, "total_tokens": 1761008} {"current_steps": 625, "total_steps": 747, "loss": 0.8175, "learning_rate": 3.2191386034973627e-06, "epoch": 2.5012506253126565, "percentage": 83.67, "elapsed_time": "0:47:21", "remaining_time": "0:09:14", "throughput": 624.54, "total_tokens": 1774704} {"current_steps": 630, "total_steps": 747, "loss": 0.793, "learning_rate": 2.9659233496337786e-06, "epoch": 2.5212606303151577, "percentage": 84.34, "elapsed_time": "0:47:44", "remaining_time": "0:08:51", "throughput": 624.54, "total_tokens": 1788768} {"current_steps": 635, "total_steps": 747, "loss": 0.8368, "learning_rate": 2.722450752550429e-06, "epoch": 2.541270635317659, "percentage": 85.01, "elapsed_time": "0:48:03", "remaining_time": "0:08:28", "throughput": 624.24, "total_tokens": 1799968} {"current_steps": 640, "total_steps": 747, "loss": 0.8236, "learning_rate": 2.4888284668582285e-06, "epoch": 2.56128064032016, "percentage": 85.68, "elapsed_time": "0:48:27", "remaining_time": "0:08:06", "throughput": 624.36, "total_tokens": 1815008} {"current_steps": 645, "total_steps": 747, "loss": 0.7644, "learning_rate": 2.265159791723373e-06, "epoch": 2.581290645322661, "percentage": 86.35, "elapsed_time": "0:48:51", "remaining_time": "0:07:43", "throughput": 624.45, "total_tokens": 1830400} {"current_steps": 650, "total_steps": 747, "loss": 0.7604, "learning_rate": 2.051543625192226e-06, "epoch": 2.6013006503251628, "percentage": 87.01, "elapsed_time": "0:49:13", "remaining_time": "0:07:20", "throughput": 624.43, "total_tokens": 1844256} {"current_steps": 655, "total_steps": 747, "loss": 0.8209, "learning_rate": 1.8480744204622757e-06, "epoch": 2.621310655327664, "percentage": 87.68, "elapsed_time": "0:49:36", "remaining_time": "0:06:58", "throughput": 624.49, "total_tokens": 1859024} {"current_steps": 660, "total_steps": 747, "loss": 0.8396, "learning_rate": 1.6548421441183875e-06, "epoch": 2.641320660330165, "percentage": 88.35, "elapsed_time": "0:50:01", "remaining_time": "0:06:35", "throughput": 624.65, "total_tokens": 1874624} {"current_steps": 665, "total_steps": 747, "loss": 0.7678, "learning_rate": 1.4719322363529242e-06, "epoch": 2.6613306653326663, "percentage": 89.02, "elapsed_time": "0:50:22", "remaining_time": "0:06:12", "throughput": 624.69, "total_tokens": 1888064} {"current_steps": 670, "total_steps": 747, "loss": 0.8765, "learning_rate": 1.2994255731871963e-06, "epoch": 2.6813406703351674, "percentage": 89.69, "elapsed_time": "0:50:45", "remaining_time": "0:05:50", "throughput": 624.76, "total_tokens": 1902976} {"current_steps": 675, "total_steps": 747, "loss": 0.8124, "learning_rate": 1.137398430711123e-06, "epoch": 2.701350675337669, "percentage": 90.36, "elapsed_time": "0:51:07", "remaining_time": "0:05:27", "throughput": 624.77, "total_tokens": 1916416} {"current_steps": 680, "total_steps": 747, "loss": 0.8009, "learning_rate": 9.85922451356694e-07, "epoch": 2.72136068034017, "percentage": 91.03, "elapsed_time": "0:51:30", "remaining_time": "0:05:04", "throughput": 624.91, "total_tokens": 1931536} {"current_steps": 685, "total_steps": 747, "loss": 0.8841, "learning_rate": 8.450646122203865e-07, "epoch": 2.7413706853426714, "percentage": 91.7, "elapsed_time": "0:51:55", "remaining_time": "0:04:41", "throughput": 625.0, "total_tokens": 1947072} {"current_steps": 690, "total_steps": 747, "loss": 0.7737, "learning_rate": 7.148871954483105e-07, "epoch": 2.7613806903451725, "percentage": 92.37, "elapsed_time": "0:52:17", "remaining_time": "0:04:19", "throughput": 624.91, "total_tokens": 1960624} {"current_steps": 695, "total_steps": 747, "loss": 0.7897, "learning_rate": 5.954477606973679e-07, "epoch": 2.7813906953476737, "percentage": 93.04, "elapsed_time": "0:52:40", "remaining_time": "0:03:56", "throughput": 625.01, "total_tokens": 1975232} {"current_steps": 700, "total_steps": 747, "loss": 0.7096, "learning_rate": 4.867991196844918e-07, "epoch": 2.8014007003501753, "percentage": 93.71, "elapsed_time": "0:53:03", "remaining_time": "0:03:33", "throughput": 625.0, "total_tokens": 1989760} {"current_steps": 705, "total_steps": 747, "loss": 0.8227, "learning_rate": 3.8898931283523344e-07, "epoch": 2.8214107053526765, "percentage": 94.38, "elapsed_time": "0:53:30", "remaining_time": "0:03:11", "throughput": 624.97, "total_tokens": 2006720} {"current_steps": 710, "total_steps": 747, "loss": 0.7987, "learning_rate": 3.020615880420713e-07, "epoch": 2.8414207103551776, "percentage": 95.05, "elapsed_time": "0:53:54", "remaining_time": "0:02:48", "throughput": 624.97, "total_tokens": 2021664} {"current_steps": 715, "total_steps": 747, "loss": 0.7853, "learning_rate": 2.2605438154179038e-07, "epoch": 2.861430715357679, "percentage": 95.72, "elapsed_time": "0:54:19", "remaining_time": "0:02:25", "throughput": 625.14, "total_tokens": 2037536} {"current_steps": 720, "total_steps": 747, "loss": 0.7808, "learning_rate": 1.6100130092037703e-07, "epoch": 2.88144072036018, "percentage": 96.39, "elapsed_time": "0:54:40", "remaining_time": "0:02:03", "throughput": 625.09, "total_tokens": 2050432} {"current_steps": 725, "total_steps": 747, "loss": 0.7777, "learning_rate": 1.0693111025300017e-07, "epoch": 2.9014507253626816, "percentage": 97.05, "elapsed_time": "0:55:02", "remaining_time": "0:01:40", "throughput": 625.05, "total_tokens": 2064080} {"current_steps": 730, "total_steps": 747, "loss": 0.8181, "learning_rate": 6.386771738558506e-08, "epoch": 2.9214607303651827, "percentage": 97.72, "elapsed_time": "0:55:26", "remaining_time": "0:01:17", "throughput": 625.19, "total_tokens": 2079760} {"current_steps": 735, "total_steps": 747, "loss": 0.7858, "learning_rate": 3.1830163363655296e-08, "epoch": 2.941470735367684, "percentage": 98.39, "elapsed_time": "0:55:49", "remaining_time": "0:00:54", "throughput": 625.24, "total_tokens": 2094000} {"current_steps": 740, "total_steps": 747, "loss": 0.9016, "learning_rate": 1.0832614013073228e-08, "epoch": 2.961480740370185, "percentage": 99.06, "elapsed_time": "0:56:12", "remaining_time": "0:00:31", "throughput": 625.23, "total_tokens": 2108592} {"current_steps": 745, "total_steps": 747, "loss": 0.7275, "learning_rate": 8.843536764419069e-10, "epoch": 2.981490745372686, "percentage": 99.73, "elapsed_time": "0:56:34", "remaining_time": "0:00:09", "throughput": 625.07, "total_tokens": 2121680} {"current_steps": 747, "total_steps": 747, "epoch": 2.989494747373687, "percentage": 100.0, "elapsed_time": "0:56:45", "remaining_time": "0:00:00", "throughput": 624.84, "total_tokens": 2127792}