{"current_steps": 10, "total_steps": 1000, "loss": 7.3908, "accuracy": 0.550000011920929, "learning_rate": 4.998766400914329e-06, "epoch": 0.007248346470961312, "percentage": 1.0, "elapsed_time": "0:01:19", "remaining_time": "2:10:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 1000, "loss": 7.3753, "accuracy": 0.574999988079071, "learning_rate": 4.9950668210706795e-06, "epoch": 0.014496692941922623, "percentage": 2.0, "elapsed_time": "0:02:33", "remaining_time": "2:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 1000, "loss": 7.4516, "accuracy": 0.4375, "learning_rate": 4.9889049115077e-06, "epoch": 0.021745039412883936, "percentage": 3.0, "elapsed_time": "0:03:46", "remaining_time": "2:01:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 1000, "loss": 7.3888, "accuracy": 0.6499999761581421, "learning_rate": 4.980286753286196e-06, "epoch": 0.028993385883845247, "percentage": 4.0, "elapsed_time": "0:05:00", "remaining_time": "2:00:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 1000, "loss": 7.518, "accuracy": 0.512499988079071, "learning_rate": 4.9692208514878445e-06, "epoch": 0.03624173235480656, "percentage": 5.0, "elapsed_time": "0:06:16", "remaining_time": "1:59:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 1000, "eval_loss": 0.9120966196060181, "epoch": 0.03624173235480656, "percentage": 5.0, "elapsed_time": "0:06:46", "remaining_time": "2:08:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 1000, "loss": 7.3929, "accuracy": 0.5625, "learning_rate": 4.9557181268217225e-06, "epoch": 0.04349007882576787, "percentage": 6.0, "elapsed_time": "0:08:15", "remaining_time": "2:09:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 1000, "loss": 7.1863, "accuracy": 0.6000000238418579, "learning_rate": 4.939791904846869e-06, "epoch": 0.05073842529672919, "percentage": 7.0, "elapsed_time": "0:09:28", "remaining_time": "2:05:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 1000, "loss": 7.3662, "accuracy": 0.5874999761581421, "learning_rate": 4.921457902821578e-06, "epoch": 0.057986771767690494, "percentage": 8.0, "elapsed_time": "0:10:43", "remaining_time": "2:03:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 1000, "loss": 7.268, "accuracy": 0.6000000238418579, "learning_rate": 4.900734214192358e-06, "epoch": 0.0652351182386518, "percentage": 9.0, "elapsed_time": "0:11:56", "remaining_time": "2:00:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 1000, "loss": 7.2544, "accuracy": 0.5874999761581421, "learning_rate": 4.8776412907378845e-06, "epoch": 0.07248346470961312, "percentage": 10.0, "elapsed_time": "0:13:09", "remaining_time": "1:58:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 1000, "eval_loss": 0.8920583724975586, "epoch": 0.07248346470961312, "percentage": 10.0, "elapsed_time": "0:13:39", "remaining_time": "2:02:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 1000, "loss": 7.1762, "accuracy": 0.550000011920929, "learning_rate": 4.852201922385564e-06, "epoch": 0.07973181118057443, "percentage": 11.0, "elapsed_time": "0:15:07", "remaining_time": "2:02:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 1000, "loss": 7.1442, "accuracy": 0.625, "learning_rate": 4.824441214720629e-06, "epoch": 0.08698015765153574, "percentage": 12.0, "elapsed_time": "0:16:20", "remaining_time": "1:59:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 1000, "loss": 7.1449, "accuracy": 0.612500011920929, "learning_rate": 4.794386564209953e-06, "epoch": 0.09422850412249706, "percentage": 13.0, "elapsed_time": "0:17:32", "remaining_time": "1:57:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 1000, "loss": 7.122, "accuracy": 0.625, "learning_rate": 4.762067631165049e-06, "epoch": 0.10147685059345837, "percentage": 14.0, "elapsed_time": "0:18:47", "remaining_time": "1:55:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 1000, "loss": 7.1253, "accuracy": 0.6625000238418579, "learning_rate": 4.72751631047092e-06, "epoch": 0.10872519706441967, "percentage": 15.0, "elapsed_time": "0:19:59", "remaining_time": "1:53:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 1000, "eval_loss": 0.8764163851737976, "epoch": 0.10872519706441967, "percentage": 15.0, "elapsed_time": "0:20:29", "remaining_time": "1:56:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 1000, "loss": 7.0307, "accuracy": 0.5375000238418579, "learning_rate": 4.690766700109659e-06, "epoch": 0.11597354353538099, "percentage": 16.0, "elapsed_time": "0:21:56", "remaining_time": "1:55:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 1000, "loss": 7.1652, "accuracy": 0.637499988079071, "learning_rate": 4.65185506750986e-06, "epoch": 0.1232218900063423, "percentage": 17.0, "elapsed_time": "0:23:06", "remaining_time": "1:52:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 1000, "loss": 7.0022, "accuracy": 0.625, "learning_rate": 4.610819813755038e-06, "epoch": 0.1304702364773036, "percentage": 18.0, "elapsed_time": "0:24:21", "remaining_time": "1:50:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 1000, "loss": 7.004, "accuracy": 0.5874999761581421, "learning_rate": 4.567701435686405e-06, "epoch": 0.13771858294826492, "percentage": 19.0, "elapsed_time": "0:25:35", "remaining_time": "1:49:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 1000, "loss": 7.0539, "accuracy": 0.6499999761581421, "learning_rate": 4.522542485937369e-06, "epoch": 0.14496692941922623, "percentage": 20.0, "elapsed_time": "0:26:48", "remaining_time": "1:47:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 1000, "eval_loss": 0.8565592169761658, "epoch": 0.14496692941922623, "percentage": 20.0, "elapsed_time": "0:27:19", "remaining_time": "1:49:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 1000, "loss": 6.9013, "accuracy": 0.5874999761581421, "learning_rate": 4.475387530939226e-06, "epoch": 0.15221527589018755, "percentage": 21.0, "elapsed_time": "0:28:46", "remaining_time": "1:48:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 1000, "loss": 6.9366, "accuracy": 0.699999988079071, "learning_rate": 4.426283106939474e-06, "epoch": 0.15946362236114886, "percentage": 22.0, "elapsed_time": "0:29:59", "remaining_time": "1:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 1000, "loss": 6.8823, "accuracy": 0.699999988079071, "learning_rate": 4.3752776740761495e-06, "epoch": 0.16671196883211017, "percentage": 23.0, "elapsed_time": "0:31:13", "remaining_time": "1:44:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 1000, "loss": 6.7139, "accuracy": 0.6625000238418579, "learning_rate": 4.322421568553529e-06, "epoch": 0.1739603153030715, "percentage": 24.0, "elapsed_time": "0:32:29", "remaining_time": "1:42:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 1000, "loss": 6.7737, "accuracy": 0.550000011920929, "learning_rate": 4.267766952966369e-06, "epoch": 0.1812086617740328, "percentage": 25.0, "elapsed_time": "0:33:48", "remaining_time": "1:41:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 1000, "eval_loss": 0.816527247428894, "epoch": 0.1812086617740328, "percentage": 25.0, "elapsed_time": "0:34:18", "remaining_time": "1:42:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 1000, "loss": 6.6574, "accuracy": 0.625, "learning_rate": 4.211367764821722e-06, "epoch": 0.18845700824499412, "percentage": 26.0, "elapsed_time": "0:35:47", "remaining_time": "1:41:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 1000, "loss": 6.6017, "accuracy": 0.5874999761581421, "learning_rate": 4.15327966330913e-06, "epoch": 0.19570535471595543, "percentage": 27.0, "elapsed_time": "0:37:03", "remaining_time": "1:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 1000, "loss": 6.3849, "accuracy": 0.550000011920929, "learning_rate": 4.093559974371725e-06, "epoch": 0.20295370118691675, "percentage": 28.0, "elapsed_time": "0:38:19", "remaining_time": "1:38:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 1000, "loss": 6.0103, "accuracy": 0.7124999761581421, "learning_rate": 4.032267634132442e-06, "epoch": 0.21020204765787803, "percentage": 29.0, "elapsed_time": "0:39:32", "remaining_time": "1:36:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 1000, "loss": 5.9678, "accuracy": 0.6875, "learning_rate": 3.969463130731183e-06, "epoch": 0.21745039412883935, "percentage": 30.0, "elapsed_time": "0:40:44", "remaining_time": "1:35:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 1000, "eval_loss": 0.7266466617584229, "epoch": 0.21745039412883935, "percentage": 30.0, "elapsed_time": "0:41:14", "remaining_time": "1:36:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 1000, "loss": 5.5511, "accuracy": 0.637499988079071, "learning_rate": 3.905208444630326e-06, "epoch": 0.22469874059980066, "percentage": 31.0, "elapsed_time": "0:42:41", "remaining_time": "1:35:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 1000, "loss": 5.5495, "accuracy": 0.6625000238418579, "learning_rate": 3.839566987447492e-06, "epoch": 0.23194708707076198, "percentage": 32.0, "elapsed_time": "0:43:51", "remaining_time": "1:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 330, "total_steps": 1000, "loss": 5.526, "accuracy": 0.6875, "learning_rate": 3.772603539375929e-06, "epoch": 0.2391954335417233, "percentage": 33.0, "elapsed_time": "0:45:03", "remaining_time": "1:31:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 340, "total_steps": 1000, "loss": 5.0865, "accuracy": 0.612500011920929, "learning_rate": 3.7043841852542884e-06, "epoch": 0.2464437800126846, "percentage": 34.0, "elapsed_time": "0:46:16", "remaining_time": "1:29:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 1000, "loss": 5.0036, "accuracy": 0.6499999761581421, "learning_rate": 3.634976249348867e-06, "epoch": 0.2536921264836459, "percentage": 35.0, "elapsed_time": "0:47:29", "remaining_time": "1:28:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 1000, "eval_loss": 0.6240565776824951, "epoch": 0.2536921264836459, "percentage": 35.0, "elapsed_time": "0:48:00", "remaining_time": "1:29:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 360, "total_steps": 1000, "loss": 5.2602, "accuracy": 0.637499988079071, "learning_rate": 3.564448228912682e-06, "epoch": 0.2609404729546072, "percentage": 36.0, "elapsed_time": "0:49:25", "remaining_time": "1:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 370, "total_steps": 1000, "loss": 4.9912, "accuracy": 0.6625000238418579, "learning_rate": 3.4928697265869516e-06, "epoch": 0.26818881942556855, "percentage": 37.0, "elapsed_time": "0:50:38", "remaining_time": "1:26:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 380, "total_steps": 1000, "loss": 4.7972, "accuracy": 0.625, "learning_rate": 3.4203113817116955e-06, "epoch": 0.27543716589652983, "percentage": 38.0, "elapsed_time": "0:51:52", "remaining_time": "1:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 390, "total_steps": 1000, "loss": 4.7275, "accuracy": 0.7749999761581421, "learning_rate": 3.346844800613229e-06, "epoch": 0.2826855123674912, "percentage": 39.0, "elapsed_time": "0:53:10", "remaining_time": "1:23:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 400, "total_steps": 1000, "loss": 4.5874, "accuracy": 0.6625000238418579, "learning_rate": 3.272542485937369e-06, "epoch": 0.28993385883845246, "percentage": 40.0, "elapsed_time": "0:54:25", "remaining_time": "1:21:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 400, "total_steps": 1000, "eval_loss": 0.5390450358390808, "epoch": 0.28993385883845246, "percentage": 40.0, "elapsed_time": "0:54:55", "remaining_time": "1:22:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 410, "total_steps": 1000, "loss": 4.3201, "accuracy": 0.6875, "learning_rate": 3.1974777650980737e-06, "epoch": 0.2971822053094138, "percentage": 41.0, "elapsed_time": "0:56:24", "remaining_time": "1:21:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 420, "total_steps": 1000, "loss": 4.1763, "accuracy": 0.7250000238418579, "learning_rate": 3.121724717912138e-06, "epoch": 0.3044305517803751, "percentage": 42.0, "elapsed_time": "0:57:40", "remaining_time": "1:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 430, "total_steps": 1000, "loss": 4.1528, "accuracy": 0.6875, "learning_rate": 3.045358103491357e-06, "epoch": 0.31167889825133643, "percentage": 43.0, "elapsed_time": "0:58:54", "remaining_time": "1:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 440, "total_steps": 1000, "loss": 3.7696, "accuracy": 0.762499988079071, "learning_rate": 2.9684532864643123e-06, "epoch": 0.3189272447222977, "percentage": 44.0, "elapsed_time": "1:00:10", "remaining_time": "1:16:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 450, "total_steps": 1000, "loss": 4.3625, "accuracy": 0.7749999761581421, "learning_rate": 2.8910861626005774e-06, "epoch": 0.32617559119325906, "percentage": 45.0, "elapsed_time": "1:01:24", "remaining_time": "1:15:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 450, "total_steps": 1000, "eval_loss": 0.49255281686782837, "epoch": 0.32617559119325906, "percentage": 45.0, "elapsed_time": "1:01:55", "remaining_time": "1:15:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 460, "total_steps": 1000, "loss": 3.9344, "accuracy": 0.675000011920929, "learning_rate": 2.813333083910761e-06, "epoch": 0.33342393766422035, "percentage": 46.0, "elapsed_time": "1:03:23", "remaining_time": "1:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 470, "total_steps": 1000, "loss": 3.8492, "accuracy": 0.7124999761581421, "learning_rate": 2.7352707832962865e-06, "epoch": 0.34067228413518164, "percentage": 47.0, "elapsed_time": "1:04:37", "remaining_time": "1:12:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 480, "total_steps": 1000, "loss": 3.5822, "accuracy": 0.8500000238418579, "learning_rate": 2.6569762988232838e-06, "epoch": 0.347920630606143, "percentage": 48.0, "elapsed_time": "1:05:55", "remaining_time": "1:11:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 490, "total_steps": 1000, "loss": 3.8437, "accuracy": 0.7124999761581421, "learning_rate": 2.578526897695321e-06, "epoch": 0.35516897707710426, "percentage": 49.0, "elapsed_time": "1:07:08", "remaining_time": "1:09:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 1000, "loss": 3.8597, "accuracy": 0.7749999761581421, "learning_rate": 2.5e-06, "epoch": 0.3624173235480656, "percentage": 50.0, "elapsed_time": "1:08:23", "remaining_time": "1:08:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 1000, "eval_loss": 0.45747870206832886, "epoch": 0.3624173235480656, "percentage": 50.0, "elapsed_time": "1:08:53", "remaining_time": "1:08:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 510, "total_steps": 1000, "loss": 3.6558, "accuracy": 0.75, "learning_rate": 2.4214731023046795e-06, "epoch": 0.3696656700190269, "percentage": 51.0, "elapsed_time": "1:10:17", "remaining_time": "1:07:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 520, "total_steps": 1000, "loss": 3.8086, "accuracy": 0.762499988079071, "learning_rate": 2.3430237011767166e-06, "epoch": 0.37691401648998824, "percentage": 52.0, "elapsed_time": "1:11:27", "remaining_time": "1:05:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 530, "total_steps": 1000, "loss": 3.3647, "accuracy": 0.887499988079071, "learning_rate": 2.2647292167037143e-06, "epoch": 0.3841623629609495, "percentage": 53.0, "elapsed_time": "1:12:44", "remaining_time": "1:04:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 540, "total_steps": 1000, "loss": 3.6972, "accuracy": 0.8374999761581421, "learning_rate": 2.186666916089239e-06, "epoch": 0.39141070943191086, "percentage": 54.0, "elapsed_time": "1:13:56", "remaining_time": "1:02:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 550, "total_steps": 1000, "loss": 3.6202, "accuracy": 0.762499988079071, "learning_rate": 2.1089138373994226e-06, "epoch": 0.39865905590287215, "percentage": 55.0, "elapsed_time": "1:15:07", "remaining_time": "1:01:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 550, "total_steps": 1000, "eval_loss": 0.43277421593666077, "epoch": 0.39865905590287215, "percentage": 55.0, "elapsed_time": "1:15:37", "remaining_time": "1:01:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 560, "total_steps": 1000, "loss": 3.2952, "accuracy": 0.8500000238418579, "learning_rate": 2.031546713535688e-06, "epoch": 0.4059074023738335, "percentage": 56.0, "elapsed_time": "1:17:05", "remaining_time": "1:00:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 570, "total_steps": 1000, "loss": 3.3085, "accuracy": 0.8125, "learning_rate": 1.9546418965086444e-06, "epoch": 0.4131557488447948, "percentage": 57.0, "elapsed_time": "1:18:16", "remaining_time": "0:59:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 580, "total_steps": 1000, "loss": 3.2304, "accuracy": 0.7749999761581421, "learning_rate": 1.8782752820878636e-06, "epoch": 0.42040409531575607, "percentage": 58.0, "elapsed_time": "1:19:29", "remaining_time": "0:57:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 590, "total_steps": 1000, "loss": 3.2736, "accuracy": 0.7875000238418579, "learning_rate": 1.8025222349019273e-06, "epoch": 0.4276524417867174, "percentage": 59.0, "elapsed_time": "1:20:45", "remaining_time": "0:56:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 600, "total_steps": 1000, "loss": 3.343, "accuracy": 0.875, "learning_rate": 1.7274575140626318e-06, "epoch": 0.4349007882576787, "percentage": 60.0, "elapsed_time": "1:21:59", "remaining_time": "0:54:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 600, "total_steps": 1000, "eval_loss": 0.3846723139286041, "epoch": 0.4349007882576787, "percentage": 60.0, "elapsed_time": "1:22:29", "remaining_time": "0:54:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 610, "total_steps": 1000, "loss": 3.0472, "accuracy": 0.7875000238418579, "learning_rate": 1.6531551993867717e-06, "epoch": 0.44214913472864004, "percentage": 61.0, "elapsed_time": "1:23:56", "remaining_time": "0:53:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 620, "total_steps": 1000, "loss": 3.1013, "accuracy": 0.9125000238418579, "learning_rate": 1.5796886182883053e-06, "epoch": 0.4493974811996013, "percentage": 62.0, "elapsed_time": "1:25:10", "remaining_time": "0:52:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 630, "total_steps": 1000, "loss": 2.7849, "accuracy": 0.824999988079071, "learning_rate": 1.5071302734130488e-06, "epoch": 0.45664582767056267, "percentage": 63.0, "elapsed_time": "1:26:29", "remaining_time": "0:50:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 640, "total_steps": 1000, "loss": 2.6839, "accuracy": 0.887499988079071, "learning_rate": 1.4355517710873184e-06, "epoch": 0.46389417414152395, "percentage": 64.0, "elapsed_time": "1:27:44", "remaining_time": "0:49:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 650, "total_steps": 1000, "loss": 2.884, "accuracy": 0.8999999761581421, "learning_rate": 1.3650237506511333e-06, "epoch": 0.4711425206124853, "percentage": 65.0, "elapsed_time": "1:28:58", "remaining_time": "0:47:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 650, "total_steps": 1000, "eval_loss": 0.35537806153297424, "epoch": 0.4711425206124853, "percentage": 65.0, "elapsed_time": "1:29:29", "remaining_time": "0:48:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 660, "total_steps": 1000, "loss": 2.7163, "accuracy": 0.8999999761581421, "learning_rate": 1.2956158147457116e-06, "epoch": 0.4783908670834466, "percentage": 66.0, "elapsed_time": "1:30:55", "remaining_time": "0:46:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 670, "total_steps": 1000, "loss": 2.9501, "accuracy": 0.887499988079071, "learning_rate": 1.2273964606240718e-06, "epoch": 0.4856392135544079, "percentage": 67.0, "elapsed_time": "1:32:09", "remaining_time": "0:45:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 680, "total_steps": 1000, "loss": 2.777, "accuracy": 0.925000011920929, "learning_rate": 1.160433012552508e-06, "epoch": 0.4928875600253692, "percentage": 68.0, "elapsed_time": "1:33:22", "remaining_time": "0:43:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 690, "total_steps": 1000, "loss": 2.673, "accuracy": 0.9125000238418579, "learning_rate": 1.0947915553696742e-06, "epoch": 0.5001359064963306, "percentage": 69.0, "elapsed_time": "1:34:38", "remaining_time": "0:42:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 700, "total_steps": 1000, "loss": 2.6632, "accuracy": 0.925000011920929, "learning_rate": 1.0305368692688175e-06, "epoch": 0.5073842529672918, "percentage": 70.0, "elapsed_time": "1:35:49", "remaining_time": "0:41:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 700, "total_steps": 1000, "eval_loss": 0.32792916893959045, "epoch": 0.5073842529672918, "percentage": 70.0, "elapsed_time": "1:36:20", "remaining_time": "0:41:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 710, "total_steps": 1000, "loss": 2.6968, "accuracy": 0.887499988079071, "learning_rate": 9.677323658675594e-07, "epoch": 0.5146325994382531, "percentage": 71.0, "elapsed_time": "1:37:45", "remaining_time": "0:39:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 720, "total_steps": 1000, "loss": 2.6929, "accuracy": 0.9125000238418579, "learning_rate": 9.064400256282757e-07, "epoch": 0.5218809459092144, "percentage": 72.0, "elapsed_time": "1:39:05", "remaining_time": "0:38:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 730, "total_steps": 1000, "loss": 2.6089, "accuracy": 0.887499988079071, "learning_rate": 8.467203366908708e-07, "epoch": 0.5291292923801758, "percentage": 73.0, "elapsed_time": "1:40:20", "remaining_time": "0:37:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 740, "total_steps": 1000, "loss": 2.3252, "accuracy": 0.9375, "learning_rate": 7.886322351782782e-07, "epoch": 0.5363776388511371, "percentage": 74.0, "elapsed_time": "1:41:34", "remaining_time": "0:35:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 750, "total_steps": 1000, "loss": 2.4229, "accuracy": 0.9624999761581421, "learning_rate": 7.322330470336314e-07, "epoch": 0.5436259853220984, "percentage": 75.0, "elapsed_time": "1:42:52", "remaining_time": "0:34:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 750, "total_steps": 1000, "eval_loss": 0.30500930547714233, "epoch": 0.5436259853220984, "percentage": 75.0, "elapsed_time": "1:43:23", "remaining_time": "0:34:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 760, "total_steps": 1000, "loss": 2.2663, "accuracy": 0.8999999761581421, "learning_rate": 6.775784314464717e-07, "epoch": 0.5508743317930597, "percentage": 76.0, "elapsed_time": "1:44:48", "remaining_time": "0:33:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 770, "total_steps": 1000, "loss": 2.5056, "accuracy": 0.8999999761581421, "learning_rate": 6.247223259238511e-07, "epoch": 0.5581226782640211, "percentage": 77.0, "elapsed_time": "1:46:06", "remaining_time": "0:31:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 780, "total_steps": 1000, "loss": 2.2382, "accuracy": 0.949999988079071, "learning_rate": 5.737168930605272e-07, "epoch": 0.5653710247349824, "percentage": 78.0, "elapsed_time": "1:47:19", "remaining_time": "0:30:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 790, "total_steps": 1000, "loss": 2.2271, "accuracy": 0.8999999761581421, "learning_rate": 5.24612469060774e-07, "epoch": 0.5726193712059436, "percentage": 79.0, "elapsed_time": "1:48:35", "remaining_time": "0:28:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 800, "total_steps": 1000, "loss": 2.2777, "accuracy": 0.9125000238418579, "learning_rate": 4.774575140626317e-07, "epoch": 0.5798677176769049, "percentage": 80.0, "elapsed_time": "1:49:47", "remaining_time": "0:27:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 800, "total_steps": 1000, "eval_loss": 0.2918218672275543, "epoch": 0.5798677176769049, "percentage": 80.0, "elapsed_time": "1:50:17", "remaining_time": "0:27:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 810, "total_steps": 1000, "loss": 2.5536, "accuracy": 0.925000011920929, "learning_rate": 4.3229856431359516e-07, "epoch": 0.5871160641478663, "percentage": 81.0, "elapsed_time": "1:51:43", "remaining_time": "0:26:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 820, "total_steps": 1000, "loss": 2.279, "accuracy": 0.8999999761581421, "learning_rate": 3.891801862449629e-07, "epoch": 0.5943644106188276, "percentage": 82.0, "elapsed_time": "1:52:57", "remaining_time": "0:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 830, "total_steps": 1000, "loss": 2.1291, "accuracy": 0.9125000238418579, "learning_rate": 3.481449324901412e-07, "epoch": 0.6016127570897889, "percentage": 83.0, "elapsed_time": "1:54:13", "remaining_time": "0:23:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 840, "total_steps": 1000, "loss": 2.2548, "accuracy": 0.949999988079071, "learning_rate": 3.092332998903416e-07, "epoch": 0.6088611035607502, "percentage": 84.0, "elapsed_time": "1:55:26", "remaining_time": "0:21:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 850, "total_steps": 1000, "loss": 2.2852, "accuracy": 0.887499988079071, "learning_rate": 2.7248368952908055e-07, "epoch": 0.6161094500317115, "percentage": 85.0, "elapsed_time": "1:56:40", "remaining_time": "0:20:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 850, "total_steps": 1000, "eval_loss": 0.2818227708339691, "epoch": 0.6161094500317115, "percentage": 85.0, "elapsed_time": "1:57:10", "remaining_time": "0:20:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 860, "total_steps": 1000, "loss": 2.2219, "accuracy": 0.9375, "learning_rate": 2.3793236883495164e-07, "epoch": 0.6233577965026729, "percentage": 86.0, "elapsed_time": "1:58:36", "remaining_time": "0:19:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 870, "total_steps": 1000, "loss": 2.0656, "accuracy": 0.9375, "learning_rate": 2.0561343579004716e-07, "epoch": 0.6306061429736342, "percentage": 87.0, "elapsed_time": "1:59:54", "remaining_time": "0:17:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 880, "total_steps": 1000, "loss": 2.2936, "accuracy": 0.9750000238418579, "learning_rate": 1.7555878527937164e-07, "epoch": 0.6378544894445954, "percentage": 88.0, "elapsed_time": "2:01:05", "remaining_time": "0:16:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 890, "total_steps": 1000, "loss": 2.1442, "accuracy": 0.9624999761581421, "learning_rate": 1.4779807761443638e-07, "epoch": 0.6451028359155567, "percentage": 89.0, "elapsed_time": "2:02:23", "remaining_time": "0:15:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 900, "total_steps": 1000, "loss": 2.6127, "accuracy": 0.9624999761581421, "learning_rate": 1.223587092621162e-07, "epoch": 0.6523511823865181, "percentage": 90.0, "elapsed_time": "2:03:41", "remaining_time": "0:13:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 900, "total_steps": 1000, "eval_loss": 0.27813127636909485, "epoch": 0.6523511823865181, "percentage": 90.0, "elapsed_time": "2:04:11", "remaining_time": "0:13:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 910, "total_steps": 1000, "loss": 2.1376, "accuracy": 0.9375, "learning_rate": 9.926578580764234e-08, "epoch": 0.6595995288574794, "percentage": 91.0, "elapsed_time": "2:05:39", "remaining_time": "0:12:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 920, "total_steps": 1000, "loss": 2.1545, "accuracy": 0.9375, "learning_rate": 7.854209717842231e-08, "epoch": 0.6668478753284407, "percentage": 92.0, "elapsed_time": "2:06:52", "remaining_time": "0:11:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 930, "total_steps": 1000, "loss": 1.8919, "accuracy": 0.925000011920929, "learning_rate": 6.020809515313141e-08, "epoch": 0.674096221799402, "percentage": 93.0, "elapsed_time": "2:08:06", "remaining_time": "0:09:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 940, "total_steps": 1000, "loss": 2.3143, "accuracy": 0.8999999761581421, "learning_rate": 4.428187317827848e-08, "epoch": 0.6813445682703633, "percentage": 94.0, "elapsed_time": "2:09:16", "remaining_time": "0:08:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 950, "total_steps": 1000, "loss": 2.0087, "accuracy": 0.9375, "learning_rate": 3.077914851215585e-08, "epoch": 0.6885929147413247, "percentage": 95.0, "elapsed_time": "2:10:31", "remaining_time": "0:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 950, "total_steps": 1000, "eval_loss": 0.27470529079437256, "epoch": 0.6885929147413247, "percentage": 95.0, "elapsed_time": "2:11:01", "remaining_time": "0:06:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 960, "total_steps": 1000, "loss": 2.3667, "accuracy": 0.9375, "learning_rate": 1.9713246713805588e-08, "epoch": 0.695841261212286, "percentage": 96.0, "elapsed_time": "2:12:25", "remaining_time": "0:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 970, "total_steps": 1000, "loss": 2.4385, "accuracy": 0.949999988079071, "learning_rate": 1.109508849230001e-08, "epoch": 0.7030896076832472, "percentage": 97.0, "elapsed_time": "2:13:36", "remaining_time": "0:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 980, "total_steps": 1000, "loss": 2.1329, "accuracy": 0.925000011920929, "learning_rate": 4.933178929321103e-09, "epoch": 0.7103379541542085, "percentage": 98.0, "elapsed_time": "2:14:47", "remaining_time": "0:02:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 990, "total_steps": 1000, "loss": 2.0641, "accuracy": 0.9125000238418579, "learning_rate": 1.2335990856710001e-09, "epoch": 0.7175863006251699, "percentage": 99.0, "elapsed_time": "2:16:06", "remaining_time": "0:01:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 1000, "loss": 2.2805, "accuracy": 0.8999999761581421, "learning_rate": 0.0, "epoch": 0.7248346470961312, "percentage": 100.0, "elapsed_time": "2:17:23", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 1000, "eval_loss": 0.27469781041145325, "epoch": 0.7248346470961312, "percentage": 100.0, "elapsed_time": "2:17:54", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 1000, "epoch": 0.7248346470961312, "percentage": 100.0, "elapsed_time": "2:18:05", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}